-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathtermsuite_wrapper2_en.xml
60 lines (54 loc) · 1.98 KB
/
termsuite_wrapper2_en.xml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
<tool id="termsuite" name="Extract terminology" version="0.1.0">
    <!--
        Galaxy tool definition that calls TermSuiteWrapper.sh from the
        visatm/termsuite-wrapper Docker image on a set of text datasets and
        exposes either a TSV term list or a JSON file, depending on the
        output format selected by the user.
    -->
    <requirements>
        <container type="docker">visatm/termsuite-wrapper</container>
    </requirements>
    <description>from a corpus of text files</description>
    <!--
        Command line template (Cheetah).
          -f  path of the generated "file_list" config file (one input path per line)
          -l  language code selected by the user
          -j / -t  destination dataset, chosen from the selected output format
          -x  optional memory limit, passed as "<value>m"
        NOTE(review): "$output" is not declared in the inputs or outputs
        sections of this file; confirm what the script expects for -o and
        bind it to a declared name.
        NOTE(review): "-d /tmp/ts" is a fixed path; presumably a working
        directory. If so, concurrent jobs would share it. Confirm against
        the script.
    -->
    <command><![CDATA[
        TermSuiteWrapper.sh -d /tmp/ts -f '$file_list' -l '$language' -o '$output'
        #if $format == 'json':
            -j '$json_output'
        #elif $format == 'tsv':
            -t '$tsv_output'
        #end if
        #if $memory
            -x ${memory}m
        #end if
    ]]></command>
    <configfiles>
        <!-- The template text below is deliberately not indented: leading
             whitespace would be written into the generated file. -->
        <configfile name="file_list">
#for $i in $inputs
${i.file_name}
#end for
</configfile>
    </configfiles>
    <inputs>
        <param format="txt" name="inputs" type="data" multiple="true" label="Input text files" />
        <param name="language" type="select" display="radio" label="Language of the input corpus">
            <option value="en" selected="true">English</option>
            <option value="fr">French</option>
        </param>
        <param name="format" type="select" display="radio" label="Output format">
            <option value="tsv" selected="true">Extracted term list (TSV)</option>
            <option value="json">TermSuite JSON file</option>
        </param>
        <!-- min="1" enforces the "positive integer" rule stated in the help text. -->
        <param name="memory" type="integer" optional="true" min="1" label="Maximum memory allocation in MB (optional)" />
    </inputs>
    <outputs>
        <!-- Only the dataset matching the selected format is created; the
             command never writes the other one, so it would stay empty. -->
        <data format="json" name="json_output">
            <filter>format == 'json'</filter>
        </data>
        <data format="tabular" name="tsv_output">
            <filter>format == 'tsv'</filter>
        </data>
    </outputs>
    <tests>
        <test>
            <!-- TODO: replace this placeholder with a real test (input text
                 files plus an expected TSV or JSON output). The commented-out
                 lines below appear to be left over from another tool. -->
            <!-- param name="input" value="countWC_input.txt"/>
            <output name="output" file="countWC_output.txt"/ -->
        </test>
    </tests>
    <!-- The help body is reStructuredText: it must stay at column 0, and the
         directive and the hyperlink target each need a blank line around them. -->
    <help><![CDATA[
This tool extracts a list of terms from a corpus of text files using the TermSuite_ software
and produces a putative terminology.

.. class:: warningmark

If you get an “*OutOfMemoryError*” message, you may increase the maximum size of memory allocated to the Java Virtual Machine.
The value expressed in megabytes must be a positive non-null integer.

.. _TermSuite: http://termsuite.github.io/
]]></help>
</tool>