diff g_collocation.xml @ 0:e991d4e60c17 draft

planemo upload commit 0203cb3a0b40d9348674b2b098af805e2986abca-dirty
author stevecassidy
date Wed, 12 Oct 2016 22:17:53 -0400
parents
children
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/g_collocation.xml	Wed Oct 12 22:17:53 2016 -0400
@@ -0,0 +1,38 @@
+<tool id="Collocation" name="Collocation" version="1.0">
+    <description>Generates a list of the most frequent collocations from an input sequence</description>
+    <requirements>
+        <requirement type="package" version="3.2.1">nltk</requirement>
+    </requirements>
+    <!-- Runs g_collocation.py on the selected dataset; dataset paths are single-quoted so the shell passes each as one argument. -->
+    <command interpreter="python">
+        g_collocation.py --input '$input1' --output '$tab_file' --freq_filter $freq_filter --results $results --coll_type $collocation_type --pos $pos
+    </command>
+    <!-- job_name is not passed to the script; it only supplies the history label of the output dataset. -->
+    <inputs>
+        <param name="input1" type="data" format="txt" label="Select a suitable input file from your history"/>
+        <param name="job_name" type="text" size="25"
+               label="Supply a name for the outputs to remind you what they contain" value="Collocation"/>
+        <param name="freq_filter" type="integer" min="0" value="0"
+               label="The minimum number of required occurrences in the corpus"/>
+        <param name="results" type="integer" min="0" value="10"
+               label="The maximum number of collocations to show in the results"/>
+        <param name="collocation_type" type="select" label="Type of collocation to find" display="radio">
+            <option value="bigram">Bigram Collocations</option>
+            <option value="trigram">Trigram Collocations</option>
+        </param>
+        <!-- NOTE(review): no truevalue/falsevalue is set, so $pos should expand to "true"/"false" - confirm g_collocation.py accepts that. -->
+        <param name="pos" type="boolean" label="Data input is a set of POS tags"/>
+    </inputs>
+    <outputs>
+        <data format="tabular" name="tab_file" label="${job_name}"/>
+    </outputs>
+    <options refresh="True"/>
+    <help>
+        <![CDATA[
+
+Input is a text, optionally with POS tags. Output is a list of the top N collocations ordered by frequency.
+
+]]>
+
+    </help>
+</tool>