diff sequence2gspan.xml @ 0:b01beb170290 draft default tip

Uploaded
author bgruening
date Tue, 29 Oct 2013 11:10:19 -0400
parents
children
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/sequence2gspan.xml	Tue Oct 29 11:10:19 2013 -0400
@@ -0,0 +1,167 @@
+<tool id="sequence2gpsan_rnashapes" name="Sequence to gspan" version="0.3">
+    <description>converter using RNAshapes</description>
+    <parallelism method="multi" split_inputs="infile" split_mode="to_size" split_size="10" shared_inputs="" merge_outputs="outfile"></parallelism>
+    <requirements>
+        <requirement type="package" version="2.1.6">rnashapes</requirement>
+    </requirements>
+    <command interpreter="perl">
+
+        fasta2shrep_gspan.pl
+            --fasta $infile
+
+            #if $annotate_infile:
+                -annotate $annotate_infile
+            #end if
+
+            -shift $shift
+            $cue
+            $stack
+            #if $energy_opts.energy_opts_selector == 'energy':
+                -e $energy_opts.e
+            #elif $energy_opts.energy_opts_selector == 'rel_energy':
+                -c $energy_opts.c
+            #end if
+
+            #if $structure_sampling_opts.structure_sampling_opts_selector == 'on':
+                -i $structure_sampling_opts.i
+                -sample_len $structure_sampling_opts.sample_len
+            #end if
+
+            $q
+            -Tp $Tp
+            $seq_graph_win
+            $seq_graph_t
+            $seq_graph_alph
+            $abstr
+            $nostr
+            $vp
+            $ignore_header
+            -M $M
+            $u
+            $r
+
+            -stdout
+
+            > $output
+
+    </command>
+    <inputs>
+        <param name="ifile" type="data" format="fasta" label="Nucleotide Sequence in FASTA format"/>
+
+        <!-- todo repeat tag, normally only 3 windows are specified-->
+        <param name="wins" type="text" value="" label="A list of window sizes to use"
+            help="if none are given, then the entire sequence is taken with no windows. Each window > 1 required! Example: 50,100,200. (-wins)" />
+        <param name="t" type="text" value="3=0" label="The shape type (RNAshapes types from 1-5)"
+            help="With the list format, the shape level can be changed for different window length '4=100' means that shape level 4 is used from length 100nt (window length) The first given length has to be 0! Not continuous given levels are allowed! (-t)" />
+
+
+        <param name="shift" type="integer" value="1" label="The shift of the window, relative to the window size given in percent" 
+            help="Example 20 % of a window 150 would result in a step size of 30 nt. It is a relative parameter, as you can give different window sizes. Default shift of 1 nt. (-shift)">
+            <validator type="in_range" min="0" max="100" />
+        </param>
+        <param name="cue" type="boolean" label="Crop unpaired ends" truevalue="-cue" falsevalue="" checked="false" 
+            help="If you give this flag, then the unpaired ends of each single structure are ignored. E.g. the structure ...(((...))).. becomes just (((...))). (-cue)" />
+
+        <param name="stack" type="boolean" label="Adds stacking information to graphs" truevalue="-stack" falsevalue="" checked="false" 
+            help="This adds an additional vertex (type P) for each pair of stacked base-pairs and four edges (type p) from each of the involved bases to the new vertex. (-stack)" />
+
+        <conditional name="energy_opts">
+            <param name="energy_opts_selector" type="select" label="Energy calculation mode">
+                <option value="rel_energy">Relative energy range, i.e. percentage (%) of MFE energy (RNAshapes)</option>
+                <option value="energy">Energy range in kcal/mol (RNAshapes)</option>
+                <option value="">None</option>
+            </param>
+            <when value="" />
+            <when value="energy">
+                <param name="e" type="float" value="5.0" label="Energy range in kcal/mol (RNAshapes)" help="-e">
+                    <validator type="in_range" min="0.0" />
+                </param>
+            </when>
+            <when value="rel_energy">
+                <param name="c" type="float" value="10" label="Relative energy range, i.e. percentage (%) of MFE energy (RNAshapes)" help="(-c)">
+                    <validator type="in_range" min="0.0" />
+                </param>
+            </when>
+        </conditional>
+        <param name="M" type="integer" value="0" label="Max number of shreps that should be taken per window" help="0 means selects all shreps. (-M)">
+            <validator type="in_range" min="0" />
+        </param>
+        <param name="u" type="boolean" label="Ignore unstable RNAshapes" truevalue="-u" falsevalue="" checked="false" 
+            help="This option filters out closed structures with positive free energy. (-u)" />
+
+        <param name="r" type="boolean" label="Calculate structure probabilities for RNAshapes" help="(-r)" truevalue="-r" falsevalue="" checked="false" />
+
+
+        <conditional name="structure_sampling_opts">
+            <param name="structure_sampling_opts_selector" type="select" label="Structure Sampling">
+                <option value="on">On</option>
+                <option value="off">Off</option>
+            </param>
+            <when value="on">
+                <param name="i" type="integer" value="1" label="Number of sampling iterations" help="(-i)">
+                    <validator type="in_range" min="1" />
+                </param>
+                <param name="smaple_len" type="integer" value="0" label="Sampling is only used for seqs/windows >= given length" help="Default 0 (sample all length). (-sample-len)">
+                    <validator type="in_range" min="0" />
+                </param>
+            </when>
+            <when value="off" />
+        </conditional>
+
+        <param name="q" type="boolean" label="Turn on shape probabilities for RNAshapes, no sampling mode allowed" help="(-q)" truevalue="-q" falsevalue="" checked="false" />
+        <param name="Tp" type="float" value="0.001" label="Filter cutoff for shape probabilities, applied before -M filter!" help="(-Tp)">
+            <validator type="in_range" min="0.0" />
+        </param>
+
+        <param name="seq_graph_win" type="boolean" label="Add for each window a graph which contains no structure" 
+            help="(-seq-graph-win)" 
+            truevalue="-seq-graph-win" falsevalue="" checked="false" />
+        <param name="seq_graph_t" type="boolean" label="add for each 't #' a graph which contains no structure" 
+            help="(-seq-graph-t)" 
+            truevalue="-seq-graph-t" falsevalue="" checked="false" />
+        <param name="seq_graph_alph" type="boolean" label="Change the alphabet of unstructured graphs" 
+            help="(-seq-graph-alph)" 
+            truevalue="-seq-graph-alph" falsevalue="" checked="false" />
+
+        <param format="tabular" name="annotate_infile" type="data" optional="True" label="A file with annotations to be added as abstract graphs" 
+            help="The format is has the following TAB-delimited columns: SEQID, START, END, NAMESPACE#LABEL. Labels with the same name-space and SEQID form connected components, which is a sequence of label vertices ordered by the START position in the sequence."/>
+
+        <param name="abstr" type="boolean" label="Add abstract structure graphs to the single shrep graph instances" 
+            help="(-abstr)" 
+            truevalue="-abstr" falsevalue="" checked="false" />
+        <param name="nostr" type="boolean" label="Calculate no structures, only add sequence information" 
+            help="-seq-graph-win AND/OR -seq-graph-t are required (-nostr)" 
+            truevalue="-nostr" falsevalue="" checked="false" />
+
+        <!--
+            -match-shape    SHAPE
+            all seqs/windows will be constraint folded into that shape via 
+            RNAshapes (if structure is given in another way this struct will be kept), 
+            if this shape is not possible within given energy range, produce a 
+            specific t graph with only one vertex 'X'. By this the instance 
+            becomes very unsimilar to all other graphs (for knn)
+        -->
+        <param name="vp" type="boolean" label="Enable graph computation with viewpoints" 
+            help="svmsgdnspdk will center on those nucleotides that are given via capital letters and ignore those given as lowercase letters (-vp)" 
+            truevalue="-vp" falsevalue="" checked="false" />
+
+        <param name="ignore_header" type="boolean" label="Don't write fasta id part after first space to gspan" help="(-ignore-header)" truevalue="-ignore-header" falsevalue="" checked="false" />
+
+    </inputs>
+    <outputs>
+        <data format="gspan" name="output" label="${tool.name} on ${on_string}" />
+    </outputs>
+    <tests>
+    </tests>
+    <help>
+
+**What it does**
+
+
+
+**References**
+
+Sita et al...
+
+    </help>
+</tool>