comparison qfilt.xml @ 1:2ab93e1952c5 draft default tip

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/qfilt commit c9f251e99e052ab4d87ed5fd89e466cdf387742b-dirty
author veg
date Wed, 18 Apr 2018 16:53:05 -0400
parents
children
comparison
equal deleted inserted replaced
0:5ac0ec2d69b2 1:2ab93e1952c5
1 <?xml version="1.0"?>
2 <tool id="qfilt" version="1.0.0" name="qfilt">
3 <description>filter sequencing data using simple heuristics</description>
4 <requirements>
5 <requirement type="package" version="0.0.1">qfilt</requirement>
6 </requirements>
7 <stdio>
8 <exit_code range="1:"/>
9 </stdio>
10 <command><![CDATA[
11 qfilt -o '$filtered_output'
12 #if str($options.advanced) == 'advanced':
13 -q $options.qscore -l $options.length
14 -s $options.split
15 #if $options.replace and $options.remove:
16 -P $options.replace -R $options.remove
17 #elif $options.mode:
18 -m $options.mode
19 #end if
20 #if $options.prefix:
21 -t $options.mismatch
22 -T $options.prefix
23 #end if
24 -f $options.format
25 $options.tolerate_homopolymeric $options.tolerate_ambiguous
26 #end if
27 -Q '$input_fastq'
28 ]]></command>
29 <inputs>
30
31 <param name="input_fastq" argument="-Q" type="data" format="fastq" label="Input FASTA" help="FASTQ File" />
32
33 <conditional name="options">
34
35 <param name="advanced" type="select" label="Additional options">
36 <option value="defaults">Use defaults</option>
37 <option value="advanced">Specify additional parameters</option>
38 </param>
39
40 <when value="defaults"/>
41
42 <when value="advanced">
43 <param name="qscore" argument="-q" type="integer" value="20" label="QScore" help="minimum per-base quality score below which a read will be split or truncated" />
44 <param name="length" argument="-l" type="integer" value="50" label="Length" help="minimum retained fragment LENGTH" />
45 <param name="mode" argument="-m" type="integer" value="0" label="Mode" help="MODE is a 3-bitmask (an integer in [0-7], default=0)" />
46 <param name="split" argument="-s" type="text" label="Split" help="when encountering a low q-score, split instead of truncate" />
47 <param name="tolerate_homopolymeric" argument="-p" type="boolean" truevalue="-p" falsevalue="" label="Tolerate Homopolymeric" help="tolerate low q-score homopolymeric regions" />
48 <param name="tolerate_ambiguous" argument="-a" type="boolean" truevalue="-a" falsevalue="" label="Tolerate Ambiguous" help="tolerate low q-score ambiguous nucleotides" />
49 <param name="replace" argument="-P" type="text" label="Replace" help="rather than splitting or truncating, replace low quality bases with CHAR this option OVERRIDES all -m mode options" />
50 <param name="remove" argument="-R" type="text" label="Remove" help="rather than splitting or truncating, remove reads which contain more than COUNT low quality bases this option only works in COMBINATION with the -P (punch) option" />
51 <param name="prefix" argument="-T" type="text" label="Prefix" help="if supplied, only reads with this PREFIX are retained, and the PREFIX is stripped from each contributing read" />
52 <param name="mismatch" argument="-t" type="integer" value="0" label="Mismatch" help="if PREFIX is supplied, prefix matching tolerates at most MISMATCH mismatches" />
53 <param name="format" argument="-f" type="select" label="Format" help="output in FASTA or FASTQ format (default=FASTA)" >
54 <option value="FASTA">FASTA</option>
55 <option value="FASTQ">FASTQ</option>
56 </param>
57 </when>
58
59 </conditional>
60
61 </inputs>
62 <outputs>
63 <data format="fasta" name="filtered_output"/>
64 </outputs>
65 <tests>
66 <test>
67 <param name="input_fastq" value="qfilt-in1.fastq" />
68 <output file="qfilt-out1.fa" ftype="fasta" name="filtered_output" />
69 </test>
70 <test>
71 <param name="input_fastq" value="qfilt-in1.fastq" />
72 <param name="advanced" value="advanced" />
73 <param name="tolerate_homopolymeric" value="False" />
74 <output file="qfilt-out2.fa" ftype="fasta" name="filtered_output" />
75 </test>
76 </tests>
77 <help><![CDATA[
78 qfilt
79 =====
80
81 This simple program is meant to filter sequencing data,
82 optionally removing or splitting reads with poor quality scores
83 and to optionally _only_ retain fragments from reads that are tagged with a given 5' sequence.
84
85 ### OUTPUT: ####
86
87 #### stderr: ####
88
89 run settings:
90 input fasta: data/test.fna
91 input qual: data/test.qual
92 min q-score: 15
93 min fragment length: 30
94 run mode: 0 (truncate/don't tolerate homopolymers/don't tolerate ambigs)
95 5' tag: ATATCGCGAGGA
96 max tag mismatches: 0
97
98 run summary:
99 total bases : 29570
100 original reads : 305
101 q10 : 0.995502
102 q20 : 0.860298
103 q30 : 0.728745
104 mean q-score : 33.2273
105 contributing reads: 5
106 retained fragments: 5
107
108 original read length distribution:
109 mean: 96.9508
110 median: 77
111 variance 3743.03
112 standard deviation: 61.1803
113 min: 49
114 2.5%: 54
115 97.5%: 332
116 max: 497
117
118 retained fragment length distribution:
119 mean: 41
120 median: 37
121 variance 72.5
122 standard deviation: 8.51469
123 min: 33
124 2.5%: 33
125 97.5%: 54
126 max: 54
127
128 #### stdout: ####
129
130 >GM98SRO01B77KU rank=0000671 x=796.0 y=1996.0 length=58
131 CCACGCGTATCGATGTCGACTTTTTTTTCTTTTCTTACATAGTAG
132 >GM98SRO01BA3RP rank=0000953 x=419.5 y=1603.5 length=87
133 CTGATGCTGCACCAACTGTACTCCCTCGCGATA
134 >GM98SRO01E1BKW rank=0001233 x=1948.0 y=846.0 length=66
135 TACAGTTGGTGCAGCATCAGAAAAGTACGACATCGATACGCGTGGTCCTCGCGA
136 >GM98SRO01DVVNY rank=0001304 x=1476.0 y=636.5 length=84
137 ACGGCTGATGCTGCACCAACTGTACTCCCTCGCGATA
138 >GM98SRO01D6FIX rank=0001416 x=1596.0 y=1415.0 length=91
139 CGGCTGATGCTGCACCAACTGTACTCCCTCGCGATA
140 ]]></help>
141 <citations>
142 <citation type="bibtex">
143 @UNPUBLISHED{spond,
144 author = "Sergei Kosakovsky Pond",
145 title = "HyPhy: Hypothesis Testing using Phylogenies",
146 year = "2000",
147 note = "http://hyphy.org/",
148 url = "http://hyphy.org/"}
149 </citation>
150 </citations>
151 </tool>