Mercurial > repos > veg > qfilt
comparison qfilt.xml @ 1:2ab93e1952c5 draft default tip
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/qfilt commit c9f251e99e052ab4d87ed5fd89e466cdf387742b-dirty
| author | veg |
|---|---|
| date | Wed, 18 Apr 2018 16:53:05 -0400 |
| parents | |
| children |
comparison
equal
deleted
inserted
replaced
| 0:5ac0ec2d69b2 | 1:2ab93e1952c5 |
|---|---|
| 1 <?xml version="1.0"?> | |
| 2 <tool id="qfilt" version="1.0.0" name="qfilt"> | |
| 3 <description>filter sequencing data using simple heuristics</description> | |
| 4 <requirements> | |
| 5 <requirement type="package" version="0.0.1">qfilt</requirement> | |
| 6 </requirements> | |
| 7 <stdio> | |
| 8 <exit_code range="1:"/> | |
| 9 </stdio> | |
| 10 <command><![CDATA[ | |
| 11 qfilt -o '$filtered_output' | |
| 12 #if str($options.advanced) == 'advanced': | |
| 13 -q $options.qscore -l $options.length | |
| 14 -s $options.split | |
| 15 #if $options.replace and $options.remove: | |
| 16 -P $options.replace -R $options.remove | |
| 17 #elif $options.mode: | |
| 18 -m $options.mode | |
| 19 #end if | |
| 20 #if $options.prefix: | |
| 21 -t $options.mismatch | |
| 22 -T $options.prefix | |
| 23 #end if | |
| 24 -f $options.format | |
| 25 $options.tolerate_homopolymeric $options.tolerate_ambiguous | |
| 26 #end if | |
| 27 -Q '$input_fastq' | |
| 28 ]]></command> | |
| 29 <inputs> | |
| 30 | |
| 31 <param name="input_fastq" argument="-Q" type="data" format="fastq" label="Input FASTA" help="FASTQ File" /> | |
| 32 | |
| 33 <conditional name="options"> | |
| 34 | |
| 35 <param name="advanced" type="select" label="Additional options"> | |
| 36 <option value="defaults">Use defaults</option> | |
| 37 <option value="advanced">Specify additional parameters</option> | |
| 38 </param> | |
| 39 | |
| 40 <when value="defaults"/> | |
| 41 | |
| 42 <when value="advanced"> | |
| 43 <param name="qscore" argument="-q" type="integer" value="20" label="QScore" help="minimum per-base quality score below which a read will be split or truncated" /> | |
| 44 <param name="length" argument="-l" type="integer" value="50" label="Length" help="minimum retained fragment LENGTH" /> | |
| 45 <param name="mode" argument="-m" type="integer" value="0" label="Mode" help="MODE is a 3-bitmask (an integer in [0-7], default=0)" /> | |
| 46 <param name="split" argument="-s" type="text" label="Split" help="when encountering a low q-score, split instead of truncate" /> | |
| 47 <param name="tolerate_homopolymeric" argument="-p" type="boolean" truevalue="-p" falsevalue="" label="Tolerate Homopolymeric" help="tolerate low q-score homopolymeric regions" /> | |
| 48 <param name="tolerate_ambiguous" argument="-a" type="boolean" truevalue="-a" falsevalue="" label="Tolerate Ambiguous" help="tolerate low q-score ambiguous nucleotides" /> | |
| 49 <param name="replace" argument="-P" type="text" label="Replace" help="rather than splitting or truncating, replace low quality bases with CHAR this option OVERRIDES all -m mode options" /> | |
| 50 <param name="remove" argument="-R" type="text" label="Remove" help="rather than splitting or truncating, remove reads which contain more than COUNT low quality bases this option only works in COMBINATION with the -P (punch) option" /> | |
| 51 <param name="prefix" argument="-T" type="text" label="Prefix" help="if supplied, only reads with this PREFIX are retained, and the PREFIX is stripped from each contributing read" /> | |
| 52 <param name="mismatch" argument="-t" type="integer" value="0" label="Mismatch" help="if PREFIX is supplied, prefix matching tolerates at most MISMATCH mismatches" /> | |
| 53 <param name="format" argument="-f" type="select" label="Format" help="output in FASTA or FASTQ format (default=FASTA)" > | |
| 54 <option value="FASTA">FASTA</option> | |
| 55 <option value="FASTQ">FASTQ</option> | |
| 56 </param> | |
| 57 </when> | |
| 58 | |
| 59 </conditional> | |
| 60 | |
| 61 </inputs> | |
| 62 <outputs> | |
| 63 <data format="fasta" name="filtered_output"/> | |
| 64 </outputs> | |
| 65 <tests> | |
| 66 <test> | |
| 67 <param name="input_fastq" value="qfilt-in1.fastq" /> | |
| 68 <output file="qfilt-out1.fa" ftype="fasta" name="filtered_output" /> | |
| 69 </test> | |
| 70 <test> | |
| 71 <param name="input_fastq" value="qfilt-in1.fastq" /> | |
| 72 <param name="advanced" value="advanced" /> | |
| 73 <param name="tolerate_homopolymeric" value="False" /> | |
| 74 <output file="qfilt-out2.fa" ftype="fasta" name="filtered_output" /> | |
| 75 </test> | |
| 76 </tests> | |
| 77 <help><![CDATA[ | |
| 78 qfilt | |
| 79 ===== | |
| 80 | |
| 81 This simple program is meant to filter sequencing data, | |
| 82 optionally removing or splitting reads with poor quality scores | |
| 83 and to optionally _only_ retain fragments from reads that are tagged with a given 5' sequence. | |
| 84 | |
| 85 ### OUTPUT: #### | |
| 86 | |
| 87 #### stderr: #### | |
| 88 | |
| 89 run settings: | |
| 90 input fasta: data/test.fna | |
| 91 input qual: data/test.qual | |
| 92 min q-score: 15 | |
| 93 min fragment length: 30 | |
| 94 run mode: 0 (truncate/don't tolerate homopolymers/don't tolerate ambigs) | |
| 95 5' tag: ATATCGCGAGGA | |
| 96 max tag mismatches: 0 | |
| 97 | |
| 98 run summary: | |
| 99 total bases : 29570 | |
| 100 original reads : 305 | |
| 101 q10 : 0.995502 | |
| 102 q20 : 0.860298 | |
| 103 q30 : 0.728745 | |
| 104 mean q-score : 33.2273 | |
| 105 contributing reads: 5 | |
| 106 retained fragments: 5 | |
| 107 | |
| 108 original read length distribution: | |
| 109 mean: 96.9508 | |
| 110 median: 77 | |
| 111 variance 3743.03 | |
| 112 standard deviation: 61.1803 | |
| 113 min: 49 | |
| 114 2.5%: 54 | |
| 115 97.5%: 332 | |
| 116 max: 497 | |
| 117 | |
| 118 retained fragment length distribution: | |
| 119 mean: 41 | |
| 120 median: 37 | |
| 121 variance 72.5 | |
| 122 standard deviation: 8.51469 | |
| 123 min: 33 | |
| 124 2.5%: 33 | |
| 125 97.5%: 54 | |
| 126 max: 54 | |
| 127 | |
| 128 #### stdout: #### | |
| 129 | |
| 130 >GM98SRO01B77KU rank=0000671 x=796.0 y=1996.0 length=58 | |
| 131 CCACGCGTATCGATGTCGACTTTTTTTTCTTTTCTTACATAGTAG | |
| 132 >GM98SRO01BA3RP rank=0000953 x=419.5 y=1603.5 length=87 | |
| 133 CTGATGCTGCACCAACTGTACTCCCTCGCGATA | |
| 134 >GM98SRO01E1BKW rank=0001233 x=1948.0 y=846.0 length=66 | |
| 135 TACAGTTGGTGCAGCATCAGAAAAGTACGACATCGATACGCGTGGTCCTCGCGA | |
| 136 >GM98SRO01DVVNY rank=0001304 x=1476.0 y=636.5 length=84 | |
| 137 ACGGCTGATGCTGCACCAACTGTACTCCCTCGCGATA | |
| 138 >GM98SRO01D6FIX rank=0001416 x=1596.0 y=1415.0 length=91 | |
| 139 CGGCTGATGCTGCACCAACTGTACTCCCTCGCGATA | |
| 140 ]]></help> | |
| 141 <citations> | |
| 142 <citation type="bibtex"> | |
| 143 @UNPUBLISHED{spond, | |
| 144 author = "Sergei Kosakovsky Pond", | |
| 145 title = "HyPhy: Hypothesis Testing using Phylogenies", | |
| 146 year = "2000", | |
| 147 note = "http://hyphy.org/", | |
| 148 url = "http://hyphy.org/"} | |
| 149 </citation> | |
| 150 </citations> | |
| 151 </tool> |
