annotate fastq_filter.xml @ 0:0017fa63af6c draft

Imported from capsule None
author devteam
date Thu, 23 Jan 2014 12:31:42 -0500
parents
children a30fc80df16c
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
1 <tool id="fastq_filter" name="Filter FASTQ" version="1.0.0">
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
2 <description>reads by quality score and length</description>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
3 <requirements>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
4 <requirement type="package" version="1.0.0">galaxy_sequence_utils</requirement>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
5 </requirements>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
6 <command interpreter="python">fastq_filter.py $input_file $fastq_filter_file $output_file $output_file.files_path '${input_file.extension[len( 'fastq' ):]}'</command>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
7 <inputs>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
8 <page>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
9 <param name="input_file" type="data" format="fastqsanger,fastqcssanger" label="FASTQ File" help="Requires groomed data: if your data does not appear here try using the FASTQ groomer."/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
10 <param name="min_size" label="Minimum Size" value="0" type="integer">
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
11 <validator type="in_range" message="Minimum size must not be negative" min="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
12 </param>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
13 <param name="max_size" label="Maximum Size" value="0" type="integer" help="A maximum size less than 1 indicates no limit."/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
14 <param name="min_quality" label="Minimum Quality" value="0" type="float"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
15 <param name="max_quality" label="Maximum Quality" value="0" type="float" help="A maximum quality of 0 or less indicates no limit."/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
16 <param name="max_num_deviants" label="Maximum number of bases allowed outside of quality range" value="0" type="integer">
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
17 <validator type="in_range" message="Maximum number of deviant bases must not be negative" min="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
18 </param>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
19 <param name="paired_end" label="This is paired end data" type="boolean" truevalue="paired_end" falsevalue="single_end" checked="False"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
20 <repeat name="fastq_filters" title="Quality Filter on a Range of Bases" help="The above settings do not apply to these filters.">
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
21 <conditional name="offset_type">
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
22 <param name="base_offset_type" type="select" label="Define Base Offsets as" help="Use Absolute for fixed length reads (Illumina, SOLiD)&lt;br&gt;Use Percentage for variable length reads (Roche/454)">
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
23 <option value="offsets_absolute" selected="true">Absolute Values</option>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
24 <option value="offsets_percent">Percentage of Read Length</option>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
25 </param>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
26 <when value="offsets_absolute">
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
27 <param name="left_column_offset" label="Offset from 5' end" value="0" type="integer" help="Values start at 0, increasing from the left">
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
28 <validator type="in_range" message="Base Offsets must be positive" min="0" max="inf"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
29 <validator type="expression" message="An integer is required.">int( float( value ) ) == float( value )</validator>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
30 </param>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
31 <param name="right_column_offset" label="Offset from 3' end" value="0" type="integer" help="Values start at 0, increasing from the right">
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
32 <validator type="in_range" message="Base Offsets must be positive" min="0" max="inf"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
33 <validator type="expression" message="An integer is required.">int( float( value ) ) == float( value )</validator>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
34 </param>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
35 </when>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
36 <when value="offsets_percent">
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
37 <param name="left_column_offset" label="Offset from 5' end" value="0" type="float">
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
38 <validator type="in_range" message="Base Offsets must be between 0 and 100" min="0" max="100"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
39 </param>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
40 <param name="right_column_offset" label="Offset from 3' end" value="0" type="float">
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
41 <validator type="in_range" message="Base Offsets must be between 0 and 100" min="0" max="100"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
42 </param>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
43 </when>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
44 </conditional>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
45 <param name="score_operation" type="select" label="Aggregate read score for specified range">
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
46 <option value="min" selected="True">min score</option>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
47 <option value="max">max score</option>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
48 <option value="sum">sum of scores</option>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
49 <option value="mean">mean of scores</option>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
50 </param>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
51 <param name="score_comparison" type="select" label="Keep read when aggregate score is">
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
52 <option value="&gt;">&gt;</option>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
53 <option value="&gt;=" selected="true">&gt;=</option>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
54 <option value="==">==</option>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
55 <option value="&lt;">&lt;</option>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
56 <option value="&lt;=">&lt;=</option>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
57 <sanitizer sanitize="False"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
58 </param>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
59 <param name="score" label="Quality Score" value="0" type="float" />
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
60 </repeat>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
61 </page>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
62 </inputs>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
63 <configfiles>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
64 <configfile name="fastq_filter_file">
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
65 def fastq_read_pass_filter( fastq_read ):
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
66 def mean( score_list ):
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
67 return float( sum( score_list ) ) / float( len( score_list ) )
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
68 if len( fastq_read ) &lt; $min_size:
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
69 return False
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
70 if $max_size &gt; 0 and len( fastq_read ) &gt; $max_size:
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
71 return False
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
72 num_deviates = $max_num_deviants
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
73 qual_scores = fastq_read.get_decimal_quality_scores()
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
74 for qual_score in qual_scores:
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
75 if qual_score &lt; $min_quality or ( $max_quality &gt; 0 and qual_score &gt; $max_quality ):
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
76 if num_deviates == 0:
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
77 return False
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
78 else:
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
79 num_deviates -= 1
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
80 #if not $paired_end:
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
81 qual_scores_split = [ qual_scores ]
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
82 #else:
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
83 qual_scores_split = [ qual_scores[ 0:int( len( qual_scores ) / 2 ) ], qual_scores[ int( len( qual_scores ) / 2 ): ] ]
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
84 #end if
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
85 #for $fastq_filter in $fastq_filters:
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
86 for split_scores in qual_scores_split:
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
87 left_column_offset = $fastq_filter[ 'offset_type' ][ 'left_column_offset' ]
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
88 right_column_offset = $fastq_filter[ 'offset_type' ][ 'right_column_offset' ]
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
89 #if $fastq_filter[ 'offset_type' ]['base_offset_type'] == 'offsets_percent':
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
90 left_column_offset = int( round( float( left_column_offset ) / 100.0 * float( len( split_scores ) ) ) )
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
91 right_column_offset = int( round( float( right_column_offset ) / 100.0 * float( len( split_scores ) ) ) )
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
92 #end if
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
93 if right_column_offset > 0:
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
94 split_scores = split_scores[ left_column_offset:-right_column_offset]
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
95 else:
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
96 split_scores = split_scores[ left_column_offset:]
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
97 if split_scores: ##if a read doesn't have enough columns, it passes by default
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
98 if not ( ${fastq_filter[ 'score_operation' ]}( split_scores ) $fastq_filter[ 'score_comparison' ] $fastq_filter[ 'score' ] ):
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
99 return False
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
100 #end for
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
101 return True
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
102 </configfile>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
103 </configfiles>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
104 <outputs>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
105 <data format_source="input_file" name="output_file" /> <!-- output inherits the datatype of input_file (fastqsanger or fastqcssanger) -->
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
106 </outputs>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
107 <tests>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
108 <!-- Do nothing filter -->
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
109 <test>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
110 <param name="input_file" value="sanger_full_range_original_sanger.fastqsanger" ftype="fastqsanger"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
111 <param name="min_size" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
112 <param name="max_size" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
113 <param name="min_quality" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
114 <param name="max_quality" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
115 <param name="max_num_deviants" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
116 <param name="paired_end" value="False"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
117 <param name="base_offset_type" value="offsets_absolute"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
118 <param name="left_column_offset" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
119 <param name="right_column_offset" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
120 <param name="score_operation" value="min"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
121 <param name="score_comparison" value="&gt;="/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
122 <param name="score" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
123 <output name="output_file" file="sanger_full_range_original_sanger.fastqsanger"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
124 </test>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
125 <!-- crippled input types prevent this test <test>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
126 <param name="input_file" value="solexa_full_range_original_solexa.fastqsolexa" ftype="fastqsolexa"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
127 <param name="min_size" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
128 <param name="max_size" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
129 <param name="min_quality" value="-5"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
130 <param name="max_quality" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
131 <param name="max_num_deviants" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
132 <param name="paired_end" value="False"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
133 <param name="base_offset_type" value="offsets_absolute"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
134 <param name="left_column_offset" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
135 <param name="right_column_offset" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
136 <param name="score_operation" value="min"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
137 <param name="score_comparison" value="&gt;="/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
138 <param name="score" value="-5"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
139 <output name="out_file1" file="solexa_full_range_original_solexa.fastqsolexa"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
140 </test> -->
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
141 <!-- No trim, so does not remove Adapter from cssanger -->
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
142 <test>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
143 <param name="input_file" value="sanger_full_range_as_cssanger.fastqcssanger" ftype="fastqcssanger"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
144 <param name="min_size" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
145 <param name="max_size" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
146 <param name="min_quality" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
147 <param name="max_quality" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
148 <param name="max_num_deviants" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
149 <param name="paired_end" value="False"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
150 <param name="base_offset_type" value="offsets_absolute"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
151 <param name="left_column_offset" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
152 <param name="right_column_offset" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
153 <param name="score_operation" value="min"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
154 <param name="score_comparison" value="&gt;="/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
155 <param name="score" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
156 <output name="output_file" file="sanger_full_range_as_cssanger.fastqcssanger"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
157 </test>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
158 <!-- Remove all Filter -->
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
159 <test>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
160 <param name="input_file" value="sanger_full_range_original_sanger.fastqsanger" ftype="fastqsanger"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
161 <param name="min_size" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
162 <param name="max_size" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
163 <param name="min_quality" value="1"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
164 <param name="max_quality" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
165 <param name="max_num_deviants" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
166 <param name="paired_end" value="False"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
167 <param name="base_offset_type" value="offsets_absolute"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
168 <param name="left_column_offset" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
169 <param name="right_column_offset" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
170 <param name="score_operation" value="min"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
171 <param name="score_comparison" value="&gt;="/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
172 <param name="score" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
173 <output name="output_file" file="empty_file.dat"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
174 </test>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
175 <!-- crippled input types prevent this test <test>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
176 <param name="input_file" value="solexa_full_range_original_solexa.fastqsolexa" ftype="fastqsolexa"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
177 <param name="min_size" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
178 <param name="max_size" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
179 <param name="min_quality" value="-4"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
180 <param name="max_quality" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
181 <param name="max_num_deviants" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
182 <param name="paired_end" value="False"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
183 <param name="base_offset_type" value="offsets_absolute"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
184 <param name="left_column_offset" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
185 <param name="right_column_offset" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
186 <param name="score_operation" value="min"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
187 <param name="score_comparison" value="&gt;="/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
188 <param name="score" value="-5"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
189 <output name="out_file1" file="empty_file.dat"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
190 </test> -->
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
191 <!-- Keep all by allowing 1 deviant -->
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
192 <test>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
193 <param name="input_file" value="sanger_full_range_original_sanger.fastqsanger" ftype="fastqsanger"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
194 <param name="min_size" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
195 <param name="max_size" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
196 <param name="min_quality" value="1"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
197 <param name="max_quality" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
198 <param name="max_num_deviants" value="1"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
199 <param name="paired_end" value="False"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
200 <param name="base_offset_type" value="offsets_absolute"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
201 <param name="left_column_offset" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
202 <param name="right_column_offset" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
203 <param name="score_operation" value="min"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
204 <param name="score_comparison" value="&gt;="/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
205 <param name="score" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
206 <output name="output_file" file="sanger_full_range_original_sanger.fastqsanger"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
207 </test>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
208 <!-- crippled input types prevent this test<test>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
209 <param name="input_file" value="solexa_full_range_original_solexa.fastqsolexa" ftype="fastqsolexa"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
210 <param name="min_size" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
211 <param name="max_size" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
212 <param name="min_quality" value="-5"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
213 <param name="max_quality" value="61"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
214 <param name="max_num_deviants" value="1"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
215 <param name="paired_end" value="False"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
216 <param name="base_offset_type" value="offsets_absolute"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
217 <param name="left_column_offset" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
218 <param name="right_column_offset" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
219 <param name="score_operation" value="min"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
220 <param name="score_comparison" value="&gt;="/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
221 <param name="score" value="-5"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
222 <output name="out_file1" file="solexa_full_range_original_solexa.fastqsolexa"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
223 </test> -->
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
224 <!-- Filter inner range -->
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
225 <test>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
226 <param name="input_file" value="sanger_full_range_original_sanger.fastqsanger" ftype="fastqsanger"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
227 <param name="min_size" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
228 <param name="max_size" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
229 <param name="min_quality" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
230 <param name="max_quality" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
231 <param name="max_num_deviants" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
232 <param name="paired_end" value="False"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
233 <param name="base_offset_type" value="offsets_absolute"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
234 <param name="left_column_offset" value="1"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
235 <param name="right_column_offset" value="1"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
236 <param name="score_operation" value="min"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
237 <param name="score_comparison" value="&gt;="/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
238 <param name="score" value="1"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
239 <output name="output_file" file="sanger_full_range_original_sanger.fastqsanger"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
240 </test>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
241 <test>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
242 <param name="input_file" value="sanger_full_range_original_sanger.fastqsanger" ftype="fastqsanger"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
243 <param name="min_size" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
244 <param name="max_size" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
245 <param name="min_quality" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
246 <param name="max_quality" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
247 <param name="max_num_deviants" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
248 <param name="paired_end" value="False"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
249 <param name="base_offset_type" value="offsets_absolute"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
250 <param name="left_column_offset" value="1"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
251 <param name="right_column_offset" value="1"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
252 <param name="score_operation" value="max"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
253 <param name="score_comparison" value="&lt;="/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
254 <param name="score" value="92"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
255 <output name="output_file" file="sanger_full_range_original_sanger.fastqsanger"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
256 </test>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
257 <!-- percent based offsets -->
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
258 <test>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
259 <param name="input_file" value="sanger_full_range_original_sanger.fastqsanger" ftype="fastqsanger"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
260 <param name="min_size" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
261 <param name="max_size" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
262 <param name="min_quality" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
263 <param name="max_quality" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
264 <param name="max_num_deviants" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
265 <param name="paired_end" value="False"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
266 <param name="base_offset_type" value="offsets_percent"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
267 <param name="left_column_offset" value="1.075"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
268 <param name="right_column_offset" value="1.075"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
269 <param name="score_operation" value="min"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
270 <param name="score_comparison" value="&gt;="/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
271 <param name="score" value="1"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
272 <output name="out_file1" file="sanger_full_range_original_sanger.fastqsanger"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
273 </test>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
274 <test>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
275 <param name="input_file" value="sanger_full_range_original_sanger.fastqsanger" ftype="fastqsanger"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
276 <param name="min_size" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
277 <param name="max_size" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
278 <param name="min_quality" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
279 <param name="max_quality" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
280 <param name="max_num_deviants" value="0"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
281 <param name="paired_end" value="True"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
282 <param name="base_offset_type" value="offsets_percent"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
283 <param name="left_column_offset" value="1"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
284 <param name="right_column_offset" value="1"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
285 <param name="score_operation" value="min"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
286 <param name="score_comparison" value="&gt;="/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
287 <param name="score" value="1"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
288 <output name="out_file1" file="empty_file.dat"/>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
289 </test>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
290 </tests>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
291 <help>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
292 This tool allows you to build complex filters to be applied to each read in a FASTQ file.
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
293
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
294 **Basic Options:**
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
295 * You can specify minimum and maximum read lengths.
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
296 * You can specify minimum and maximum per-base quality scores, and optionally the number of bases that are allowed to deviate from this range (default of 0 deviant bases).
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
297 * If your data is paired-end, select the proper checkbox; this will cause each read to be internally split down the middle and filters applied to each half using the offsets specified.
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
298
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
299 **Advanced Options:**
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
300 * You can specify any number of advanced filters.
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
301 * 5' and 3' offsets are defined, starting at zero, increasing from the respective end of the reads. For example, a quality string of "ABCDEFG" with 5' and 3' offsets of 1 and 1, respectively, will yield "BCDEF".
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
302 * You can specify either absolute offset values, or percentage offset values. *Absolute Values* based offsets are useful for fixed length reads (e.g. Illumina or SOLiD data). *Percentage of Read Length* based offsets are useful for variable length reads (e.g. 454 data). When using the percent-based method, offsets are rounded to the nearest integer.
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
303 * You specify the aggregating action (min, max, sum, mean) to perform on the quality score values found between the specified offsets; the aggregated value is then tested using the user-defined comparison operation and comparison value.
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
304 * If a set of offsets is specified that causes the remaining quality score list to be of length zero, then the read will **pass** the quality filter unless the size range filter is used to remove these reads.
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
305
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
306 -----
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
307
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
308 .. class:: warningmark
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
309
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
310 Adapter bases in color space reads are excluded from filtering.
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
311
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
312 ------
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
313
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
314 **Citation**
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
315
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
316 If you use this tool, please cite `Blankenberg D, Gordon A, Von Kuster G, Coraor N, Taylor J, Nekrutenko A; Galaxy Team. Manipulation of FASTQ data with Galaxy. Bioinformatics. 2010 Jul 15;26(14):1783-5. &lt;http://www.ncbi.nlm.nih.gov/pubmed/20562416&gt;`_
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
317
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
318
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
319 </help>
0017fa63af6c Imported from capsule None
devteam
parents:
diff changeset
320 </tool>