annotate bismark_bowtie_wrapper.xml @ 9:221e740377ca draft

Uploaded
author bgruening
date Tue, 13 Nov 2012 13:30:32 -0500
parents
children 73508c5b4273
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
9
221e740377ca Uploaded
bgruening
parents:
diff changeset
1 <tool id="bismark_bowtie" name="Bismark" version="0.7.7.2">
221e740377ca Uploaded
bgruening
parents:
diff changeset
2 <!-- Wrapper compatible with Bismark version 0.7.7 -->
221e740377ca Uploaded
bgruening
parents:
diff changeset
3 <description>bisulfite mapper (bowtie)</description>
221e740377ca Uploaded
bgruening
parents:
diff changeset
4 <!--<version_command>bismark version</version_command>-->
221e740377ca Uploaded
bgruening
parents:
diff changeset
5 <requirements>
221e740377ca Uploaded
bgruening
parents:
diff changeset
6 <requirement type="set_environment">SCRIPT_PATH</requirement>
221e740377ca Uploaded
bgruening
parents:
diff changeset
7 <requirement type="package" version="0.12.8">bowtie</requirement>
221e740377ca Uploaded
bgruening
parents:
diff changeset
8 <requirement type="package" version="2.0.0-beta7">bowtie2</requirement>
221e740377ca Uploaded
bgruening
parents:
diff changeset
9 </requirements>
221e740377ca Uploaded
bgruening
parents:
diff changeset
10 <parallelism method="basic"></parallelism>
221e740377ca Uploaded
bgruening
parents:
diff changeset
11 <command interpreter="python">
221e740377ca Uploaded
bgruening
parents:
diff changeset
12 bismark_wrapper.py
221e740377ca Uploaded
bgruening
parents:
diff changeset
13
221e740377ca Uploaded
bgruening
parents:
diff changeset
14 ## Change this to accommodate the number of threads you have available.
221e740377ca Uploaded
bgruening
parents:
diff changeset
15 --num-threads 4
221e740377ca Uploaded
bgruening
parents:
diff changeset
16
221e740377ca Uploaded
bgruening
parents:
diff changeset
17 --bismark_path \$SCRIPT_PATH
221e740377ca Uploaded
bgruening
parents:
diff changeset
18
221e740377ca Uploaded
bgruening
parents:
diff changeset
19 ##
221e740377ca Uploaded
bgruening
parents:
diff changeset
20 ## Bismark Genome Preparation, if desired.
221e740377ca Uploaded
bgruening
parents:
diff changeset
21 ##
221e740377ca Uploaded
bgruening
parents:
diff changeset
22
221e740377ca Uploaded
bgruening
parents:
diff changeset
23 ## Handle reference file.
221e740377ca Uploaded
bgruening
parents:
diff changeset
24 #if $refGenomeSource.genomeSource == "history":
221e740377ca Uploaded
bgruening
parents:
diff changeset
25 --own-file=$refGenomeSource.ownFile
221e740377ca Uploaded
bgruening
parents:
diff changeset
26 #else:
221e740377ca Uploaded
bgruening
parents:
diff changeset
27 --indexes-path ${refGenomeSource.index.fields.path}
221e740377ca Uploaded
bgruening
parents:
diff changeset
28 #end if
221e740377ca Uploaded
bgruening
parents:
diff changeset
29
221e740377ca Uploaded
bgruening
parents:
diff changeset
30
221e740377ca Uploaded
bgruening
parents:
diff changeset
31 ##
221e740377ca Uploaded
bgruening
parents:
diff changeset
32 ## Input parameters
221e740377ca Uploaded
bgruening
parents:
diff changeset
33 ##
221e740377ca Uploaded
bgruening
parents:
diff changeset
34
221e740377ca Uploaded
bgruening
parents:
diff changeset
35
221e740377ca Uploaded
bgruening
parents:
diff changeset
36 #if $singlePaired.sPaired == "single":
221e740377ca Uploaded
bgruening
parents:
diff changeset
37 --single-paired $singlePaired.input_singles
221e740377ca Uploaded
bgruening
parents:
diff changeset
38
221e740377ca Uploaded
bgruening
parents:
diff changeset
39 #if $singlePaired.input_singles.ext == "fastqillumina":
221e740377ca Uploaded
bgruening
parents:
diff changeset
40 --phred64-quals
221e740377ca Uploaded
bgruening
parents:
diff changeset
41 --fastq
221e740377ca Uploaded
bgruening
parents:
diff changeset
42 #elif $singlePaired.input_singles.ext == "fastqsanger":
221e740377ca Uploaded
bgruening
parents:
diff changeset
43 --fastq
221e740377ca Uploaded
bgruening
parents:
diff changeset
44 #elif $singlePaired.input_singles.ext == "fasta":
221e740377ca Uploaded
bgruening
parents:
diff changeset
45 --fasta
221e740377ca Uploaded
bgruening
parents:
diff changeset
46 #end if
221e740377ca Uploaded
bgruening
parents:
diff changeset
47 #else:
221e740377ca Uploaded
bgruening
parents:
diff changeset
48 --mate-paired
221e740377ca Uploaded
bgruening
parents:
diff changeset
49 --mate1 $singlePaired.input_mate1
221e740377ca Uploaded
bgruening
parents:
diff changeset
50 --mate2 $singlePaired.input_mate2
221e740377ca Uploaded
bgruening
parents:
diff changeset
51
221e740377ca Uploaded
bgruening
parents:
diff changeset
52 #if $singlePaired.input_mate1.ext == "fastqillumina":
221e740377ca Uploaded
bgruening
parents:
diff changeset
53 --phred64-quals
221e740377ca Uploaded
bgruening
parents:
diff changeset
54 --fastq
221e740377ca Uploaded
bgruening
parents:
diff changeset
55 #elif $singlePaired.input_mate1.ext == "fastqsanger":
221e740377ca Uploaded
bgruening
parents:
diff changeset
56 --fastq
221e740377ca Uploaded
bgruening
parents:
diff changeset
57 #elif $singlePaired.input_mate1.ext == "fasta":
221e740377ca Uploaded
bgruening
parents:
diff changeset
58 --fasta
221e740377ca Uploaded
bgruening
parents:
diff changeset
59 #end if
221e740377ca Uploaded
bgruening
parents:
diff changeset
60
221e740377ca Uploaded
bgruening
parents:
diff changeset
61 -I $singlePaired.minInsert
221e740377ca Uploaded
bgruening
parents:
diff changeset
62 -X $singlePaired.maxInsert
221e740377ca Uploaded
bgruening
parents:
diff changeset
63 #end if
221e740377ca Uploaded
bgruening
parents:
diff changeset
64
221e740377ca Uploaded
bgruening
parents:
diff changeset
65
221e740377ca Uploaded
bgruening
parents:
diff changeset
66 ## for now hardcode the value for the required memory per thread in --best mode
221e740377ca Uploaded
bgruening
parents:
diff changeset
67 --chunkmbs 512
221e740377ca Uploaded
bgruening
parents:
diff changeset
68
221e740377ca Uploaded
bgruening
parents:
diff changeset
69
221e740377ca Uploaded
bgruening
parents:
diff changeset
70 #if $params.settingsType == "custom":
221e740377ca Uploaded
bgruening
parents:
diff changeset
71
221e740377ca Uploaded
bgruening
parents:
diff changeset
72 ## default 20
221e740377ca Uploaded
bgruening
parents:
diff changeset
73 --seed-len $params.seed_len
221e740377ca Uploaded
bgruening
parents:
diff changeset
74 ## default 0
221e740377ca Uploaded
bgruening
parents:
diff changeset
75 --seed-mismatches $params.seed_mismatches
221e740377ca Uploaded
bgruening
parents:
diff changeset
76 ## default 15
221e740377ca Uploaded
bgruening
parents:
diff changeset
77 --seed-extention-attempts $params.seed_extention_attempts
221e740377ca Uploaded
bgruening
parents:
diff changeset
78 ## default 2
221e740377ca Uploaded
bgruening
parents:
diff changeset
79 --max-reseed $params.max_reseed
221e740377ca Uploaded
bgruening
parents:
diff changeset
80
221e740377ca Uploaded
bgruening
parents:
diff changeset
81 ## default 70
221e740377ca Uploaded
bgruening
parents:
diff changeset
82 ##--maqerr $params.maqerr
221e740377ca Uploaded
bgruening
parents:
diff changeset
83
221e740377ca Uploaded
bgruening
parents:
diff changeset
84 ## default unlimited
221e740377ca Uploaded
bgruening
parents:
diff changeset
85 #if $params.qupto != 0:
221e740377ca Uploaded
bgruening
parents:
diff changeset
86 --qupto $params.qupto
221e740377ca Uploaded
bgruening
parents:
diff changeset
87 #end if
221e740377ca Uploaded
bgruening
parents:
diff changeset
88 #if $params.skip_reads != 0:
221e740377ca Uploaded
bgruening
parents:
diff changeset
89 --skip-reads $params.skip_reads
221e740377ca Uploaded
bgruening
parents:
diff changeset
90 #end if
221e740377ca Uploaded
bgruening
parents:
diff changeset
91
221e740377ca Uploaded
bgruening
parents:
diff changeset
92 ## if set, disable the original behaviour
221e740377ca Uploaded
bgruening
parents:
diff changeset
93 $params.no_mixed
221e740377ca Uploaded
bgruening
parents:
diff changeset
94 ## if set, disable the original behaviour
221e740377ca Uploaded
bgruening
parents:
diff changeset
95 $params.no_discordant
221e740377ca Uploaded
bgruening
parents:
diff changeset
96
221e740377ca Uploaded
bgruening
parents:
diff changeset
97
221e740377ca Uploaded
bgruening
parents:
diff changeset
98 ###if str($params.isReportOutput) == "yes":
221e740377ca Uploaded
bgruening
parents:
diff changeset
99 ## --output-report-file $report_file
221e740377ca Uploaded
bgruening
parents:
diff changeset
100 ###end if
221e740377ca Uploaded
bgruening
parents:
diff changeset
101
221e740377ca Uploaded
bgruening
parents:
diff changeset
102 #end if
221e740377ca Uploaded
bgruening
parents:
diff changeset
103
221e740377ca Uploaded
bgruening
parents:
diff changeset
104 ##
221e740377ca Uploaded
bgruening
parents:
diff changeset
105 ## Output parameters.
221e740377ca Uploaded
bgruening
parents:
diff changeset
106 ##
221e740377ca Uploaded
bgruening
parents:
diff changeset
107 --output $output
221e740377ca Uploaded
bgruening
parents:
diff changeset
108 $suppress_header
221e740377ca Uploaded
bgruening
parents:
diff changeset
109
221e740377ca Uploaded
bgruening
parents:
diff changeset
110 #if str( $singlePaired.sPaired ) == "single"
221e740377ca Uploaded
bgruening
parents:
diff changeset
111 #if $output_unmapped_reads_l
221e740377ca Uploaded
bgruening
parents:
diff changeset
112 --output-unmapped-reads $output_unmapped_reads_l
221e740377ca Uploaded
bgruening
parents:
diff changeset
113 #end if
221e740377ca Uploaded
bgruening
parents:
diff changeset
114 #if $output_suppressed_reads_l
221e740377ca Uploaded
bgruening
parents:
diff changeset
115 --output-suppressed-reads $output_suppressed_reads_l
221e740377ca Uploaded
bgruening
parents:
diff changeset
116 #end if
221e740377ca Uploaded
bgruening
parents:
diff changeset
117 #else
221e740377ca Uploaded
bgruening
parents:
diff changeset
118 #if $output_unmapped_reads_l and $output_unmapped_reads_r
221e740377ca Uploaded
bgruening
parents:
diff changeset
119 --output-unmapped-reads-l $output_unmapped_reads_l
221e740377ca Uploaded
bgruening
parents:
diff changeset
120 --output-unmapped-reads-r $output_unmapped_reads_r
221e740377ca Uploaded
bgruening
parents:
diff changeset
121 #end if
221e740377ca Uploaded
bgruening
parents:
diff changeset
122 #if $output_suppressed_reads_l and $output_suppressed_reads_r
221e740377ca Uploaded
bgruening
parents:
diff changeset
123 --output-suppressed-reads-l $output_suppressed_reads_l
221e740377ca Uploaded
bgruening
parents:
diff changeset
124 --output-suppressed-reads-r $output_suppressed_reads_r
221e740377ca Uploaded
bgruening
parents:
diff changeset
125 #end if
221e740377ca Uploaded
bgruening
parents:
diff changeset
126 #end if
221e740377ca Uploaded
bgruening
parents:
diff changeset
127
221e740377ca Uploaded
bgruening
parents:
diff changeset
128 </command>
221e740377ca Uploaded
bgruening
parents:
diff changeset
129 <inputs>
221e740377ca Uploaded
bgruening
parents:
diff changeset
130 <conditional name="refGenomeSource">
221e740377ca Uploaded
bgruening
parents:
diff changeset
131 <param name="genomeSource" type="select" label="Will you select a reference genome from your history or use a built-in index?" help="Built-ins were indexed using default options">
221e740377ca Uploaded
bgruening
parents:
diff changeset
132 <option value="indexed">Use a built-in index</option>
221e740377ca Uploaded
bgruening
parents:
diff changeset
133 <option value="history">Use one from the history</option>
221e740377ca Uploaded
bgruening
parents:
diff changeset
134 </param>
221e740377ca Uploaded
bgruening
parents:
diff changeset
135 <when value="indexed">
221e740377ca Uploaded
bgruening
parents:
diff changeset
136 <param name="index" type="select" label="Select a reference genome" help="If your genome of interest is not listed, contact your Galaxy admin">
221e740377ca Uploaded
bgruening
parents:
diff changeset
137 <options from_data_table="bowtie_indexes">
221e740377ca Uploaded
bgruening
parents:
diff changeset
138 <filter type="sort_by" column="2"/>
221e740377ca Uploaded
bgruening
parents:
diff changeset
139 <validator type="no_options" message="No indexes are available for the selected input dataset"/>
221e740377ca Uploaded
bgruening
parents:
diff changeset
140 </options>
221e740377ca Uploaded
bgruening
parents:
diff changeset
141 </param>
221e740377ca Uploaded
bgruening
parents:
diff changeset
142 </when> <!-- build-in -->
221e740377ca Uploaded
bgruening
parents:
diff changeset
143 <when value="history">
221e740377ca Uploaded
bgruening
parents:
diff changeset
144 <param name="ownFile" type="data" format="fasta" metadata_name="dbkey" label="Select the reference genome" />
221e740377ca Uploaded
bgruening
parents:
diff changeset
145 </when> <!-- history -->
221e740377ca Uploaded
bgruening
parents:
diff changeset
146 </conditional> <!-- refGenomeSource -->
221e740377ca Uploaded
bgruening
parents:
diff changeset
147
221e740377ca Uploaded
bgruening
parents:
diff changeset
148 <!-- Input Parameters -->
221e740377ca Uploaded
bgruening
parents:
diff changeset
149 <conditional name="singlePaired">
221e740377ca Uploaded
bgruening
parents:
diff changeset
150 <param name="sPaired" type="select" label="Is this library mate-paired?">
221e740377ca Uploaded
bgruening
parents:
diff changeset
151 <option value="single">Single-end</option>
221e740377ca Uploaded
bgruening
parents:
diff changeset
152 <option value="paired">Paired-end</option>
221e740377ca Uploaded
bgruening
parents:
diff changeset
153 </param>
221e740377ca Uploaded
bgruening
parents:
diff changeset
154 <when value="single">
221e740377ca Uploaded
bgruening
parents:
diff changeset
155 <param name="input_singles" type="data" format="fastqsanger,fastqillumina,fastq,fasta" label="FASTQ/FASTA file" help="FASTQ or FASTA files." />
221e740377ca Uploaded
bgruening
parents:
diff changeset
156 </when>
221e740377ca Uploaded
bgruening
parents:
diff changeset
157 <when value="paired">
221e740377ca Uploaded
bgruening
parents:
diff changeset
158 <param name="input_mate1" type="data" format="fastqsanger,fastqillumina,fastq,fasta" label="FASTQ/FASTA file" help="FASTQ or FASTA files." />
221e740377ca Uploaded
bgruening
parents:
diff changeset
159 <param name="input_mate2" type="data" format="fastqsanger,fastqillumina,fastq,fasta" label="FASTQ/FASTA file" help="FASTQ or FASTA files." />
221e740377ca Uploaded
bgruening
parents:
diff changeset
160 <param name="minInsert" type="integer" value="0" label="Minimum insert size for valid paired-end alignments" />
221e740377ca Uploaded
bgruening
parents:
diff changeset
161 <param name="maxInsert" type="integer" value="250" label="Maximum insert size for valid paired-end alignments" />
221e740377ca Uploaded
bgruening
parents:
diff changeset
162 </when>
221e740377ca Uploaded
bgruening
parents:
diff changeset
163 </conditional>
221e740377ca Uploaded
bgruening
parents:
diff changeset
164
221e740377ca Uploaded
bgruening
parents:
diff changeset
165
221e740377ca Uploaded
bgruening
parents:
diff changeset
166 <conditional name="params">
221e740377ca Uploaded
bgruening
parents:
diff changeset
167 <param name="settingsType" type="select" label="Bismark settings to use" help="You can use the default settings or set custom values for any of Bismark's parameters.">
221e740377ca Uploaded
bgruening
parents:
diff changeset
168 <option value="default">Use Defaults</option>
221e740377ca Uploaded
bgruening
parents:
diff changeset
169 <option value="custom">Full parameter list</option>
221e740377ca Uploaded
bgruening
parents:
diff changeset
170 </param>
221e740377ca Uploaded
bgruening
parents:
diff changeset
171 <when value="default" />
221e740377ca Uploaded
bgruening
parents:
diff changeset
172 <!-- Full/advanced params. -->
221e740377ca Uploaded
bgruening
parents:
diff changeset
173 <when value="custom">
221e740377ca Uploaded
bgruening
parents:
diff changeset
174 <!-- -n -->
221e740377ca Uploaded
bgruening
parents:
diff changeset
175 <param name="seed_mismatches" type="select" label="The maximum number of mismatches permitted in the 'seed'.">
221e740377ca Uploaded
bgruening
parents:
diff changeset
176 <option value="0">0</option>
221e740377ca Uploaded
bgruening
parents:
diff changeset
177 <option value="1">1</option>
221e740377ca Uploaded
bgruening
parents:
diff changeset
178 <option value="2" selected="true">2</option>
221e740377ca Uploaded
bgruening
parents:
diff changeset
179 <option value="3">3</option>
221e740377ca Uploaded
bgruening
parents:
diff changeset
180 </param>
221e740377ca Uploaded
bgruening
parents:
diff changeset
181 <!-- -l -->
221e740377ca Uploaded
bgruening
parents:
diff changeset
182 <param name="seed_len" type="integer" value="28" label="The 'seed length'; The number of bases of the high quality end of the read to which the maximum number of mismatches applies." />
221e740377ca Uploaded
bgruening
parents:
diff changeset
183 <!--
221e740377ca Uploaded
bgruening
parents:
diff changeset
184 <param name="maqerr" type="integer" value="70" label="Maximum permitted total of quality values at all mismatched read positions throughout the entire alignment, not just in the 'seed'." />
221e740377ca Uploaded
bgruening
parents:
diff changeset
185 -->
221e740377ca Uploaded
bgruening
parents:
diff changeset
186 <param name="qupto" type="integer" value="0" label="Only aligns the first N reads or read pairs from the input" help="Default is 0 and means 'no-limit'." />
221e740377ca Uploaded
bgruening
parents:
diff changeset
187 <param name="skip_reads" type="integer" value="0" label="Skip (i.e. do not align) the first N reads or read pairs from the input" />
221e740377ca Uploaded
bgruening
parents:
diff changeset
188
221e740377ca Uploaded
bgruening
parents:
diff changeset
189 <param name="no_discordant" type="boolean" truevalue="--no-discordant" falsevalue="" checked="False" label="Disable looking for discordant alignments if it cannot find any concordant alignments" help="" />
221e740377ca Uploaded
bgruening
parents:
diff changeset
190 <param name="no_mixed" type="boolean" truevalue="--no-mixed" falsevalue="" checked="False" label="Disable Bowtie 2's behaviour to try to find alignments for the individual mates" help="" />
221e740377ca Uploaded
bgruening
parents:
diff changeset
191
221e740377ca Uploaded
bgruening
parents:
diff changeset
192 <param name="suppressed_read_file" type="boolean" truevalue="true" falsevalue="false" checked="False" label="Write ambiguous reads to an extra output file." help="Write all reads which produce more than one valid alignment with the same number of lowest mismatches or other reads that fail to align uniquely." />
221e740377ca Uploaded
bgruening
parents:
diff changeset
193 <param name="unmapped_read_file" type="boolean" truevalue="true" falsevalue="false" checked="False" label="Write all reads that could not be aligned to a file" />
221e740377ca Uploaded
bgruening
parents:
diff changeset
194 <!-- output Options -->
221e740377ca Uploaded
bgruening
parents:
diff changeset
195 <!--
221e740377ca Uploaded
bgruening
parents:
diff changeset
196 <param name="isReportOutput" type="select" label="Offer all report files concatenated in one file.">
221e740377ca Uploaded
bgruening
parents:
diff changeset
197 <option value="yes">yes</option>
221e740377ca Uploaded
bgruening
parents:
diff changeset
198 <option value="no">no</option>
221e740377ca Uploaded
bgruening
parents:
diff changeset
199 </param>
221e740377ca Uploaded
bgruening
parents:
diff changeset
200 -->
221e740377ca Uploaded
bgruening
parents:
diff changeset
201 <!--end output options -->
221e740377ca Uploaded
bgruening
parents:
diff changeset
202 </when> <!-- full -->
221e740377ca Uploaded
bgruening
parents:
diff changeset
203 </conditional> <!-- params -->
221e740377ca Uploaded
bgruening
parents:
diff changeset
204 <param name="suppress_header" type="boolean" truevalue="--suppress-header" falsevalue="" checked="False" label="Suppress the header in the output SAM file" help="Bowtie produces SAM with several lines of header information by default" />
221e740377ca Uploaded
bgruening
parents:
diff changeset
205 </inputs>
221e740377ca Uploaded
bgruening
parents:
diff changeset
206 <outputs>
221e740377ca Uploaded
bgruening
parents:
diff changeset
207 <!-- that does not work
221e740377ca Uploaded
bgruening
parents:
diff changeset
208 <data format="txt" name="report_file" label="${tool.name} on ${on_string}: Report">
221e740377ca Uploaded
bgruening
parents:
diff changeset
209 <filter>str($params.isReportOutput) == "yes"</filter>
221e740377ca Uploaded
bgruening
parents:
diff changeset
210 </data>
221e740377ca Uploaded
bgruening
parents:
diff changeset
211 -->
221e740377ca Uploaded
bgruening
parents:
diff changeset
212 <data format="sam" name="output" label="${tool.name} on ${on_string}: mapped reads">
221e740377ca Uploaded
bgruening
parents:
diff changeset
213 <actions>
221e740377ca Uploaded
bgruening
parents:
diff changeset
214 <conditional name="refGenomeSource.genomeSource">
221e740377ca Uploaded
bgruening
parents:
diff changeset
215 <when value="indexed">
221e740377ca Uploaded
bgruening
parents:
diff changeset
216 <action type="metadata" name="dbkey">
221e740377ca Uploaded
bgruening
parents:
diff changeset
217 <option type="from_data_table" name="bowtie_indexes" column="1" offset="0">
221e740377ca Uploaded
bgruening
parents:
diff changeset
218 <filter type="param_value" column="0" value="#" compare="startswith" keep="False"/>
221e740377ca Uploaded
bgruening
parents:
diff changeset
219 <filter type="param_value" ref="refGenomeSource.index" column="0"/>
221e740377ca Uploaded
bgruening
parents:
diff changeset
220 </option>
221e740377ca Uploaded
bgruening
parents:
diff changeset
221 </action>
221e740377ca Uploaded
bgruening
parents:
diff changeset
222 </when>
221e740377ca Uploaded
bgruening
parents:
diff changeset
223 <when value="history">
221e740377ca Uploaded
bgruening
parents:
diff changeset
224 <action type="metadata" name="dbkey">
221e740377ca Uploaded
bgruening
parents:
diff changeset
225 <option type="from_param" name="refGenomeSource.ownFile" param_attribute="dbkey" />
221e740377ca Uploaded
bgruening
parents:
diff changeset
226 </action>
221e740377ca Uploaded
bgruening
parents:
diff changeset
227 </when>
221e740377ca Uploaded
bgruening
parents:
diff changeset
228 </conditional>
221e740377ca Uploaded
bgruening
parents:
diff changeset
229 </actions>
221e740377ca Uploaded
bgruening
parents:
diff changeset
230 </data>
221e740377ca Uploaded
bgruening
parents:
diff changeset
231
221e740377ca Uploaded
bgruening
parents:
diff changeset
232 <data format="fastq" name="output_suppressed_reads_l" label="${tool.name} on ${on_string}: suppressed reads (L)">
221e740377ca Uploaded
bgruening
parents:
diff changeset
233 <filter>
221e740377ca Uploaded
bgruening
parents:
diff changeset
234 ((
221e740377ca Uploaded
bgruening
parents:
diff changeset
235 params['settingsType'] == "custom" and
221e740377ca Uploaded
bgruening
parents:
diff changeset
236 params['suppressed_read_file'] is True
221e740377ca Uploaded
bgruening
parents:
diff changeset
237 ))
221e740377ca Uploaded
bgruening
parents:
diff changeset
238 </filter>
221e740377ca Uploaded
bgruening
parents:
diff changeset
239 <actions>
221e740377ca Uploaded
bgruening
parents:
diff changeset
240 <conditional name="singlePaired.sPaired">
221e740377ca Uploaded
bgruening
parents:
diff changeset
241 <when value="single">
221e740377ca Uploaded
bgruening
parents:
diff changeset
242 <action type="format">
221e740377ca Uploaded
bgruening
parents:
diff changeset
243 <option type="from_param" name="singlePaired.input_singles" param_attribute="ext" />
221e740377ca Uploaded
bgruening
parents:
diff changeset
244 </action>
221e740377ca Uploaded
bgruening
parents:
diff changeset
245 </when>
221e740377ca Uploaded
bgruening
parents:
diff changeset
246 <when value="paired">
221e740377ca Uploaded
bgruening
parents:
diff changeset
247 <action type="format">
221e740377ca Uploaded
bgruening
parents:
diff changeset
248 <option type="from_param" name="singlePaired.input_mate1" param_attribute="ext" />
221e740377ca Uploaded
bgruening
parents:
diff changeset
249 </action>
221e740377ca Uploaded
bgruening
parents:
diff changeset
250 </when>
221e740377ca Uploaded
bgruening
parents:
diff changeset
251 </conditional>
221e740377ca Uploaded
bgruening
parents:
diff changeset
252 </actions>
221e740377ca Uploaded
bgruening
parents:
diff changeset
253 </data>
221e740377ca Uploaded
bgruening
parents:
diff changeset
254
221e740377ca Uploaded
bgruening
parents:
diff changeset
255 <data format="fastq" name="output_suppressed_reads_r" label="${tool.name} on ${on_string}: suppressed reads (R)">
221e740377ca Uploaded
bgruening
parents:
diff changeset
256 <filter>singlePaired['sPaired'] == "paired"</filter>
221e740377ca Uploaded
bgruening
parents:
diff changeset
257 <filter>params['settingsType'] == "custom"</filter>
221e740377ca Uploaded
bgruening
parents:
diff changeset
258 <filter>params['suppressed_read_file'] is True</filter>
221e740377ca Uploaded
bgruening
parents:
diff changeset
259 <actions>
221e740377ca Uploaded
bgruening
parents:
diff changeset
260 <conditional name="singlePaired.sPaired">
221e740377ca Uploaded
bgruening
parents:
diff changeset
261 <when value="single">
221e740377ca Uploaded
bgruening
parents:
diff changeset
262 <action type="format">
221e740377ca Uploaded
bgruening
parents:
diff changeset
263 <option type="from_param" name="singlePaired.input_singles" param_attribute="ext" />
221e740377ca Uploaded
bgruening
parents:
diff changeset
264 </action>
221e740377ca Uploaded
bgruening
parents:
diff changeset
265 </when>
221e740377ca Uploaded
bgruening
parents:
diff changeset
266 <when value="paired">
221e740377ca Uploaded
bgruening
parents:
diff changeset
267 <action type="format">
221e740377ca Uploaded
bgruening
parents:
diff changeset
268 <option type="from_param" name="singlePaired.input_mate1" param_attribute="ext" />
221e740377ca Uploaded
bgruening
parents:
diff changeset
269 </action>
221e740377ca Uploaded
bgruening
parents:
diff changeset
270 </when>
221e740377ca Uploaded
bgruening
parents:
diff changeset
271 </conditional>
221e740377ca Uploaded
bgruening
parents:
diff changeset
272 </actions>
221e740377ca Uploaded
bgruening
parents:
diff changeset
273 </data>
221e740377ca Uploaded
bgruening
parents:
diff changeset
274
221e740377ca Uploaded
bgruening
parents:
diff changeset
275 <!-- Output unmapped reads -->
221e740377ca Uploaded
bgruening
parents:
diff changeset
276 <data format="fastq" name="output_unmapped_reads_l" label="${tool.name} on ${on_string}: unmapped reads (L)">
221e740377ca Uploaded
bgruening
parents:
diff changeset
277 <filter>
221e740377ca Uploaded
bgruening
parents:
diff changeset
278 ((
221e740377ca Uploaded
bgruening
parents:
diff changeset
279 params['settingsType'] == "custom" and
221e740377ca Uploaded
bgruening
parents:
diff changeset
280 params['unmapped_read_file'] is True
221e740377ca Uploaded
bgruening
parents:
diff changeset
281 ))
221e740377ca Uploaded
bgruening
parents:
diff changeset
282 </filter>
221e740377ca Uploaded
bgruening
parents:
diff changeset
283 <actions>
221e740377ca Uploaded
bgruening
parents:
diff changeset
284 <conditional name="singlePaired.sPaired">
221e740377ca Uploaded
bgruening
parents:
diff changeset
285 <when value="single">
221e740377ca Uploaded
bgruening
parents:
diff changeset
286 <action type="format">
221e740377ca Uploaded
bgruening
parents:
diff changeset
287 <option type="from_param" name="singlePaired.input_singles" param_attribute="ext" />
221e740377ca Uploaded
bgruening
parents:
diff changeset
288 </action>
221e740377ca Uploaded
bgruening
parents:
diff changeset
289 </when>
221e740377ca Uploaded
bgruening
parents:
diff changeset
290 <when value="paired">
221e740377ca Uploaded
bgruening
parents:
diff changeset
291 <action type="format">
221e740377ca Uploaded
bgruening
parents:
diff changeset
292 <option type="from_param" name="singlePaired.input_mate1" param_attribute="ext" />
221e740377ca Uploaded
bgruening
parents:
diff changeset
293 </action>
221e740377ca Uploaded
bgruening
parents:
diff changeset
294 </when>
221e740377ca Uploaded
bgruening
parents:
diff changeset
295 </conditional>
221e740377ca Uploaded
bgruening
parents:
diff changeset
296 </actions>
221e740377ca Uploaded
bgruening
parents:
diff changeset
297 </data>
221e740377ca Uploaded
bgruening
parents:
diff changeset
298 <data format="fastq" name="output_unmapped_reads_r" label="${tool.name} on ${on_string}: unmapped reads (R)">
221e740377ca Uploaded
bgruening
parents:
diff changeset
299 <filter>singlePaired['sPaired'] == "paired"</filter>
221e740377ca Uploaded
bgruening
parents:
diff changeset
300 <filter>params['settingsType'] == "custom"</filter>
221e740377ca Uploaded
bgruening
parents:
diff changeset
301 <filter>params['unmapped_read_file'] is True</filter>
221e740377ca Uploaded
bgruening
parents:
diff changeset
302 <actions>
221e740377ca Uploaded
bgruening
parents:
diff changeset
303 <conditional name="singlePaired.sPaired">
221e740377ca Uploaded
bgruening
parents:
diff changeset
304 <when value="single">
221e740377ca Uploaded
bgruening
parents:
diff changeset
305 <action type="format">
221e740377ca Uploaded
bgruening
parents:
diff changeset
306 <option type="from_param" name="singlePaired.input_singles" param_attribute="ext" />
221e740377ca Uploaded
bgruening
parents:
diff changeset
307 </action>
221e740377ca Uploaded
bgruening
parents:
diff changeset
308 </when>
221e740377ca Uploaded
bgruening
parents:
diff changeset
309 <when value="paired">
221e740377ca Uploaded
bgruening
parents:
diff changeset
310 <action type="format">
221e740377ca Uploaded
bgruening
parents:
diff changeset
311 <option type="from_param" name="singlePaired.input_mate1" param_attribute="ext" />
221e740377ca Uploaded
bgruening
parents:
diff changeset
312 </action>
221e740377ca Uploaded
bgruening
parents:
diff changeset
313 </when>
221e740377ca Uploaded
bgruening
parents:
diff changeset
314 </conditional>
221e740377ca Uploaded
bgruening
parents:
diff changeset
315 </actions>
221e740377ca Uploaded
bgruening
parents:
diff changeset
316 </data>
221e740377ca Uploaded
bgruening
parents:
diff changeset
317
221e740377ca Uploaded
bgruening
parents:
diff changeset
318
221e740377ca Uploaded
bgruening
parents:
diff changeset
319 </outputs>
221e740377ca Uploaded
bgruening
parents:
diff changeset
320
221e740377ca Uploaded
bgruening
parents:
diff changeset
321 <tests>
221e740377ca Uploaded
bgruening
parents:
diff changeset
322 </tests>
221e740377ca Uploaded
bgruening
parents:
diff changeset
323
221e740377ca Uploaded
bgruening
parents:
diff changeset
324 <help>
221e740377ca Uploaded
bgruening
parents:
diff changeset
325
221e740377ca Uploaded
bgruening
parents:
diff changeset
326 **What it does**
221e740377ca Uploaded
bgruening
parents:
diff changeset
327
221e740377ca Uploaded
bgruening
parents:
diff changeset
328 Bismark_ is a bisulfite mapper and methylation caller. Bismark takes in FastA or FastQ files and aligns the
221e740377ca Uploaded
bgruening
parents:
diff changeset
329 reads to a specified bisulfite genome. Sequence reads are transformed into a bisulfite converted forward strand
221e740377ca Uploaded
bgruening
parents:
diff changeset
330 version (C->T conversion) or into a bisulfite treated reverse strand (G->A conversion of the forward strand).
221e740377ca Uploaded
bgruening
parents:
diff changeset
331 Each of these reads is then aligned to a bisulfite treated forward strand index of a reference genome
221e740377ca Uploaded
bgruening
parents:
diff changeset
332 (C->T converted) and a bisulfite treated reverse strand index of the genome (G->A conversion of the
221e740377ca Uploaded
bgruening
parents:
diff changeset
333 forward strand, by doing this alignments will produce the same positions). These 4 instances of Bowtie (1 or 2)
221e740377ca Uploaded
bgruening
parents:
diff changeset
334 are run in parallel. The sequence file(s) are then read in again sequence by sequence to pull out the original
221e740377ca Uploaded
bgruening
parents:
diff changeset
335 sequence from the genome and determine if there were any protected C's present or not.
221e740377ca Uploaded
bgruening
parents:
diff changeset
336
221e740377ca Uploaded
bgruening
parents:
diff changeset
337 .. _Bismark: http://www.bioinformatics.babraham.ac.uk/projects/bismark/
221e740377ca Uploaded
bgruening
parents:
diff changeset
338
221e740377ca Uploaded
bgruening
parents:
diff changeset
339 As of version 0.7.0 Bismark will only run 2 alignment threads for OT and OB in parallel, the 4 strand mode can be
221e740377ca Uploaded
bgruening
parents:
diff changeset
340 re-enabled by using non_directional mode.
221e740377ca Uploaded
bgruening
parents:
diff changeset
341
221e740377ca Uploaded
bgruening
parents:
diff changeset
342 It is developed by Krueger F and Andrews SR. at the Babraham Institute. Krueger F, Andrews SR. (2011) Bismark: a flexible aligner and methylation caller for Bisulfite-Seq applications. Bioinformatics, 27, 1571-2.
221e740377ca Uploaded
bgruening
parents:
diff changeset
343
221e740377ca Uploaded
bgruening
parents:
diff changeset
344 ------
221e740377ca Uploaded
bgruening
parents:
diff changeset
345
221e740377ca Uploaded
bgruening
parents:
diff changeset
346 **Know what you are doing**
221e740377ca Uploaded
bgruening
parents:
diff changeset
347
221e740377ca Uploaded
bgruening
parents:
diff changeset
348 .. class:: warningmark
221e740377ca Uploaded
bgruening
parents:
diff changeset
349
221e740377ca Uploaded
bgruening
parents:
diff changeset
350 There is no such thing (yet) as an automated gearshift in short read mapping. It is all like stick-shift driving in San Francisco. In other words: running this tool with default parameters will probably not give you meaningful results. A way to deal with this is to **understand** the parameters by carefully reading the `documentation`__ and experimenting. Fortunately, Galaxy makes experimenting easy.
221e740377ca Uploaded
bgruening
parents:
diff changeset
351
221e740377ca Uploaded
bgruening
parents:
diff changeset
352 .. __: http://www.bioinformatics.babraham.ac.uk/projects/bismark/
221e740377ca Uploaded
bgruening
parents:
diff changeset
353
221e740377ca Uploaded
bgruening
parents:
diff changeset
354 ------
221e740377ca Uploaded
bgruening
parents:
diff changeset
355
221e740377ca Uploaded
bgruening
parents:
diff changeset
356 **Input formats**
221e740377ca Uploaded
bgruening
parents:
diff changeset
357
221e740377ca Uploaded
bgruening
parents:
diff changeset
358 Bismark accepts files in either Sanger FASTQ format (galaxy type *fastqsanger*), Illumina FASTQ format (galaxy type *fastqillumina*) or FASTA format (galaxy type *fasta*). Use the FASTQ Groomer to prepare your files.
221e740377ca Uploaded
bgruening
parents:
diff changeset
359
221e740377ca Uploaded
bgruening
parents:
diff changeset
360 ------
221e740377ca Uploaded
bgruening
parents:
diff changeset
361
221e740377ca Uploaded
bgruening
parents:
diff changeset
362 **A Note on Built-in Reference Genomes**
221e740377ca Uploaded
bgruening
parents:
diff changeset
363
221e740377ca Uploaded
bgruening
parents:
diff changeset
364 The default variant for all genomes is "Full", defined as all primary chromosomes (or scaffolds/contigs) including mitochondrial plus associated unmapped, plasmid, and other segments. When only one version of a genome is available in this tool, it represents the default "Full" variant. Some genomes will have more than one variant available. The "Canonical Male" or sometimes simply "Canonical" variant contains the primary chromosomes for a genome. For example a human "Canonical" variant contains chr1-chr22, chrX, chrY, and chrM. The "Canonical Female" variant contains the primary chromosomes excluding chrY.
221e740377ca Uploaded
bgruening
parents:
diff changeset
365
221e740377ca Uploaded
bgruening
parents:
diff changeset
366 ------
221e740377ca Uploaded
bgruening
parents:
diff changeset
367
221e740377ca Uploaded
bgruening
parents:
diff changeset
368 The final output of Bismark is in SAM format by default.
221e740377ca Uploaded
bgruening
parents:
diff changeset
369
221e740377ca Uploaded
bgruening
parents:
diff changeset
370 **Outputs**
221e740377ca Uploaded
bgruening
parents:
diff changeset
371
221e740377ca Uploaded
bgruening
parents:
diff changeset
372 The output is in SAM format, and has the following columns::
221e740377ca Uploaded
bgruening
parents:
diff changeset
373
221e740377ca Uploaded
bgruening
parents:
diff changeset
374 Column Description
221e740377ca Uploaded
bgruening
parents:
diff changeset
375 -------- --------------------------------------------------------
221e740377ca Uploaded
bgruening
parents:
diff changeset
376 1 QNAME seq-ID
221e740377ca Uploaded
bgruening
parents:
diff changeset
377 2 FLAG this flag tries to take the strand a bisulfite read
221e740377ca Uploaded
bgruening
parents:
diff changeset
378 originated from into account
221e740377ca Uploaded
bgruening
parents:
diff changeset
379 (this is different from ordinary DNA alignment flags!)
221e740377ca Uploaded
bgruening
parents:
diff changeset
380 3 RNAME chromosome
221e740377ca Uploaded
bgruening
parents:
diff changeset
381 4 POS start position
221e740377ca Uploaded
bgruening
parents:
diff changeset
382 5 MAPQ always 255
221e740377ca Uploaded
bgruening
parents:
diff changeset
383 6 CIGAR extended CIGAR string
221e740377ca Uploaded
bgruening
parents:
diff changeset
384 7 MRNM Mate Reference sequence NaMe ('=' if same as RNAME)
221e740377ca Uploaded
bgruening
parents:
diff changeset
385 8 MPOS 1-based Mate POSition
221e740377ca Uploaded
bgruening
parents:
diff changeset
386 9 ISIZE Inferred insert SIZE
221e740377ca Uploaded
bgruening
parents:
diff changeset
387 10 SEQ query SEQuence on the same strand as the reference
221e740377ca Uploaded
bgruening
parents:
diff changeset
388 11 QUAL Phred33 scale
221e740377ca Uploaded
bgruening
parents:
diff changeset
389 12 NM-tag edit distance to the reference
221e740377ca Uploaded
bgruening
parents:
diff changeset
390 13 XX-tag base-by-base mismatches to the reference.
221e740377ca Uploaded
bgruening
parents:
diff changeset
391 This does not include indels.
221e740377ca Uploaded
bgruening
parents:
diff changeset
392 14 XM-tag methylation call string
221e740377ca Uploaded
bgruening
parents:
diff changeset
393 15 XR-tag read conversion state for the alignment
221e740377ca Uploaded
bgruening
parents:
diff changeset
394 16 XG-tag genome conversion state for the alignment
221e740377ca Uploaded
bgruening
parents:
diff changeset
395
221e740377ca Uploaded
bgruening
parents:
diff changeset
396
221e740377ca Uploaded
bgruening
parents:
diff changeset
397 Each read of paired-end alignments is written out in a separate line in the above format.
221e740377ca Uploaded
bgruening
parents:
diff changeset
398
221e740377ca Uploaded
bgruening
parents:
diff changeset
399
221e740377ca Uploaded
bgruening
parents:
diff changeset
400 It looks like this (scroll sideways to see the entire example)::
221e740377ca Uploaded
bgruening
parents:
diff changeset
401
221e740377ca Uploaded
bgruening
parents:
diff changeset
402 QNAME FLAG RNAME POS MAPQ CIGAR MRNM MPOS ISIZE SEQ QUAL OPT
221e740377ca Uploaded
bgruening
parents:
diff changeset
403 HWI-EAS91_1_30788AAXX:1:1:1761:343 4 * 0 0 * * 0 0 AAAAAAANNAAAAAAAAAAAAAAAAAAAAAAAAAAACNNANNGAGTNGNNNNNNNGCTTCCCACAGNNCTGG hhhhhhh;;hhhhhhhhhhh^hOhhhhghhhfhhhgh;;h;;hhhh;h;;;;;;;hhhhhhghhhh;;Phhh
221e740377ca Uploaded
bgruening
parents:
diff changeset
404 HWI-EAS91_1_30788AAXX:1:1:1578:331 4 * 0 0 * * 0 0 GTATAGANNAATAAGAAAAAAAAAAATGAAGACTTTCNNANNTCTGNANNNNNNNTCTTTTTTCAGNNGTAG hhhhhhh;;hhhhhhhhhhhhhhhhhhhhhhhhhhhh;;h;;hhhh;h;;;;;;;hhhhhhhhhhh;;hhVh
221e740377ca Uploaded
bgruening
parents:
diff changeset
405
221e740377ca Uploaded
bgruening
parents:
diff changeset
406 -------
221e740377ca Uploaded
bgruening
parents:
diff changeset
407
221e740377ca Uploaded
bgruening
parents:
diff changeset
408 **Bismark settings**
221e740377ca Uploaded
bgruening
parents:
diff changeset
409
221e740377ca Uploaded
bgruening
parents:
diff changeset
410 All of the options have a default value. You can change any of them. If any Bismark function is missing please contact the tool author or your Galaxy admin.
221e740377ca Uploaded
bgruening
parents:
diff changeset
411
221e740377ca Uploaded
bgruening
parents:
diff changeset
412 ------
221e740377ca Uploaded
bgruening
parents:
diff changeset
413
221e740377ca Uploaded
bgruening
parents:
diff changeset
414 **Bismark parameter list**
221e740377ca Uploaded
bgruening
parents:
diff changeset
415
221e740377ca Uploaded
bgruening
parents:
diff changeset
416 This is an exhaustive list of Bismark options:
221e740377ca Uploaded
bgruening
parents:
diff changeset
417
221e740377ca Uploaded
bgruening
parents:
diff changeset
418 ------
221e740377ca Uploaded
bgruening
parents:
diff changeset
419
221e740377ca Uploaded
bgruening
parents:
diff changeset
420 **OPTIONS**
221e740377ca Uploaded
bgruening
parents:
diff changeset
421
221e740377ca Uploaded
bgruening
parents:
diff changeset
422
221e740377ca Uploaded
bgruening
parents:
diff changeset
423 Input::
221e740377ca Uploaded
bgruening
parents:
diff changeset
424
221e740377ca Uploaded
bgruening
parents:
diff changeset
425 --singles A comma- or space-separated list of files containing the reads to be aligned (e.g.
221e740377ca Uploaded
bgruening
parents:
diff changeset
426 lane1.fq,lane2.fq lane3.fq). Reads may be a mix of different lengths. Bismark will
221e740377ca Uploaded
bgruening
parents:
diff changeset
427 produce one mapping result and one report file per input file.
221e740377ca Uploaded
bgruening
parents:
diff changeset
428
221e740377ca Uploaded
bgruening
parents:
diff changeset
429 -1 mates1 Comma-separated list of files containing the #1 mates (filename usually includes
221e740377ca Uploaded
bgruening
parents:
diff changeset
430 "_1"), e.g. flyA_1.fq,flyB_1.fq. Sequences specified with this option must
221e740377ca Uploaded
bgruening
parents:
diff changeset
431 correspond file-for-file and read-for-read with those specified in mates2.
221e740377ca Uploaded
bgruening
parents:
diff changeset
432 Reads may be a mix of different lengths. Bismark will produce one mapping result
221e740377ca Uploaded
bgruening
parents:
diff changeset
433 and one report file per paired-end input file pair.
221e740377ca Uploaded
bgruening
parents:
diff changeset
434
221e740377ca Uploaded
bgruening
parents:
diff changeset
435 -2 mates2 Comma-separated list of files containing the #2 mates (filename usually includes
221e740377ca Uploaded
bgruening
parents:
diff changeset
436 "_2"), e.g. flyA_2.fq,flyB_2.fq. Sequences specified with this option must
221e740377ca Uploaded
bgruening
parents:
diff changeset
437 correspond file-for-file and read-for-read with those specified in mates1.
221e740377ca Uploaded
bgruening
parents:
diff changeset
438 Reads may be a mix of different lengths.
221e740377ca Uploaded
bgruening
parents:
diff changeset
439
221e740377ca Uploaded
bgruening
parents:
diff changeset
440 -q/--fastq The query input files (specified as mate1,mate2 or singles) are FASTQ
221e740377ca Uploaded
bgruening
parents:
diff changeset
441 files (usually having extension .fq or .fastq). This is the default. See also
221e740377ca Uploaded
bgruening
parents:
diff changeset
442 --solexa-quals.
221e740377ca Uploaded
bgruening
parents:
diff changeset
443
221e740377ca Uploaded
bgruening
parents:
diff changeset
444 -f/--fasta The query input files (specified as mate1,mate2 or singles) are FASTA
221e740377ca Uploaded
bgruening
parents:
diff changeset
445 files (usually having extension .fa, .mfa, .fna or similar). All quality values
221e740377ca Uploaded
bgruening
parents:
diff changeset
446 are assumed to be 40 on the Phred scale.
221e740377ca Uploaded
bgruening
parents:
diff changeset
447
221e740377ca Uploaded
bgruening
parents:
diff changeset
448 -s/--skip INT Skip (i.e. do not align) the first INT reads or read pairs from the input.
221e740377ca Uploaded
bgruening
parents:
diff changeset
449
221e740377ca Uploaded
bgruening
parents:
diff changeset
450 -u/--upto INT Only aligns the first INT reads or read pairs from the input. Default: no limit.
221e740377ca Uploaded
bgruening
parents:
diff changeset
451
221e740377ca Uploaded
bgruening
parents:
diff changeset
452 --phred33-quals FASTQ qualities are ASCII chars equal to the Phred quality plus 33. Default: on.
221e740377ca Uploaded
bgruening
parents:
diff changeset
453
221e740377ca Uploaded
bgruening
parents:
diff changeset
454 --phred64-quals FASTQ qualities are ASCII chars equal to the Phred quality plus 64. Default: off.
221e740377ca Uploaded
bgruening
parents:
diff changeset
455
221e740377ca Uploaded
bgruening
parents:
diff changeset
456 --solexa-quals Convert FASTQ qualities from solexa-scaled (which can be negative) to phred-scaled
221e740377ca Uploaded
bgruening
parents:
diff changeset
457 (which can't). The formula for conversion is:
221e740377ca Uploaded
bgruening
parents:
diff changeset
458 phred-qual = 10 * log(1 + 10 ** (solexa-qual/10.0)) / log(10). Used with -q. This
221e740377ca Uploaded
bgruening
parents:
diff changeset
459 is usually the right option for use with (unconverted) reads emitted by the GA
221e740377ca Uploaded
bgruening
parents:
diff changeset
460 Pipeline versions prior to 1.3. Works only for Bowtie 1. Default: off.
221e740377ca Uploaded
bgruening
parents:
diff changeset
461
221e740377ca Uploaded
bgruening
parents:
diff changeset
462 --solexa1.3-quals Same as --phred64-quals. This is usually the right option for use with (unconverted)
221e740377ca Uploaded
bgruening
parents:
diff changeset
463 reads emitted by GA Pipeline version 1.3 or later. Default: off.
221e740377ca Uploaded
bgruening
parents:
diff changeset
464
221e740377ca Uploaded
bgruening
parents:
diff changeset
465
221e740377ca Uploaded
bgruening
parents:
diff changeset
466 Alignment::
221e740377ca Uploaded
bgruening
parents:
diff changeset
467
221e740377ca Uploaded
bgruening
parents:
diff changeset
468 -n/--seedmms INT The maximum number of mismatches permitted in the "seed", i.e. the first L base pairs
221e740377ca Uploaded
bgruening
parents:
diff changeset
469 of the read (where L is set with -l/--seedlen). This may be 0, 1, 2 or 3 and the
221e740377ca Uploaded
bgruening
parents:
diff changeset
470 default is 1. This option is only available for Bowtie 1 (for Bowtie 2 see -N).
221e740377ca Uploaded
bgruening
parents:
diff changeset
471
221e740377ca Uploaded
bgruening
parents:
diff changeset
472 -l/--seedlen The "seed length"; i.e., the number of bases of the high quality end of the read to
221e740377ca Uploaded
bgruening
parents:
diff changeset
473 which the -n ceiling applies. The default is 28. Bowtie (and thus Bismark) is faster for
221e740377ca Uploaded
bgruening
parents:
diff changeset
474 larger values of -l. This option is only available for Bowtie 1 (for Bowtie 2 see -L).
221e740377ca Uploaded
bgruening
parents:
diff changeset
475
221e740377ca Uploaded
bgruening
parents:
diff changeset
476 -e/--maqerr INT Maximum permitted total of quality values at all mismatched read positions throughout
221e740377ca Uploaded
bgruening
parents:
diff changeset
477 the entire alignment, not just in the "seed". The default is 70. Like Maq, bowtie rounds
221e740377ca Uploaded
bgruening
parents:
diff changeset
478 quality values to the nearest 10 and saturates at 30. This value is not relevant for
221e740377ca Uploaded
bgruening
parents:
diff changeset
479 Bowtie 2.
221e740377ca Uploaded
bgruening
parents:
diff changeset
480
221e740377ca Uploaded
bgruening
parents:
diff changeset
481 --chunkmbs INT The number of megabytes of memory a given thread is given to store path descriptors in
221e740377ca Uploaded
bgruening
parents:
diff changeset
482 --best mode. Best-first search must keep track of many paths at once to ensure it is
221e740377ca Uploaded
bgruening
parents:
diff changeset
483 always extending the path with the lowest cumulative cost. Bowtie tries to minimize the
221e740377ca Uploaded
bgruening
parents:
diff changeset
484 memory impact of the descriptors, but they can still grow very large in some cases. If
221e740377ca Uploaded
bgruening
parents:
diff changeset
485 you receive an error message saying that chunk memory has been exhausted in --best mode,
221e740377ca Uploaded
bgruening
parents:
diff changeset
486 try adjusting this parameter up to dedicate more memory to the descriptors. This value
221e740377ca Uploaded
bgruening
parents:
diff changeset
487 is not relevant for Bowtie 2. Default: 512.
221e740377ca Uploaded
bgruening
parents:
diff changeset
488
221e740377ca Uploaded
bgruening
parents:
diff changeset
489 -I/--minins INT The minimum insert size for valid paired-end alignments. E.g. if -I 60 is specified and
221e740377ca Uploaded
bgruening
parents:
diff changeset
490 a paired-end alignment consists of two 20-bp alignments in the appropriate orientation
221e740377ca Uploaded
bgruening
parents:
diff changeset
491 with a 20-bp gap between them, that alignment is considered valid (as long as -X is also
221e740377ca Uploaded
bgruening
parents:
diff changeset
492 satisfied). A 19-bp gap would not be valid in that case. Default: 0.
221e740377ca Uploaded
bgruening
parents:
diff changeset
493
221e740377ca Uploaded
bgruening
parents:
diff changeset
494 -X/--maxins INT The maximum insert size for valid paired-end alignments. E.g. if -X 100 is specified and
221e740377ca Uploaded
bgruening
parents:
diff changeset
495 a paired-end alignment consists of two 20-bp alignments in the proper orientation with a
221e740377ca Uploaded
bgruening
parents:
diff changeset
496 60-bp gap between them, that alignment is considered valid (as long as -I is also satisfied).
221e740377ca Uploaded
bgruening
parents:
diff changeset
497 A 61-bp gap would not be valid in that case. Default: 500.
221e740377ca Uploaded
bgruening
parents:
diff changeset
498
221e740377ca Uploaded
bgruening
parents:
diff changeset
499
221e740377ca Uploaded
bgruening
parents:
diff changeset
500
221e740377ca Uploaded
bgruening
parents:
diff changeset
501 Output::
221e740377ca Uploaded
bgruening
parents:
diff changeset
502
221e740377ca Uploaded
bgruening
parents:
diff changeset
503 --non_directional The sequencing library was constructed in a non strand-specific manner, alignments to all four
221e740377ca Uploaded
bgruening
parents:
diff changeset
504 bisulfite strands will be reported. Default: OFF.
221e740377ca Uploaded
bgruening
parents:
diff changeset
505
221e740377ca Uploaded
bgruening
parents:
diff changeset
506 (The current Illumina protocol for BS-Seq is directional, in which case the strands complementary
221e740377ca Uploaded
bgruening
parents:
diff changeset
507 to the original strands are merely theoretical and should not exist in reality. Specifying directional
221e740377ca Uploaded
bgruening
parents:
diff changeset
508 alignments (which is the default) will only run 2 alignment threads to the original top (OT)
221e740377ca Uploaded
bgruening
parents:
diff changeset
509 or bottom (OB) strands in parallel and report these alignments. This is the recommended option
221e740377ca Uploaded
bgruening
parents:
diff changeset
510 for strand-specific libraries).
221e740377ca Uploaded
bgruening
parents:
diff changeset
511
221e740377ca Uploaded
bgruening
parents:
diff changeset
512 --sam-no-hd Suppress SAM header lines (starting with @). This might be useful when very large input files are
221e740377ca Uploaded
bgruening
parents:
diff changeset
513 split up into several smaller files to run concurrently and the output files are to be merged.
221e740377ca Uploaded
bgruening
parents:
diff changeset
514
221e740377ca Uploaded
bgruening
parents:
diff changeset
515 --quiet Print nothing besides alignments.
221e740377ca Uploaded
bgruening
parents:
diff changeset
516
221e740377ca Uploaded
bgruening
parents:
diff changeset
517 --vanilla Performs bisulfite mapping with Bowtie 1 and prints the 'old' output (as in Bismark 0.5.X) instead
221e740377ca Uploaded
bgruening
parents:
diff changeset
518 of SAM format output.
221e740377ca Uploaded
bgruening
parents:
diff changeset
519
221e740377ca Uploaded
bgruening
parents:
diff changeset
520 -un/--unmapped Write all reads that could not be aligned to a file in the output directory. Written reads will
221e740377ca Uploaded
bgruening
parents:
diff changeset
521 appear as they did in the input, without any translation of quality values that may have
221e740377ca Uploaded
bgruening
parents:
diff changeset
522 taken place within Bowtie or Bismark. Paired-end reads will be written to two parallel files with _1
221e740377ca Uploaded
bgruening
parents:
diff changeset
523 and _2 inserted in their filenames, i.e. _unmapped_reads_1.txt and _unmapped_reads_2.txt. Reads
221e740377ca Uploaded
bgruening
parents:
diff changeset
524 with more than one valid alignment with the same number of lowest mismatches (ambiguous mapping)
221e740377ca Uploaded
bgruening
parents:
diff changeset
525 are also written to _unmapped_reads.txt unless the option --ambiguous is specified as well.
221e740377ca Uploaded
bgruening
parents:
diff changeset
526
221e740377ca Uploaded
bgruening
parents:
diff changeset
527 --ambiguous Write all reads which produce more than one valid alignment with the same number of lowest
221e740377ca Uploaded
bgruening
parents:
diff changeset
528 mismatches or other reads that fail to align uniquely to a file in the output directory.
221e740377ca Uploaded
bgruening
parents:
diff changeset
529 Written reads will appear as they did in the input, without any of the translation of quality
221e740377ca Uploaded
bgruening
parents:
diff changeset
530 values that may have taken place within Bowtie or Bismark. Paired-end reads will be written to two
221e740377ca Uploaded
bgruening
parents:
diff changeset
531 parallel files with _1 and _2 inserted in their filenames, i.e. _ambiguous_reads_1.txt and
221e740377ca Uploaded
bgruening
parents:
diff changeset
532 _ambiguous_reads_2.txt. These reads are not written to the file specified with --un.
221e740377ca Uploaded
bgruening
parents:
diff changeset
533
221e740377ca Uploaded
bgruening
parents:
diff changeset
534 -o/--output_dir DIR Write all output files into this directory. By default the output files will be written into
221e740377ca Uploaded
bgruening
parents:
diff changeset
535 the same folder as the input file(s). If the specified folder does not exist, Bismark will attempt
221e740377ca Uploaded
bgruening
parents:
diff changeset
536 to create it first. The path to the output folder can be either relative or absolute.
221e740377ca Uploaded
bgruening
parents:
diff changeset
537
221e740377ca Uploaded
bgruening
parents:
diff changeset
538 --temp_dir DIR Write temporary files to this directory instead of into the same directory as the input files. If
221e740377ca Uploaded
bgruening
parents:
diff changeset
539 the specified folder does not exist, Bismark will attempt to create it first. The path to the
221e740377ca Uploaded
bgruening
parents:
diff changeset
540 temporary folder can be either relative or absolute.
221e740377ca Uploaded
bgruening
parents:
diff changeset
541
221e740377ca Uploaded
bgruening
parents:
diff changeset
542 ------
221e740377ca Uploaded
bgruening
parents:
diff changeset
543
221e740377ca Uploaded
bgruening
parents:
diff changeset
544 Bowtie 2 alignment options::
221e740377ca Uploaded
bgruening
parents:
diff changeset
545
221e740377ca Uploaded
bgruening
parents:
diff changeset
546 -N INT Sets the number of mismatches allowed in a seed alignment during multiseed alignment.
221e740377ca Uploaded
bgruening
parents:
diff changeset
547 Can be set to 0 or 1. Setting this higher makes alignment slower (often much slower)
221e740377ca Uploaded
bgruening
parents:
diff changeset
548 but increases sensitivity. Default: 0. This option is only available for Bowtie 2 (for
221e740377ca Uploaded
bgruening
parents:
diff changeset
549 Bowtie 1 see -n).
221e740377ca Uploaded
bgruening
parents:
diff changeset
550
221e740377ca Uploaded
bgruening
parents:
diff changeset
551 -L INT Sets the length of the seed substrings to align during multiseed alignment. Smaller values
221e740377ca Uploaded
bgruening
parents:
diff changeset
552 make alignment slower but more sensitive. Default: the --sensitive preset of Bowtie 2 is
221e740377ca Uploaded
bgruening
parents:
diff changeset
553 used by default, which sets -L to 20. This option is only available for Bowtie 2 (for
221e740377ca Uploaded
bgruening
parents:
diff changeset
554 Bowtie 1 see -l).
221e740377ca Uploaded
bgruening
parents:
diff changeset
555
221e740377ca Uploaded
bgruening
parents:
diff changeset
556 --ignore-quals When calculating a mismatch penalty, always consider the quality value at the mismatched
221e740377ca Uploaded
bgruening
parents:
diff changeset
557 position to be the highest possible, regardless of the actual value. I.e. input is treated
221e740377ca Uploaded
bgruening
parents:
diff changeset
558 as though all quality values are high. This is also the default behavior when the input
221e740377ca Uploaded
bgruening
parents:
diff changeset
559 doesn't specify quality values (e.g. in -f mode). This option is invariable and on by default.
221e740377ca Uploaded
bgruening
parents:
diff changeset
560
221e740377ca Uploaded
bgruening
parents:
diff changeset
561
221e740377ca Uploaded
bgruening
parents:
diff changeset
562 Bowtie 2 paired-end options::
221e740377ca Uploaded
bgruening
parents:
diff changeset
563
221e740377ca Uploaded
bgruening
parents:
diff changeset
564 --no-mixed This option disables Bowtie 2's behavior to try to find alignments for the individual mates if
221e740377ca Uploaded
bgruening
parents:
diff changeset
565 it cannot find a concordant or discordant alignment for a pair. This option is invariable and
221e740377ca Uploaded
bgruening
parents:
diff changeset
566 on by default.
221e740377ca Uploaded
bgruening
parents:
diff changeset
567
221e740377ca Uploaded
bgruening
parents:
diff changeset
568 --no-discordant Normally, Bowtie 2 looks for discordant alignments if it cannot find any concordant alignments.
221e740377ca Uploaded
bgruening
parents:
diff changeset
569 A discordant alignment is an alignment where both mates align uniquely, but that does not
221e740377ca Uploaded
bgruening
parents:
diff changeset
570 satisfy the paired-end constraints (--fr/--rf/--ff, -I, -X). This option disables that behavior
221e740377ca Uploaded
bgruening
parents:
diff changeset
571 and it is on by default.
221e740377ca Uploaded
bgruening
parents:
diff changeset
572
221e740377ca Uploaded
bgruening
parents:
diff changeset
573
221e740377ca Uploaded
bgruening
parents:
diff changeset
574 Bowtie 2 effort options::
221e740377ca Uploaded
bgruening
parents:
diff changeset
575
221e740377ca Uploaded
bgruening
parents:
diff changeset
576 -D INT Up to INT consecutive seed extension attempts can "fail" before Bowtie 2 moves on, using
221e740377ca Uploaded
bgruening
parents:
diff changeset
577 the alignments found so far. A seed extension "fails" if it does not yield a new best or a
221e740377ca Uploaded
bgruening
parents:
diff changeset
578 new second-best alignment. Default: 15.
221e740377ca Uploaded
bgruening
parents:
diff changeset
579
221e740377ca Uploaded
bgruening
parents:
diff changeset
580 -R INT INT is the maximum number of times Bowtie 2 will "re-seed" reads with repetitive seeds.
221e740377ca Uploaded
bgruening
parents:
diff changeset
581 When "re-seeding," Bowtie 2 simply chooses a new set of seeds (same length, same number of
221e740377ca Uploaded
bgruening
parents:
diff changeset
582 mismatches allowed) at different offsets and searches for more alignments. A read is considered
221e740377ca Uploaded
bgruening
parents:
diff changeset
583 to have repetitive seeds if the total number of seed hits divided by the number of seeds
221e740377ca Uploaded
bgruening
parents:
diff changeset
584 that aligned at least once is greater than 300. Default: 2.
221e740377ca Uploaded
bgruening
parents:
diff changeset
585
221e740377ca Uploaded
bgruening
parents:
diff changeset
586
221e740377ca Uploaded
bgruening
parents:
diff changeset
587 Bowtie 2 Scoring options::
221e740377ca Uploaded
bgruening
parents:
diff changeset
588
221e740377ca Uploaded
bgruening
parents:
diff changeset
589 --score_min "func" Sets a function governing the minimum alignment score needed for an alignment to be considered
221e740377ca Uploaded
bgruening
parents:
diff changeset
590 "valid" (i.e. good enough to report). This is a function of read length. For instance, specifying
221e740377ca Uploaded
bgruening
parents:
diff changeset
591 L,0,-0.2 sets the minimum-score function f to f(x) = 0 + -0.2 * x, where x is the read length.
221e740377ca Uploaded
bgruening
parents:
diff changeset
592 See also: setting function options at http://bowtie-bio.sourceforge.net/bowtie2. The default is
221e740377ca Uploaded
bgruening
parents:
diff changeset
593 L,0,-0.2.
221e740377ca Uploaded
bgruening
parents:
diff changeset
594
221e740377ca Uploaded
bgruening
parents:
diff changeset
595
221e740377ca Uploaded
bgruening
parents:
diff changeset
596 Bowtie 2 Reporting options::
221e740377ca Uploaded
bgruening
parents:
diff changeset
597
221e740377ca Uploaded
bgruening
parents:
diff changeset
598 --most_valid_alignments INT This used to be the Bowtie 2 parameter -M. As of Bowtie 2 version 2.0.0 beta7 the option -M is
221e740377ca Uploaded
bgruening
parents:
diff changeset
599 deprecated. It will be removed in subsequent versions. What used to be called -M mode is still the
221e740377ca Uploaded
bgruening
parents:
diff changeset
600 default mode, but adjusting the -M setting is deprecated. Use the -D and -R options to adjust the
221e740377ca Uploaded
bgruening
parents:
diff changeset
601 effort expended to find valid alignments.
221e740377ca Uploaded
bgruening
parents:
diff changeset
602
221e740377ca Uploaded
bgruening
parents:
diff changeset
603 For reference, this used to be the old (now deprecated) description of -M:
221e740377ca Uploaded
bgruening
parents:
diff changeset
604 Bowtie 2 searches for at most INT+1 distinct, valid alignments for each read. The search terminates when it
221e740377ca Uploaded
bgruening
parents:
diff changeset
605 can't find more distinct valid alignments, or when it finds INT+1 distinct alignments, whichever
221e740377ca Uploaded
bgruening
parents:
diff changeset
606 happens first. Only the best alignment is reported. Information from the other alignments is used to
221e740377ca Uploaded
bgruening
parents:
diff changeset
607 estimate mapping quality and to set SAM optional fields, such as AS:i and XS:i. Increasing -M makes
221e740377ca Uploaded
bgruening
parents:
diff changeset
608 Bowtie 2 slower, but increases the likelihood that it will pick the correct alignment for a read that
221e740377ca Uploaded
bgruening
parents:
diff changeset
609 aligns many places. For reads that have more than INT+1 distinct, valid alignments, Bowtie 2 does not
221e740377ca Uploaded
bgruening
parents:
diff changeset
610 guarantee that the alignment reported is the best possible in terms of alignment score. -M is
221e740377ca Uploaded
bgruening
parents:
diff changeset
611 always used and its default value is set to 10.
221e740377ca Uploaded
bgruening
parents:
diff changeset
612
221e740377ca Uploaded
bgruening
parents:
diff changeset
613 </help>
221e740377ca Uploaded
bgruening
parents:
diff changeset
614 </tool>