annotate bismark_bowtie_wrapper.xml @ 17:73508c5b4273 draft

Uploaded
author bgruening
date Sun, 24 Feb 2013 14:49:36 -0500
parents 221e740377ca
children 862fb59a9a25
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
17
73508c5b4273 Uploaded
bgruening
parents: 9
diff changeset
1 <tool id="bismark_bowtie" name="Bismark" version="0.7.7.3">
9
221e740377ca Uploaded
bgruening
parents:
diff changeset
2 <!-- Wrapper compatible with Bismark version 0.7.7 -->
221e740377ca Uploaded
bgruening
parents:
diff changeset
3 <description>bisulfite mapper (bowtie)</description>
221e740377ca Uploaded
bgruening
parents:
diff changeset
4 <!--<version_command>bismark version</version_command>-->
221e740377ca Uploaded
bgruening
parents:
diff changeset
5 <requirements>
221e740377ca Uploaded
bgruening
parents:
diff changeset
6 <requirement type="set_environment">SCRIPT_PATH</requirement>
221e740377ca Uploaded
bgruening
parents:
diff changeset
7 <requirement type="package" version="0.12.8">bowtie</requirement>
221e740377ca Uploaded
bgruening
parents:
diff changeset
8 <requirement type="package" version="2.0.0-beta7">bowtie2</requirement>
221e740377ca Uploaded
bgruening
parents:
diff changeset
9 </requirements>
221e740377ca Uploaded
bgruening
parents:
diff changeset
10 <parallelism method="basic"></parallelism>
221e740377ca Uploaded
bgruening
parents:
diff changeset
11 <command interpreter="python">
221e740377ca Uploaded
bgruening
parents:
diff changeset
12 bismark_wrapper.py
221e740377ca Uploaded
bgruening
parents:
diff changeset
13
221e740377ca Uploaded
bgruening
parents:
diff changeset
14 ## Change this to accommodate the number of threads you have available.
221e740377ca Uploaded
bgruening
parents:
diff changeset
15 --num-threads 4
221e740377ca Uploaded
bgruening
parents:
diff changeset
16
221e740377ca Uploaded
bgruening
parents:
diff changeset
17 --bismark_path \$SCRIPT_PATH
221e740377ca Uploaded
bgruening
parents:
diff changeset
18
221e740377ca Uploaded
bgruening
parents:
diff changeset
19 ##
221e740377ca Uploaded
bgruening
parents:
diff changeset
20 ## Bismark Genome Preparation, if desired.
221e740377ca Uploaded
bgruening
parents:
diff changeset
21 ##
221e740377ca Uploaded
bgruening
parents:
diff changeset
22
221e740377ca Uploaded
bgruening
parents:
diff changeset
23 ## Handle reference file.
221e740377ca Uploaded
bgruening
parents:
diff changeset
24 #if $refGenomeSource.genomeSource == "history":
221e740377ca Uploaded
bgruening
parents:
diff changeset
25 --own-file=$refGenomeSource.ownFile
221e740377ca Uploaded
bgruening
parents:
diff changeset
26 #else:
221e740377ca Uploaded
bgruening
parents:
diff changeset
27 --indexes-path ${refGenomeSource.index.fields.path}
221e740377ca Uploaded
bgruening
parents:
diff changeset
28 #end if
221e740377ca Uploaded
bgruening
parents:
diff changeset
29
221e740377ca Uploaded
bgruening
parents:
diff changeset
30
221e740377ca Uploaded
bgruening
parents:
diff changeset
31 ##
221e740377ca Uploaded
bgruening
parents:
diff changeset
32 ## Input parameters
221e740377ca Uploaded
bgruening
parents:
diff changeset
33 ##
221e740377ca Uploaded
bgruening
parents:
diff changeset
34
221e740377ca Uploaded
bgruening
parents:
diff changeset
35
221e740377ca Uploaded
bgruening
parents:
diff changeset
36 #if $singlePaired.sPaired == "single":
221e740377ca Uploaded
bgruening
parents:
diff changeset
37 --single-paired $singlePaired.input_singles
221e740377ca Uploaded
bgruening
parents:
diff changeset
38
221e740377ca Uploaded
bgruening
parents:
diff changeset
39 #if $singlePaired.input_singles.ext == "fastqillumina":
221e740377ca Uploaded
bgruening
parents:
diff changeset
40 --phred64-quals
221e740377ca Uploaded
bgruening
parents:
diff changeset
41 --fastq
221e740377ca Uploaded
bgruening
parents:
diff changeset
42 #elif $singlePaired.input_singles.ext == "fastqsanger":
221e740377ca Uploaded
bgruening
parents:
diff changeset
43 --fastq
221e740377ca Uploaded
bgruening
parents:
diff changeset
44 #elif $singlePaired.input_singles.ext == "fasta":
221e740377ca Uploaded
bgruening
parents:
diff changeset
45 --fasta
221e740377ca Uploaded
bgruening
parents:
diff changeset
46 #end if
221e740377ca Uploaded
bgruening
parents:
diff changeset
47 #else:
221e740377ca Uploaded
bgruening
parents:
diff changeset
48 --mate-paired
221e740377ca Uploaded
bgruening
parents:
diff changeset
49 --mate1 $singlePaired.input_mate1
221e740377ca Uploaded
bgruening
parents:
diff changeset
50 --mate2 $singlePaired.input_mate2
221e740377ca Uploaded
bgruening
parents:
diff changeset
51
221e740377ca Uploaded
bgruening
parents:
diff changeset
52 #if $singlePaired.input_mate1.ext == "fastqillumina":
221e740377ca Uploaded
bgruening
parents:
diff changeset
53 --phred64-quals
221e740377ca Uploaded
bgruening
parents:
diff changeset
54 --fastq
221e740377ca Uploaded
bgruening
parents:
diff changeset
55 #elif $singlePaired.input_mate1.ext == "fastqsanger":
221e740377ca Uploaded
bgruening
parents:
diff changeset
56 --fastq
221e740377ca Uploaded
bgruening
parents:
diff changeset
57 #elif $singlePaired.input_mate1.ext == "fasta":
221e740377ca Uploaded
bgruening
parents:
diff changeset
58 --fasta
221e740377ca Uploaded
bgruening
parents:
diff changeset
59 #end if
221e740377ca Uploaded
bgruening
parents:
diff changeset
60
221e740377ca Uploaded
bgruening
parents:
diff changeset
61 -I $singlePaired.minInsert
221e740377ca Uploaded
bgruening
parents:
diff changeset
62 -X $singlePaired.maxInsert
221e740377ca Uploaded
bgruening
parents:
diff changeset
63 #end if
221e740377ca Uploaded
bgruening
parents:
diff changeset
64
221e740377ca Uploaded
bgruening
parents:
diff changeset
65
221e740377ca Uploaded
bgruening
parents:
diff changeset
66 ## for now hardcode the value for the required memory per thread in --best mode
221e740377ca Uploaded
bgruening
parents:
diff changeset
67 --chunkmbs 512
221e740377ca Uploaded
bgruening
parents:
diff changeset
68
221e740377ca Uploaded
bgruening
parents:
diff changeset
69
221e740377ca Uploaded
bgruening
parents:
diff changeset
70 #if $params.settingsType == "custom":
221e740377ca Uploaded
bgruening
parents:
diff changeset
71
221e740377ca Uploaded
bgruening
parents:
diff changeset
72 ## default 20
221e740377ca Uploaded
bgruening
parents:
diff changeset
73 --seed-len $params.seed_len
221e740377ca Uploaded
bgruening
parents:
diff changeset
74 ## default 0
221e740377ca Uploaded
bgruening
parents:
diff changeset
75 --seed-mismatches $params.seed_mismatches
17
73508c5b4273 Uploaded
bgruening
parents: 9
diff changeset
76
9
221e740377ca Uploaded
bgruening
parents:
diff changeset
77 ## default 70
221e740377ca Uploaded
bgruening
parents:
diff changeset
78 ##--maqerr $params.maqerr
221e740377ca Uploaded
bgruening
parents:
diff changeset
79
221e740377ca Uploaded
bgruening
parents:
diff changeset
80 ## default unlimited
221e740377ca Uploaded
bgruening
parents:
diff changeset
81 #if $params.qupto != 0:
221e740377ca Uploaded
bgruening
parents:
diff changeset
82 --qupto $params.qupto
221e740377ca Uploaded
bgruening
parents:
diff changeset
83 #end if
221e740377ca Uploaded
bgruening
parents:
diff changeset
84 #if $params.skip_reads != 0:
221e740377ca Uploaded
bgruening
parents:
diff changeset
85 --skip-reads $params.skip_reads
221e740377ca Uploaded
bgruening
parents:
diff changeset
86 #end if
221e740377ca Uploaded
bgruening
parents:
diff changeset
87
221e740377ca Uploaded
bgruening
parents:
diff changeset
88 ###if str($params.isReportOutput) == "yes":
221e740377ca Uploaded
bgruening
parents:
diff changeset
89 ## --output-report-file $report_file
221e740377ca Uploaded
bgruening
parents:
diff changeset
90 ###end if
221e740377ca Uploaded
bgruening
parents:
diff changeset
91
221e740377ca Uploaded
bgruening
parents:
diff changeset
92 #end if
221e740377ca Uploaded
bgruening
parents:
diff changeset
93
221e740377ca Uploaded
bgruening
parents:
diff changeset
94 ##
221e740377ca Uploaded
bgruening
parents:
diff changeset
95 ## Output parameters.
221e740377ca Uploaded
bgruening
parents:
diff changeset
96 ##
221e740377ca Uploaded
bgruening
parents:
diff changeset
97 --output $output
221e740377ca Uploaded
bgruening
parents:
diff changeset
98 $suppress_header
221e740377ca Uploaded
bgruening
parents:
diff changeset
99
221e740377ca Uploaded
bgruening
parents:
diff changeset
100 #if str( $singlePaired.sPaired ) == "single"
221e740377ca Uploaded
bgruening
parents:
diff changeset
101 #if $output_unmapped_reads_l
221e740377ca Uploaded
bgruening
parents:
diff changeset
102 --output-unmapped-reads $output_unmapped_reads_l
221e740377ca Uploaded
bgruening
parents:
diff changeset
103 #end if
221e740377ca Uploaded
bgruening
parents:
diff changeset
104 #if $output_suppressed_reads_l
221e740377ca Uploaded
bgruening
parents:
diff changeset
105 --output-suppressed-reads $output_suppressed_reads_l
221e740377ca Uploaded
bgruening
parents:
diff changeset
106 #end if
221e740377ca Uploaded
bgruening
parents:
diff changeset
107 #else
221e740377ca Uploaded
bgruening
parents:
diff changeset
108 #if $output_unmapped_reads_l and $output_unmapped_reads_r
221e740377ca Uploaded
bgruening
parents:
diff changeset
109 --output-unmapped-reads-l $output_unmapped_reads_l
221e740377ca Uploaded
bgruening
parents:
diff changeset
110 --output-unmapped-reads-r $output_unmapped_reads_r
221e740377ca Uploaded
bgruening
parents:
diff changeset
111 #end if
221e740377ca Uploaded
bgruening
parents:
diff changeset
112 #if $output_suppressed_reads_l and $output_suppressed_reads_l
221e740377ca Uploaded
bgruening
parents:
diff changeset
113 --output-suppressed-reads-l $output_suppressed_reads_l
221e740377ca Uploaded
bgruening
parents:
diff changeset
114 --output-suppressed-reads-r $output_suppressed_reads_r
221e740377ca Uploaded
bgruening
parents:
diff changeset
115 #end if
221e740377ca Uploaded
bgruening
parents:
diff changeset
116 #end if
221e740377ca Uploaded
bgruening
parents:
diff changeset
117
221e740377ca Uploaded
bgruening
parents:
diff changeset
118 </command>
221e740377ca Uploaded
bgruening
parents:
diff changeset
119 <inputs>
221e740377ca Uploaded
bgruening
parents:
diff changeset
120 <conditional name="refGenomeSource">
221e740377ca Uploaded
bgruening
parents:
diff changeset
121 <param name="genomeSource" type="select" label="Will you select a reference genome from your history or use a built-in index?" help="Built-ins were indexed using default options">
221e740377ca Uploaded
bgruening
parents:
diff changeset
122 <option value="indexed">Use a built-in index</option>
221e740377ca Uploaded
bgruening
parents:
diff changeset
123 <option value="history">Use one from the history</option>
221e740377ca Uploaded
bgruening
parents:
diff changeset
124 </param>
221e740377ca Uploaded
bgruening
parents:
diff changeset
125 <when value="indexed">
221e740377ca Uploaded
bgruening
parents:
diff changeset
126 <param name="index" type="select" label="Select a reference genome" help="If your genome of interest is not listed, contact your Galaxy admin">
221e740377ca Uploaded
bgruening
parents:
diff changeset
127 <options from_data_table="bowtie_indexes">
221e740377ca Uploaded
bgruening
parents:
diff changeset
128 <filter type="sort_by" column="2"/>
221e740377ca Uploaded
bgruening
parents:
diff changeset
129 <validator type="no_options" message="No indexes are available for the selected input dataset"/>
221e740377ca Uploaded
bgruening
parents:
diff changeset
130 </options>
221e740377ca Uploaded
bgruening
parents:
diff changeset
131 </param>
221e740377ca Uploaded
bgruening
parents:
diff changeset
132 </when> <!-- build-in -->
221e740377ca Uploaded
bgruening
parents:
diff changeset
133 <when value="history">
221e740377ca Uploaded
bgruening
parents:
diff changeset
134 <param name="ownFile" type="data" format="fasta" metadata_name="dbkey" label="Select the reference genome" />
221e740377ca Uploaded
bgruening
parents:
diff changeset
135 </when> <!-- history -->
221e740377ca Uploaded
bgruening
parents:
diff changeset
136 </conditional> <!-- refGenomeSource -->
221e740377ca Uploaded
bgruening
parents:
diff changeset
137
221e740377ca Uploaded
bgruening
parents:
diff changeset
138 <!-- Input Parameters -->
221e740377ca Uploaded
bgruening
parents:
diff changeset
139 <conditional name="singlePaired">
221e740377ca Uploaded
bgruening
parents:
diff changeset
140 <param name="sPaired" type="select" label="Is this library mate-paired?">
221e740377ca Uploaded
bgruening
parents:
diff changeset
141 <option value="single">Single-end</option>
221e740377ca Uploaded
bgruening
parents:
diff changeset
142 <option value="paired">Paired-end</option>
221e740377ca Uploaded
bgruening
parents:
diff changeset
143 </param>
221e740377ca Uploaded
bgruening
parents:
diff changeset
144 <when value="single">
221e740377ca Uploaded
bgruening
parents:
diff changeset
145 <param name="input_singles" type="data" format="fastqsanger,fastqillumina,fastq,fasta" label="FASTQ/FASTA file" help="FASTQ or FASTA files." />
221e740377ca Uploaded
bgruening
parents:
diff changeset
146 </when>
221e740377ca Uploaded
bgruening
parents:
diff changeset
147 <when value="paired">
221e740377ca Uploaded
bgruening
parents:
diff changeset
148 <param name="input_mate1" type="data" format="fastqsanger,fastqillumina,fastq,fasta" label="FASTQ/FASTA file" help="FASTQ or FASTA files." />
221e740377ca Uploaded
bgruening
parents:
diff changeset
149 <param name="input_mate2" type="data" format="fastqsanger,fastqillumina,fastq,fasta" label="FASTQ/FASTA file" help="FASTQ or FASTA files." />
221e740377ca Uploaded
bgruening
parents:
diff changeset
150 <param name="minInsert" type="integer" value="0" label="Minimum insert size for valid paired-end alignments" />
221e740377ca Uploaded
bgruening
parents:
diff changeset
151 <param name="maxInsert" type="integer" value="250" label="Maximum insert size for valid paired-end alignments" />
221e740377ca Uploaded
bgruening
parents:
diff changeset
152 </when>
221e740377ca Uploaded
bgruening
parents:
diff changeset
153 </conditional>
221e740377ca Uploaded
bgruening
parents:
diff changeset
154
221e740377ca Uploaded
bgruening
parents:
diff changeset
155
221e740377ca Uploaded
bgruening
parents:
diff changeset
156 <conditional name="params">
221e740377ca Uploaded
bgruening
parents:
diff changeset
157 <param name="settingsType" type="select" label="Bismark settings to use" help="You can use the default settings or set custom values for any of Bismark's parameters.">
221e740377ca Uploaded
bgruening
parents:
diff changeset
158 <option value="default">Use Defaults</option>
221e740377ca Uploaded
bgruening
parents:
diff changeset
159 <option value="custom">Full parameter list</option>
221e740377ca Uploaded
bgruening
parents:
diff changeset
160 </param>
221e740377ca Uploaded
bgruening
parents:
diff changeset
161 <when value="default" />
221e740377ca Uploaded
bgruening
parents:
diff changeset
162 <!-- Full/advanced params. -->
221e740377ca Uploaded
bgruening
parents:
diff changeset
163 <when value="custom">
221e740377ca Uploaded
bgruening
parents:
diff changeset
164 <!-- -n -->
221e740377ca Uploaded
bgruening
parents:
diff changeset
165 <param name="seed_mismatches" type="select" label="The maximum number of mismatches permitted in the 'seed'.">
221e740377ca Uploaded
bgruening
parents:
diff changeset
166 <option value="0">0</option>
221e740377ca Uploaded
bgruening
parents:
diff changeset
167 <option value="1">1</option>
221e740377ca Uploaded
bgruening
parents:
diff changeset
168 <option value="2" selected="true">2</option>
221e740377ca Uploaded
bgruening
parents:
diff changeset
169 <option value="3">3</option>
221e740377ca Uploaded
bgruening
parents:
diff changeset
170 </param>
221e740377ca Uploaded
bgruening
parents:
diff changeset
171 <!-- -l -->
221e740377ca Uploaded
bgruening
parents:
diff changeset
172 <param name="seed_len" type="integer" value="28" label="The 'seed length'; The number of bases of the high quality end of the read to which the maximum number of mismatches applies." />
221e740377ca Uploaded
bgruening
parents:
diff changeset
173 <!--
221e740377ca Uploaded
bgruening
parents:
diff changeset
174 <param name="maqerr" type="integer" value="70" label="Maximum permitted total of quality values at all mismatched read positions throughout the entire alignment, not just in the 'seed'." />
221e740377ca Uploaded
bgruening
parents:
diff changeset
175 -->
221e740377ca Uploaded
bgruening
parents:
diff changeset
176 <param name="qupto" type="integer" value="0" label="Only aligns the first N reads or read pairs from the input" help="Default is 0 and means 'no-limit'." />
221e740377ca Uploaded
bgruening
parents:
diff changeset
177 <param name="skip_reads" type="integer" value="0" label="Skip (i.e. do not align) the first N reads or read pairs from the input" />
221e740377ca Uploaded
bgruening
parents:
diff changeset
178
221e740377ca Uploaded
bgruening
parents:
diff changeset
179 <param name="suppressed_read_file" type="boolean" truevalue="true" falsevalue="false" checked="False" label="Write ambiguous reads to an extra output file." help="Write all reads which produce more than one valid alignment with the same number of lowest mismatches or other reads that fail to align uniquely." />
221e740377ca Uploaded
bgruening
parents:
diff changeset
180 <param name="unmapped_read_file" type="boolean" truevalue="true" falsevalue="false" checked="False" label="Write all reads that could not be aligned to a file" />
221e740377ca Uploaded
bgruening
parents:
diff changeset
181 <!-- output Options -->
221e740377ca Uploaded
bgruening
parents:
diff changeset
182 <!--
221e740377ca Uploaded
bgruening
parents:
diff changeset
183 <param name="isReportOutput" type="select" label="Offer all report files concatenated in one file.">
221e740377ca Uploaded
bgruening
parents:
diff changeset
184 <option value="yes">yes</option>
221e740377ca Uploaded
bgruening
parents:
diff changeset
185 <option value="no">no</option>
221e740377ca Uploaded
bgruening
parents:
diff changeset
186 </param>
221e740377ca Uploaded
bgruening
parents:
diff changeset
187 -->
221e740377ca Uploaded
bgruening
parents:
diff changeset
188 <!--end output options -->
221e740377ca Uploaded
bgruening
parents:
diff changeset
189 </when> <!-- full -->
221e740377ca Uploaded
bgruening
parents:
diff changeset
190 </conditional> <!-- params -->
221e740377ca Uploaded
bgruening
parents:
diff changeset
191 <param name="suppress_header" type="boolean" truevalue="--suppress-header" falsevalue="" checked="False" label="Suppress the header in the output SAM file" help="Bowtie produces SAM with several lines of header information by default" />
221e740377ca Uploaded
bgruening
parents:
diff changeset
192 </inputs>
221e740377ca Uploaded
bgruening
parents:
diff changeset
193 <outputs>
221e740377ca Uploaded
bgruening
parents:
diff changeset
194 <!-- that does not work
221e740377ca Uploaded
bgruening
parents:
diff changeset
195 <data format="txt" name="report_file" label="${tool.name} on ${on_string}: Report">
221e740377ca Uploaded
bgruening
parents:
diff changeset
196 <filter>str($params.isReportOutput) == "yes"</filter>
221e740377ca Uploaded
bgruening
parents:
diff changeset
197 </data>
221e740377ca Uploaded
bgruening
parents:
diff changeset
198 -->
221e740377ca Uploaded
bgruening
parents:
diff changeset
199 <data format="sam" name="output" label="${tool.name} on ${on_string}: mapped reads">
221e740377ca Uploaded
bgruening
parents:
diff changeset
200 <actions>
221e740377ca Uploaded
bgruening
parents:
diff changeset
201 <conditional name="refGenomeSource.genomeSource">
221e740377ca Uploaded
bgruening
parents:
diff changeset
202 <when value="indexed">
221e740377ca Uploaded
bgruening
parents:
diff changeset
203 <action type="metadata" name="dbkey">
221e740377ca Uploaded
bgruening
parents:
diff changeset
204 <option type="from_data_table" name="bowtie2_indexes" column="1" offset="0">
221e740377ca Uploaded
bgruening
parents:
diff changeset
205 <filter type="param_value" column="0" value="#" compare="startswith" keep="False"/>
221e740377ca Uploaded
bgruening
parents:
diff changeset
206 <filter type="param_value" ref="refGenomeSource.index" column="0"/>
221e740377ca Uploaded
bgruening
parents:
diff changeset
207 </option>
221e740377ca Uploaded
bgruening
parents:
diff changeset
208 </action>
221e740377ca Uploaded
bgruening
parents:
diff changeset
209 </when>
221e740377ca Uploaded
bgruening
parents:
diff changeset
210 <when value="history">
221e740377ca Uploaded
bgruening
parents:
diff changeset
211 <action type="metadata" name="dbkey">
221e740377ca Uploaded
bgruening
parents:
diff changeset
212 <option type="from_param" name="refGenomeSource.ownFile" param_attribute="dbkey" />
221e740377ca Uploaded
bgruening
parents:
diff changeset
213 </action>
221e740377ca Uploaded
bgruening
parents:
diff changeset
214 </when>
221e740377ca Uploaded
bgruening
parents:
diff changeset
215 </conditional>
221e740377ca Uploaded
bgruening
parents:
diff changeset
216 </actions>
221e740377ca Uploaded
bgruening
parents:
diff changeset
217 </data>
221e740377ca Uploaded
bgruening
parents:
diff changeset
218
221e740377ca Uploaded
bgruening
parents:
diff changeset
219 <data format="fastq" name="output_suppressed_reads_l" label="${tool.name} on ${on_string}: suppressed reads (L)">
221e740377ca Uploaded
bgruening
parents:
diff changeset
220 <filter>
221e740377ca Uploaded
bgruening
parents:
diff changeset
221 ((
221e740377ca Uploaded
bgruening
parents:
diff changeset
222 params['settingsType'] == "custom" and
221e740377ca Uploaded
bgruening
parents:
diff changeset
223 params['suppressed_read_file'] is True
221e740377ca Uploaded
bgruening
parents:
diff changeset
224 ))
221e740377ca Uploaded
bgruening
parents:
diff changeset
225 </filter>
221e740377ca Uploaded
bgruening
parents:
diff changeset
226 <actions>
221e740377ca Uploaded
bgruening
parents:
diff changeset
227 <conditional name="singlePaired.sPaired">
221e740377ca Uploaded
bgruening
parents:
diff changeset
228 <when value="single">
221e740377ca Uploaded
bgruening
parents:
diff changeset
229 <action type="format">
221e740377ca Uploaded
bgruening
parents:
diff changeset
230 <option type="from_param" name="singlePaired.input_singles" param_attribute="ext" />
221e740377ca Uploaded
bgruening
parents:
diff changeset
231 </action>
221e740377ca Uploaded
bgruening
parents:
diff changeset
232 </when>
221e740377ca Uploaded
bgruening
parents:
diff changeset
233 <when value="paired">
221e740377ca Uploaded
bgruening
parents:
diff changeset
234 <action type="format">
221e740377ca Uploaded
bgruening
parents:
diff changeset
235 <option type="from_param" name="singlePaired.input_mate1" param_attribute="ext" />
221e740377ca Uploaded
bgruening
parents:
diff changeset
236 </action>
221e740377ca Uploaded
bgruening
parents:
diff changeset
237 </when>
221e740377ca Uploaded
bgruening
parents:
diff changeset
238 </conditional>
221e740377ca Uploaded
bgruening
parents:
diff changeset
239 </actions>
221e740377ca Uploaded
bgruening
parents:
diff changeset
240 </data>
221e740377ca Uploaded
bgruening
parents:
diff changeset
241
221e740377ca Uploaded
bgruening
parents:
diff changeset
242 <data format="fastq" name="output_suppressed_reads_r" label="${tool.name} on ${on_string}: suppressed reads (R)">
221e740377ca Uploaded
bgruening
parents:
diff changeset
243 <filter>singlePaired['sPaired'] == "paired"</filter>
221e740377ca Uploaded
bgruening
parents:
diff changeset
244 <filter>params['settingsType'] == "custom"</filter>
221e740377ca Uploaded
bgruening
parents:
diff changeset
245 <filter>params['supressed_read_file'] is True</filter>
221e740377ca Uploaded
bgruening
parents:
diff changeset
246 <actions>
221e740377ca Uploaded
bgruening
parents:
diff changeset
247 <conditional name="singlePaired.sPaired">
221e740377ca Uploaded
bgruening
parents:
diff changeset
248 <when value="single">
221e740377ca Uploaded
bgruening
parents:
diff changeset
249 <action type="format">
221e740377ca Uploaded
bgruening
parents:
diff changeset
250 <option type="from_param" name="singlePaired.input_singles" param_attribute="ext" />
221e740377ca Uploaded
bgruening
parents:
diff changeset
251 </action>
221e740377ca Uploaded
bgruening
parents:
diff changeset
252 </when>
221e740377ca Uploaded
bgruening
parents:
diff changeset
253 <when value="paired">
221e740377ca Uploaded
bgruening
parents:
diff changeset
254 <action type="format">
221e740377ca Uploaded
bgruening
parents:
diff changeset
255 <option type="from_param" name="singlePaired.input_mate1" param_attribute="ext" />
221e740377ca Uploaded
bgruening
parents:
diff changeset
256 </action>
221e740377ca Uploaded
bgruening
parents:
diff changeset
257 </when>
221e740377ca Uploaded
bgruening
parents:
diff changeset
258 </conditional>
221e740377ca Uploaded
bgruening
parents:
diff changeset
259 </actions>
221e740377ca Uploaded
bgruening
parents:
diff changeset
260 </data>
221e740377ca Uploaded
bgruening
parents:
diff changeset
261
221e740377ca Uploaded
bgruening
parents:
diff changeset
262 <!-- Outout unmapped reads -->
221e740377ca Uploaded
bgruening
parents:
diff changeset
263 <data format="fastq" name="output_unmapped_reads_l" label="${tool.name} on ${on_string}: unmapped reads (L)">
221e740377ca Uploaded
bgruening
parents:
diff changeset
264 <filter>
221e740377ca Uploaded
bgruening
parents:
diff changeset
265 ((
221e740377ca Uploaded
bgruening
parents:
diff changeset
266 params['settingsType'] == "custom" and
221e740377ca Uploaded
bgruening
parents:
diff changeset
267 params['unmapped_read_file'] is True
221e740377ca Uploaded
bgruening
parents:
diff changeset
268 ))
221e740377ca Uploaded
bgruening
parents:
diff changeset
269 </filter>
221e740377ca Uploaded
bgruening
parents:
diff changeset
270 <actions>
221e740377ca Uploaded
bgruening
parents:
diff changeset
271 <conditional name="singlePaired.sPaired">
221e740377ca Uploaded
bgruening
parents:
diff changeset
272 <when value="single">
221e740377ca Uploaded
bgruening
parents:
diff changeset
273 <action type="format">
221e740377ca Uploaded
bgruening
parents:
diff changeset
274 <option type="from_param" name="singlePaired.input_singles" param_attribute="ext" />
221e740377ca Uploaded
bgruening
parents:
diff changeset
275 </action>
221e740377ca Uploaded
bgruening
parents:
diff changeset
276 </when>
221e740377ca Uploaded
bgruening
parents:
diff changeset
277 <when value="paired">
221e740377ca Uploaded
bgruening
parents:
diff changeset
278 <action type="format">
221e740377ca Uploaded
bgruening
parents:
diff changeset
279 <option type="from_param" name="singlePaired.input_mate1" param_attribute="ext" />
221e740377ca Uploaded
bgruening
parents:
diff changeset
280 </action>
221e740377ca Uploaded
bgruening
parents:
diff changeset
281 </when>
221e740377ca Uploaded
bgruening
parents:
diff changeset
282 </conditional>
221e740377ca Uploaded
bgruening
parents:
diff changeset
283 </actions>
221e740377ca Uploaded
bgruening
parents:
diff changeset
284 </data>
221e740377ca Uploaded
bgruening
parents:
diff changeset
285 <data format="fastq" name="output_unmapped_reads_r" label="${tool.name} on ${on_string}: unmapped reads (R)">
221e740377ca Uploaded
bgruening
parents:
diff changeset
286 <filter>singlePaired['sPaired'] == "paired"</filter>
221e740377ca Uploaded
bgruening
parents:
diff changeset
287 <filter>params['settingsType'] == "custom"</filter>
221e740377ca Uploaded
bgruening
parents:
diff changeset
288 <filter>params['unmapped_read_file'] is True</filter>
221e740377ca Uploaded
bgruening
parents:
diff changeset
289 <actions>
221e740377ca Uploaded
bgruening
parents:
diff changeset
290 <conditional name="singlePaired.sPaired">
221e740377ca Uploaded
bgruening
parents:
diff changeset
291 <when value="single">
221e740377ca Uploaded
bgruening
parents:
diff changeset
292 <action type="format">
221e740377ca Uploaded
bgruening
parents:
diff changeset
293 <option type="from_param" name="singlePaired.input_singles" param_attribute="ext" />
221e740377ca Uploaded
bgruening
parents:
diff changeset
294 </action>
221e740377ca Uploaded
bgruening
parents:
diff changeset
295 </when>
221e740377ca Uploaded
bgruening
parents:
diff changeset
296 <when value="paired">
221e740377ca Uploaded
bgruening
parents:
diff changeset
297 <action type="format">
221e740377ca Uploaded
bgruening
parents:
diff changeset
298 <option type="from_param" name="singlePaired.input_mate1" param_attribute="ext" />
221e740377ca Uploaded
bgruening
parents:
diff changeset
299 </action>
221e740377ca Uploaded
bgruening
parents:
diff changeset
300 </when>
221e740377ca Uploaded
bgruening
parents:
diff changeset
301 </conditional>
221e740377ca Uploaded
bgruening
parents:
diff changeset
302 </actions>
221e740377ca Uploaded
bgruening
parents:
diff changeset
303 </data>
221e740377ca Uploaded
bgruening
parents:
diff changeset
304
221e740377ca Uploaded
bgruening
parents:
diff changeset
305
221e740377ca Uploaded
bgruening
parents:
diff changeset
306 </outputs>
221e740377ca Uploaded
bgruening
parents:
diff changeset
307
221e740377ca Uploaded
bgruening
parents:
diff changeset
308 <tests>
221e740377ca Uploaded
bgruening
parents:
diff changeset
309 </tests>
221e740377ca Uploaded
bgruening
parents:
diff changeset
310
221e740377ca Uploaded
bgruening
parents:
diff changeset
311 <help>
221e740377ca Uploaded
bgruening
parents:
diff changeset
312
221e740377ca Uploaded
bgruening
parents:
diff changeset
313 **What it does**
221e740377ca Uploaded
bgruening
parents:
diff changeset
314
221e740377ca Uploaded
bgruening
parents:
diff changeset
315 Bismark_ is a bisulfite mapper and methylation caller. Bismark takes in FastA or FastQ files and aligns the
221e740377ca Uploaded
bgruening
parents:
diff changeset
316 reads to a specified bisulfite genome. Sequence reads are transformed into a bisulfite converted forward strand
221e740377ca Uploaded
bgruening
parents:
diff changeset
317 version (C->T conversion) or into a bisulfite treated reverse strand (G->A conversion of the forward strand).
221e740377ca Uploaded
bgruening
parents:
diff changeset
318 Each of these reads are then aligned to bisulfite treated forward strand index of a reference genome
221e740377ca Uploaded
bgruening
parents:
diff changeset
319 (C->T converted) and a bisulfite treated reverse strand index of the genome (G->A conversion of the
221e740377ca Uploaded
bgruening
parents:
diff changeset
320 forward strand, by doing this alignments will produce the same positions). These 4 instances of Bowtie (1 or 2)
221e740377ca Uploaded
bgruening
parents:
diff changeset
321 are run in parallel. The sequence file(s) are then read in again sequence by sequence to pull out the original
221e740377ca Uploaded
bgruening
parents:
diff changeset
322 sequence from the genome and determine if there were any protected C's present or not.
221e740377ca Uploaded
bgruening
parents:
diff changeset
323
221e740377ca Uploaded
bgruening
parents:
diff changeset
324 .. _Bismark: http://www.bioinformatics.babraham.ac.uk/projects/bismark/
221e740377ca Uploaded
bgruening
parents:
diff changeset
325
221e740377ca Uploaded
bgruening
parents:
diff changeset
326 As of version 0.7.0 Bismark will only run 2 alignment threads for OT and OB in parallel, the 4 strand mode can be
221e740377ca Uploaded
bgruening
parents:
diff changeset
327 re-enabled by using non_directional mode.
221e740377ca Uploaded
bgruening
parents:
diff changeset
328
221e740377ca Uploaded
bgruening
parents:
diff changeset
329 It is developed by Krueger F and Andrews SR. at the Babraham Institute. Krueger F, Andrews SR. (2011) Bismark: a flexible aligner and methylation caller for Bisulfite-Seq applications. Bioinformatics, 27, 1571-2.
221e740377ca Uploaded
bgruening
parents:
diff changeset
330
221e740377ca Uploaded
bgruening
parents:
diff changeset
331 ------
221e740377ca Uploaded
bgruening
parents:
diff changeset
332
221e740377ca Uploaded
bgruening
parents:
diff changeset
333 **Know what you are doing**
221e740377ca Uploaded
bgruening
parents:
diff changeset
334
221e740377ca Uploaded
bgruening
parents:
diff changeset
335 .. class:: warningmark
221e740377ca Uploaded
bgruening
parents:
diff changeset
336
221e740377ca Uploaded
bgruening
parents:
diff changeset
337 There is no such thing (yet) as an automated gearshift in short read mapping. It is all like stick-shift driving in San Francisco. In other words = running this tool with default parameters will probably not give you meaningful results. A way to deal with this is to **understand** the parameters by carefully reading the `documentation`__ and experimenting. Fortunately, Galaxy makes experimenting easy.
221e740377ca Uploaded
bgruening
parents:
diff changeset
338
221e740377ca Uploaded
bgruening
parents:
diff changeset
339 .. __: http://www.bioinformatics.babraham.ac.uk/projects/bismark/
221e740377ca Uploaded
bgruening
parents:
diff changeset
340
221e740377ca Uploaded
bgruening
parents:
diff changeset
341 ------
221e740377ca Uploaded
bgruening
parents:
diff changeset
342
221e740377ca Uploaded
bgruening
parents:
diff changeset
343 **Input formats**
221e740377ca Uploaded
bgruening
parents:
diff changeset
344
221e740377ca Uploaded
bgruening
parents:
diff changeset
345 Bismark accepts files in either Sanger FASTQ format (galaxy type *fastqsanger*), Illumina FASTQ format (galaxy type *fastqillumina*) or FASTA format (galaxy type *fasta*). Use the FASTQ Groomer to prepare your files.
221e740377ca Uploaded
bgruening
parents:
diff changeset
346
221e740377ca Uploaded
bgruening
parents:
diff changeset
347 ------
221e740377ca Uploaded
bgruening
parents:
diff changeset
348
221e740377ca Uploaded
bgruening
parents:
diff changeset
349 **A Note on Built-in Reference Genomes**
221e740377ca Uploaded
bgruening
parents:
diff changeset
350
221e740377ca Uploaded
bgruening
parents:
diff changeset
351 The default variant for all genomes is "Full", defined as all primary chromosomes (or scaffolds/contigs) including mitochondrial plus associated unmapped, plasmid, and other segments. When only one version of a genome is available in this tool, it represents the default "Full" variant. Some genomes will have more than one variant available. The "Canonical Male" or sometimes simply "Canonical" variant contains the primary chromosomes for a genome. For example a human "Canonical" variant contains chr1-chr22, chrX, chrY, and chrM. The "Canonical Female" variant contains the primary chromosomes excluding chrY.
221e740377ca Uploaded
bgruening
parents:
diff changeset
352
221e740377ca Uploaded
bgruening
parents:
diff changeset
353 ------
221e740377ca Uploaded
bgruening
parents:
diff changeset
354
221e740377ca Uploaded
bgruening
parents:
diff changeset
355 The final output of Bismark is in SAM format by default.
221e740377ca Uploaded
bgruening
parents:
diff changeset
356
221e740377ca Uploaded
bgruening
parents:
diff changeset
357 **Outputs**
221e740377ca Uploaded
bgruening
parents:
diff changeset
358
221e740377ca Uploaded
bgruening
parents:
diff changeset
359 The output is in SAM format, and has the following columns::
221e740377ca Uploaded
bgruening
parents:
diff changeset
360
221e740377ca Uploaded
bgruening
parents:
diff changeset
361 Column Description
221e740377ca Uploaded
bgruening
parents:
diff changeset
362 -------- --------------------------------------------------------
221e740377ca Uploaded
bgruening
parents:
diff changeset
363 1 QNAME seq-ID
221e740377ca Uploaded
bgruening
parents:
diff changeset
364 2 FLAG this flag tries to take the strand a bisulfite read
221e740377ca Uploaded
bgruening
parents:
diff changeset
365 originated from into account
221e740377ca Uploaded
bgruening
parents:
diff changeset
366 (this is different from ordinary DNA alignment flags!)
221e740377ca Uploaded
bgruening
parents:
diff changeset
367 3 RNAME chromosome
221e740377ca Uploaded
bgruening
parents:
diff changeset
368 4 POS start position
221e740377ca Uploaded
bgruening
parents:
diff changeset
369 5 MAPQ always 255
221e740377ca Uploaded
bgruening
parents:
diff changeset
370 6 CIGAR extended CIGAR string
221e740377ca Uploaded
bgruening
parents:
diff changeset
371 7 MRNM Mate Reference sequence NaMe ('=' if same as RNAME)
221e740377ca Uploaded
bgruening
parents:
diff changeset
372 8 MPOS 1-based Mate POSition
221e740377ca Uploaded
bgruening
parents:
diff changeset
373 9 ISIZE Inferred insert SIZE
221e740377ca Uploaded
bgruening
parents:
diff changeset
374 10 SEQ query SEQuence on the same strand as the reference
221e740377ca Uploaded
bgruening
parents:
diff changeset
375 11 QUAL Phred33 scale
221e740377ca Uploaded
bgruening
parents:
diff changeset
376 12 NM-tag edit distance to the reference)
221e740377ca Uploaded
bgruening
parents:
diff changeset
377 13 XX-tag base-by-base mismatches to the reference.
221e740377ca Uploaded
bgruening
parents:
diff changeset
378 This does not include indels.
221e740377ca Uploaded
bgruening
parents:
diff changeset
379 14 XM-tag methylation call string
221e740377ca Uploaded
bgruening
parents:
diff changeset
380 15 XR-tag read conversion state for the alignment
221e740377ca Uploaded
bgruening
parents:
diff changeset
381 16 XG-tag genome conversion state for the alignment
221e740377ca Uploaded
bgruening
parents:
diff changeset
382
221e740377ca Uploaded
bgruening
parents:
diff changeset
383
221e740377ca Uploaded
bgruening
parents:
diff changeset
384 Each read of paired-end alignments is written out in a separate line in the above format.
221e740377ca Uploaded
bgruening
parents:
diff changeset
385
221e740377ca Uploaded
bgruening
parents:
diff changeset
386
221e740377ca Uploaded
bgruening
parents:
diff changeset
387 It looks like this (scroll sideways to see the entire example)::
221e740377ca Uploaded
bgruening
parents:
diff changeset
388
221e740377ca Uploaded
bgruening
parents:
diff changeset
389 QNAME FLAG RNAME POS MAPQ CIAGR MRNM MPOS ISIZE SEQ QUAL OPT
221e740377ca Uploaded
bgruening
parents:
diff changeset
390 HWI-EAS91_1_30788AAXX:1:1:1761:343 4 * 0 0 * * 0 0 AAAAAAANNAAAAAAAAAAAAAAAAAAAAAAAAAAACNNANNGAGTNGNNNNNNNGCTTCCCACAGNNCTGG hhhhhhh;;hhhhhhhhhhh^hOhhhhghhhfhhhgh;;h;;hhhh;h;;;;;;;hhhhhhghhhh;;Phhh
221e740377ca Uploaded
bgruening
parents:
diff changeset
391 HWI-EAS91_1_30788AAXX:1:1:1578:331 4 * 0 0 * * 0 0 GTATAGANNAATAAGAAAAAAAAAAATGAAGACTTTCNNANNTCTGNANNNNNNNTCTTTTTTCAGNNGTAG hhhhhhh;;hhhhhhhhhhhhhhhhhhhhhhhhhhhh;;h;;hhhh;h;;;;;;;hhhhhhhhhhh;;hhVh
221e740377ca Uploaded
bgruening
parents:
diff changeset
392
221e740377ca Uploaded
bgruening
parents:
diff changeset
393 -------
221e740377ca Uploaded
bgruening
parents:
diff changeset
394
221e740377ca Uploaded
bgruening
parents:
diff changeset
395 **Bismark settings**
221e740377ca Uploaded
bgruening
parents:
diff changeset
396
221e740377ca Uploaded
bgruening
parents:
diff changeset
397 All of the options have a default value. You can change any of them. If any Bismark function is missing please contact the tool author or your Galaxy admin.
221e740377ca Uploaded
bgruening
parents:
diff changeset
398
221e740377ca Uploaded
bgruening
parents:
diff changeset
399 ------
221e740377ca Uploaded
bgruening
parents:
diff changeset
400
221e740377ca Uploaded
bgruening
parents:
diff changeset
401 **Bismark parameter list**
221e740377ca Uploaded
bgruening
parents:
diff changeset
402
221e740377ca Uploaded
bgruening
parents:
diff changeset
403 This is an exhaustive list of Bismark options:
221e740377ca Uploaded
bgruening
parents:
diff changeset
404
221e740377ca Uploaded
bgruening
parents:
diff changeset
405 ------
221e740377ca Uploaded
bgruening
parents:
diff changeset
406
221e740377ca Uploaded
bgruening
parents:
diff changeset
407 **OPTIONS**
221e740377ca Uploaded
bgruening
parents:
diff changeset
408
221e740377ca Uploaded
bgruening
parents:
diff changeset
409
221e740377ca Uploaded
bgruening
parents:
diff changeset
410 Input::
221e740377ca Uploaded
bgruening
parents:
diff changeset
411
221e740377ca Uploaded
bgruening
parents:
diff changeset
412 --singles A comma- or space-separated list of files containing the reads to be aligned (e.g.
221e740377ca Uploaded
bgruening
parents:
diff changeset
413 lane1.fq,lane2.fq lane3.fq). Reads may be a mix of different lengths. Bismark will
221e740377ca Uploaded
bgruening
parents:
diff changeset
414 produce one mapping result and one report file per input file.
221e740377ca Uploaded
bgruening
parents:
diff changeset
415
221e740377ca Uploaded
bgruening
parents:
diff changeset
416 -1 mates1 Comma-separated list of files containing the #1 mates (filename usually includes
221e740377ca Uploaded
bgruening
parents:
diff changeset
417 "_1"), e.g. flyA_1.fq,flyB_1.fq). Sequences specified with this option must
221e740377ca Uploaded
bgruening
parents:
diff changeset
418 correspond file-for-file and read-for-read with those specified in mates2.
221e740377ca Uploaded
bgruening
parents:
diff changeset
419 Reads may be a mix of different lengths. Bismark will produce one mapping result
221e740377ca Uploaded
bgruening
parents:
diff changeset
420 and one report file per paired-end input file pair.
221e740377ca Uploaded
bgruening
parents:
diff changeset
421
221e740377ca Uploaded
bgruening
parents:
diff changeset
422 -2 mates2 Comma-separated list of files containing the #2 mates (filename usually includes
221e740377ca Uploaded
bgruening
parents:
diff changeset
423 "_2"), e.g. flyA_1.fq,flyB_1.fq). Sequences specified with this option must
221e740377ca Uploaded
bgruening
parents:
diff changeset
424 correspond file-for-file and read-for-read with those specified in mates1.
221e740377ca Uploaded
bgruening
parents:
diff changeset
425 Reads may be a mix of different lengths.
221e740377ca Uploaded
bgruening
parents:
diff changeset
426
221e740377ca Uploaded
bgruening
parents:
diff changeset
427 -q/--fastq The query input files (specified as mate1,mate2 or singles are FASTQ
221e740377ca Uploaded
bgruening
parents:
diff changeset
428 files (usually having extension .fg or .fastq). This is the default. See also
221e740377ca Uploaded
bgruening
parents:
diff changeset
429 --solexa-quals.
221e740377ca Uploaded
bgruening
parents:
diff changeset
430
221e740377ca Uploaded
bgruening
parents:
diff changeset
431 -f/--fasta The query input files (specified as mate1,mate2 or singles are FASTA
221e740377ca Uploaded
bgruening
parents:
diff changeset
432 files (usually havin extension .fa, .mfa, .fna or similar). All quality values
221e740377ca Uploaded
bgruening
parents:
diff changeset
433 are assumed to be 40 on the Phred scale.
221e740377ca Uploaded
bgruening
parents:
diff changeset
434
221e740377ca Uploaded
bgruening
parents:
diff changeset
435 -s/--skip INT Skip (i.e. do not align) the first INT reads or read pairs from the input.
221e740377ca Uploaded
bgruening
parents:
diff changeset
436
221e740377ca Uploaded
bgruening
parents:
diff changeset
437 -u/--upto INT Only aligns the first INT reads or read pairs from the input. Default: no limit.
221e740377ca Uploaded
bgruening
parents:
diff changeset
438
221e740377ca Uploaded
bgruening
parents:
diff changeset
439 --phred33-quals FASTQ qualities are ASCII chars equal to the Phred quality plus 33. Default: on.
221e740377ca Uploaded
bgruening
parents:
diff changeset
440
221e740377ca Uploaded
bgruening
parents:
diff changeset
441 --phred64-quals FASTQ qualities are ASCII chars equal to the Phred quality plus 64. Default: off.
221e740377ca Uploaded
bgruening
parents:
diff changeset
442
221e740377ca Uploaded
bgruening
parents:
diff changeset
443 --solexa-quals Convert FASTQ qualities from solexa-scaled (which can be negative) to phred-scaled
221e740377ca Uploaded
bgruening
parents:
diff changeset
444 (which can't). The formula for conversion is:
221e740377ca Uploaded
bgruening
parents:
diff changeset
445 phred-qual = 10 * log(1 + 10 ** (solexa-qual/10.0)) / log(10). Used with -q. This
221e740377ca Uploaded
bgruening
parents:
diff changeset
446 is usually the right option for use with (unconverted) reads emitted by the GA
221e740377ca Uploaded
bgruening
parents:
diff changeset
447 Pipeline versions prior to 1.3. Works only for Bowtie 1. Default: off.
221e740377ca Uploaded
bgruening
parents:
diff changeset
448
221e740377ca Uploaded
bgruening
parents:
diff changeset
449 --solexa1.3-quals Same as --phred64-quals. This is usually the right option for use with (unconverted)
221e740377ca Uploaded
bgruening
parents:
diff changeset
450 reads emitted by GA Pipeline version 1.3 or later. Default: off.
221e740377ca Uploaded
bgruening
parents:
diff changeset
451
221e740377ca Uploaded
bgruening
parents:
diff changeset
452
221e740377ca Uploaded
bgruening
parents:
diff changeset
453 Alignment::
221e740377ca Uploaded
bgruening
parents:
diff changeset
454
221e740377ca Uploaded
bgruening
parents:
diff changeset
455 -n/--seedmms INT The maximum number of mismatches permitted in the "seed", i.e. the first L base pairs
221e740377ca Uploaded
bgruening
parents:
diff changeset
456 of the read (where L is set with -l/--seedlen). This may be 0, 1, 2 or 3 and the
221e740377ca Uploaded
bgruening
parents:
diff changeset
457 default is 1. This option is only available for Bowtie 1 (for Bowtie 2 see -N).
221e740377ca Uploaded
bgruening
parents:
diff changeset
458
221e740377ca Uploaded
bgruening
parents:
diff changeset
459 -l/--seedlen The "seed length"; i.e., the number of bases of the high quality end of the read to
221e740377ca Uploaded
bgruening
parents:
diff changeset
460 which the -n ceiling applies. The default is 28. Bowtie (and thus Bismark) is faster for
221e740377ca Uploaded
bgruening
parents:
diff changeset
461 larger values of -l. This option is only available for Bowtie 1 (for Bowtie 2 see -L).
221e740377ca Uploaded
bgruening
parents:
diff changeset
462
221e740377ca Uploaded
bgruening
parents:
diff changeset
463 -e/--maqerr INT Maximum permitted total of quality values at all mismatched read positions throughout
221e740377ca Uploaded
bgruening
parents:
diff changeset
464 the entire alignment, not just in the "seed". The default is 70. Like Maq, bowtie rounds
221e740377ca Uploaded
bgruening
parents:
diff changeset
465 quality values to the nearest 10 and saturates at 30. This value is not relevant for
221e740377ca Uploaded
bgruening
parents:
diff changeset
466 Bowtie 2.
221e740377ca Uploaded
bgruening
parents:
diff changeset
467
221e740377ca Uploaded
bgruening
parents:
diff changeset
468 --chunkmbs INT The number of megabytes of memory a given thread is given to store path descriptors in
221e740377ca Uploaded
bgruening
parents:
diff changeset
469 --best mode. Best-first search must keep track of many paths at once to ensure it is
221e740377ca Uploaded
bgruening
parents:
diff changeset
470 always extending the path with the lowest cumulative cost. Bowtie tries to minimize the
221e740377ca Uploaded
bgruening
parents:
diff changeset
471 memory impact of the descriptors, but they can still grow very large in some cases. If
221e740377ca Uploaded
bgruening
parents:
diff changeset
472 you receive an error message saying that chunk memory has been exhausted in --best mode,
221e740377ca Uploaded
bgruening
parents:
diff changeset
473 try adjusting this parameter up to dedicate more memory to the descriptors. This value
221e740377ca Uploaded
bgruening
parents:
diff changeset
474 is not relevant for Bowtie 2. Default: 512.
221e740377ca Uploaded
bgruening
parents:
diff changeset
475
221e740377ca Uploaded
bgruening
parents:
diff changeset
476 -I/--minins INT The minimum insert size for valid paired-end alignments. E.g. if -I 60 is specified and
221e740377ca Uploaded
bgruening
parents:
diff changeset
477 a paired-end alignment consists of two 20-bp alignments in the appropriate orientation
221e740377ca Uploaded
bgruening
parents:
diff changeset
478 with a 20-bp gap between them, that alignment is considered valid (as long as -X is also
221e740377ca Uploaded
bgruening
parents:
diff changeset
479 satisfied). A 19-bp gap would not be valid in that case. Default: 0.
221e740377ca Uploaded
bgruening
parents:
diff changeset
480
221e740377ca Uploaded
bgruening
parents:
diff changeset
481 -X/--maxins INT The maximum insert size for valid paired-end alignments. E.g. if -X 100 is specified and
221e740377ca Uploaded
bgruening
parents:
diff changeset
482 a paired-end alignment consists of two 20-bp alignments in the proper orientation with a
221e740377ca Uploaded
bgruening
parents:
diff changeset
483 60-bp gap between them, that alignment is considered valid (as long as -I is also satisfied).
221e740377ca Uploaded
bgruening
parents:
diff changeset
484 A 61-bp gap would not be valid in that case. Default: 500.
221e740377ca Uploaded
bgruening
parents:
diff changeset
485
221e740377ca Uploaded
bgruening
parents:
diff changeset
486
221e740377ca Uploaded
bgruening
parents:
diff changeset
487
221e740377ca Uploaded
bgruening
parents:
diff changeset
488 Output::
221e740377ca Uploaded
bgruening
parents:
diff changeset
489
221e740377ca Uploaded
bgruening
parents:
diff changeset
490 --non_directional The sequencing library was constructed in a non strand-specific manner, alignments to all four
221e740377ca Uploaded
bgruening
parents:
diff changeset
491 bisulfite strands will be reported. Default: OFF.
221e740377ca Uploaded
bgruening
parents:
diff changeset
492
221e740377ca Uploaded
bgruening
parents:
diff changeset
493 (The current Illumina protocol for BS-Seq is directional, in which case the strands complementary
221e740377ca Uploaded
bgruening
parents:
diff changeset
494 to the original strands are merely theoretical and should not exist in reality. Specifying directional
221e740377ca Uploaded
bgruening
parents:
diff changeset
495 alignments (which is the default) will only run 2 alignment threads to the original top (OT)
221e740377ca Uploaded
bgruening
parents:
diff changeset
496 or bottom (OB) strands in parallel and report these alignments. This is the recommended option
221e740377ca Uploaded
bgruening
parents:
diff changeset
497 for sprand-specific libraries).
221e740377ca Uploaded
bgruening
parents:
diff changeset
498
221e740377ca Uploaded
bgruening
parents:
diff changeset
499 --sam-no-hd Suppress SAM header lines (starting with @). This might be useful when very large input files are
221e740377ca Uploaded
bgruening
parents:
diff changeset
500 split up into several smaller files to run concurrently and the output files are to be merged.
221e740377ca Uploaded
bgruening
parents:
diff changeset
501
221e740377ca Uploaded
bgruening
parents:
diff changeset
502 --quiet Print nothing besides alignments.
221e740377ca Uploaded
bgruening
parents:
diff changeset
503
221e740377ca Uploaded
bgruening
parents:
diff changeset
504 --vanilla Performs bisulfite mapping with Bowtie 1 and prints the 'old' output (as in Bismark 0.5.X) instead
221e740377ca Uploaded
bgruening
parents:
diff changeset
505 of SAM format output.
221e740377ca Uploaded
bgruening
parents:
diff changeset
506
221e740377ca Uploaded
bgruening
parents:
diff changeset
507 -un/--unmapped Write all reads that could not be aligned to a file in the output directory. Written reads will
221e740377ca Uploaded
bgruening
parents:
diff changeset
508 appear as they did in the input, without any translation of quality values that may have
221e740377ca Uploaded
bgruening
parents:
diff changeset
509 taken place within Bowtie or Bismark. Paired-end reads will be written to two parallel files with _1
221e740377ca Uploaded
bgruening
parents:
diff changeset
510 and _2 inserted in their filenames, i.e. _unmapped_reads_1.txt and unmapped_reads_2.txt. Reads
221e740377ca Uploaded
bgruening
parents:
diff changeset
511 with more than one valid alignment with the same number of lowest mismatches (ambiguous mapping)
221e740377ca Uploaded
bgruening
parents:
diff changeset
512 are also written to _unmapped_reads.txt unless the option --ambiguous is specified as well.
221e740377ca Uploaded
bgruening
parents:
diff changeset
513
221e740377ca Uploaded
bgruening
parents:
diff changeset
514 --ambiguous Write all reads which produce more than one valid alignment with the same number of lowest
221e740377ca Uploaded
bgruening
parents:
diff changeset
515 mismatches or other reads that fail to align uniquely to a file in the output directory.
221e740377ca Uploaded
bgruening
parents:
diff changeset
516 Written reads will appear as they did in the input, without any of the translation of quality
221e740377ca Uploaded
bgruening
parents:
diff changeset
517 values that may have taken place within Bowtie or Bismark. Paired-end reads will be written to two
221e740377ca Uploaded
bgruening
parents:
diff changeset
518 parallel files with _1 and _2 inserted in theit filenames, i.e. _ambiguous_reads_1.txt and
221e740377ca Uploaded
bgruening
parents:
diff changeset
519 _ambiguous_reads_2.txt. These reads are not written to the file specified with --un.
221e740377ca Uploaded
bgruening
parents:
diff changeset
520
221e740377ca Uploaded
bgruening
parents:
diff changeset
521 -o/--output_dir DIR Write all output files into this directory. By default the output files will be written into
221e740377ca Uploaded
bgruening
parents:
diff changeset
522 the same folder as the input file(s). If the specified folder does not exist, Bismark will attempt
221e740377ca Uploaded
bgruening
parents:
diff changeset
523 to create it first. The path to the output folder can be either relative or absolute.
221e740377ca Uploaded
bgruening
parents:
diff changeset
524
221e740377ca Uploaded
bgruening
parents:
diff changeset
525 --temp_dir DIR Write temporary files to this directory instead of into the same directory as the input files. If
221e740377ca Uploaded
bgruening
parents:
diff changeset
526 the specified folder does not exist, Bismark will attempt to create it first. The path to the
221e740377ca Uploaded
bgruening
parents:
diff changeset
527 temporary folder can be either relative or absolute.
221e740377ca Uploaded
bgruening
parents:
diff changeset
528
221e740377ca Uploaded
bgruening
parents:
diff changeset
529 ------
221e740377ca Uploaded
bgruening
parents:
diff changeset
530
221e740377ca Uploaded
bgruening
parents:
diff changeset
531 Bowtie 2 alignment options::
221e740377ca Uploaded
bgruening
parents:
diff changeset
532
221e740377ca Uploaded
bgruening
parents:
diff changeset
533 -N INT Sets the number of mismatches to allowed in a seed alignment during multiseed alignment.
221e740377ca Uploaded
bgruening
parents:
diff changeset
534 Can be set to 0 or 1. Setting this higher makes alignment slower (often much slower)
221e740377ca Uploaded
bgruening
parents:
diff changeset
535 but increases sensitivity. Default: 0. This option is only available for Bowtie 2 (for
221e740377ca Uploaded
bgruening
parents:
diff changeset
536 Bowtie 1 see -n).
221e740377ca Uploaded
bgruening
parents:
diff changeset
537
221e740377ca Uploaded
bgruening
parents:
diff changeset
538 -L INT Sets the length of the seed substrings to align during multiseed alignment. Smaller values
221e740377ca Uploaded
bgruening
parents:
diff changeset
539 make alignment slower but more senstive. Default: the --sensitive preset of Bowtie 2 is
221e740377ca Uploaded
bgruening
parents:
diff changeset
540 used by default, which sets -L to 20. This option is only available for Bowtie 2 (for
221e740377ca Uploaded
bgruening
parents:
diff changeset
541 Bowtie 1 see -l).
221e740377ca Uploaded
bgruening
parents:
diff changeset
542
221e740377ca Uploaded
bgruening
parents:
diff changeset
543 --ignore-quals When calculating a mismatch penalty, always consider the quality value at the mismatched
221e740377ca Uploaded
bgruening
parents:
diff changeset
544 position to be the highest possible, regardless of the actual value. I.e. input is treated
221e740377ca Uploaded
bgruening
parents:
diff changeset
545 as though all quality values are high. This is also the default behavior when the input
221e740377ca Uploaded
bgruening
parents:
diff changeset
546 doesn't specify quality values (e.g. in -f mode). This option is invariable and on by default.
221e740377ca Uploaded
bgruening
parents:
diff changeset
547
221e740377ca Uploaded
bgruening
parents:
diff changeset
548
221e740377ca Uploaded
bgruening
parents:
diff changeset
549 Bowtie 2 paired-end options::
221e740377ca Uploaded
bgruening
parents:
diff changeset
550
221e740377ca Uploaded
bgruening
parents:
diff changeset
551 --no-mixed This option disables Bowtie 2's behavior to try to find alignments for the individual mates if
221e740377ca Uploaded
bgruening
parents:
diff changeset
552 it cannot find a concordant or discordant alignment for a pair. This option is invariable and
221e740377ca Uploaded
bgruening
parents:
diff changeset
553 and on by default.
221e740377ca Uploaded
bgruening
parents:
diff changeset
554
221e740377ca Uploaded
bgruening
parents:
diff changeset
555 --no-discordant Normally, Bowtie 2 looks for discordant alignments if it cannot find any concordant alignments.
221e740377ca Uploaded
bgruening
parents:
diff changeset
556 A discordant alignment is an alignment where both mates align uniquely, but that does not
221e740377ca Uploaded
bgruening
parents:
diff changeset
557 satisfy the paired-end constraints (--fr/--rf/--ff, -I, -X). This option disables that behavior
221e740377ca Uploaded
bgruening
parents:
diff changeset
558 and it is on by default.
221e740377ca Uploaded
bgruening
parents:
diff changeset
559
221e740377ca Uploaded
bgruening
parents:
diff changeset
560
221e740377ca Uploaded
bgruening
parents:
diff changeset
561 Bowtie 2 effort options::
221e740377ca Uploaded
bgruening
parents:
diff changeset
562
221e740377ca Uploaded
bgruening
parents:
diff changeset
563 -D INT Up to INT consecutive seed extension attempts can "fail" before Bowtie 2 moves on, using
221e740377ca Uploaded
bgruening
parents:
diff changeset
564 the alignments found so far. A seed extension "fails" if it does not yield a new best or a
221e740377ca Uploaded
bgruening
parents:
diff changeset
565 new second-best alignment. Default: 15.
221e740377ca Uploaded
bgruening
parents:
diff changeset
566
221e740377ca Uploaded
bgruening
parents:
diff changeset
567 -R INT INT is the maximum number of times Bowtie 2 will "re-seed" reads with repetitive seeds.
221e740377ca Uploaded
bgruening
parents:
diff changeset
568 When "re-seeding," Bowtie 2 simply chooses a new set of reads (same length, same number of
221e740377ca Uploaded
bgruening
parents:
diff changeset
569 mismatches allowed) at different offsets and searches for more alignments. A read is considered
221e740377ca Uploaded
bgruening
parents:
diff changeset
570 to have repetitive seeds if the total number of seed hits divided by the number of seeds
221e740377ca Uploaded
bgruening
parents:
diff changeset
571 that aligned at least once is greater than 300. Default: 2.
221e740377ca Uploaded
bgruening
parents:
diff changeset
572
221e740377ca Uploaded
bgruening
parents:
diff changeset
573
221e740377ca Uploaded
bgruening
parents:
diff changeset
574 Bowtie 2 Scoring options::
221e740377ca Uploaded
bgruening
parents:
diff changeset
575
221e740377ca Uploaded
bgruening
parents:
diff changeset
576 --score_min "func" Sets a function governing the minimum alignment score needed for an alignment to be considered
221e740377ca Uploaded
bgruening
parents:
diff changeset
577 "valid" (i.e. good enough to report). This is a function of read length. For instance, specifying
221e740377ca Uploaded
bgruening
parents:
diff changeset
578 L,0,-0.2 sets the minimum-score function f to f(x) = 0 + -0.2 * x, where x is the read length.
221e740377ca Uploaded
bgruening
parents:
diff changeset
579 See also: setting function options at http://bowtie-bio.sourceforge.net/bowtie2. The default is
221e740377ca Uploaded
bgruening
parents:
diff changeset
580 L,0,-0.2.
221e740377ca Uploaded
bgruening
parents:
diff changeset
581
221e740377ca Uploaded
bgruening
parents:
diff changeset
582
221e740377ca Uploaded
bgruening
parents:
diff changeset
583 Bowtie 2 Reporting options::
221e740377ca Uploaded
bgruening
parents:
diff changeset
584
221e740377ca Uploaded
bgruening
parents:
diff changeset
585 --most_valid_alignments INT This used to be the Bowtie 2 parameter -M. As of Bowtie 2 version 2.0.0 beta7 the option -M is
221e740377ca Uploaded
bgruening
parents:
diff changeset
586 deprecated. It will be removed in subsequent versions. What used to be called -M mode is still the
221e740377ca Uploaded
bgruening
parents:
diff changeset
587 default mode, but adjusting the -M setting is deprecated. Use the -D and -R options to adjust the
221e740377ca Uploaded
bgruening
parents:
diff changeset
588 effort expended to find valid alignments.
221e740377ca Uploaded
bgruening
parents:
diff changeset
589
221e740377ca Uploaded
bgruening
parents:
diff changeset
590 For reference, this used to be the old (now deprecated) description of -M:
221e740377ca Uploaded
bgruening
parents:
diff changeset
591 Bowtie 2 searches for at most INT+1 distinct, valid alignments for each read. The search terminates when it
221e740377ca Uploaded
bgruening
parents:
diff changeset
592 can't find more distinct valid alignments, or when it finds INT+1 distinct alignments, whichever
221e740377ca Uploaded
bgruening
parents:
diff changeset
593 happens first. Only the best alignment is reported. Information from the other alignments is used to
221e740377ca Uploaded
bgruening
parents:
diff changeset
594 estimate mapping quality and to set SAM optional fields, such as AS:i and XS:i. Increasing -M makes
221e740377ca Uploaded
bgruening
parents:
diff changeset
595 Bowtie 2 slower, but increases the likelihood that it will pick the correct alignment for a read that
221e740377ca Uploaded
bgruening
parents:
diff changeset
596 aligns many places. For reads that have more than INT+1 distinct, valid alignments, Bowtie 2 does not
221e740377ca Uploaded
bgruening
parents:
diff changeset
597 guarantee that the alignment reported is the best possible in terms of alignment score. -M is
221e740377ca Uploaded
bgruening
parents:
diff changeset
598 always used and its default value is set to 10.
221e740377ca Uploaded
bgruening
parents:
diff changeset
599
221e740377ca Uploaded
bgruening
parents:
diff changeset
600 </help>
221e740377ca Uploaded
bgruening
parents:
diff changeset
601 </tool>