comparison minimap2.xml @ 7:831dcb48efa1 draft

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/minimap2 commit 7cb87c310b34cb2af2547ad8a14679107fd86d5d
author iuc
date Sat, 04 Nov 2017 05:40:54 -0400
parents 4d84d86b368e
children 6090793a47e8
comparison
equal deleted inserted replaced
6:4d84d86b368e 7:831dcb48efa1
1 <?xml version="1.0"?> 1 <?xml version="1.0"?>
2 <tool id="minimap2" name="Map with minimap2" version="2.3" profile="17.01"> 2 <tool id="minimap2" name="Map with minimap2" version="2.3" profile="17.01">
3 <description>- A fast pairwise aligner for genomic and spliced nucleotide sequences</description> 3 <description>A fast pairwise aligner for genomic and spliced nucleotide sequences</description>
4 <requirements> 4 <requirements>
5 <requirement type="package" version="2.3">minimap2</requirement> 5 <requirement type="package" version="2.3">minimap2</requirement>
6 <requirement type="package" version="1.6">samtools</requirement> 6 <requirement type="package" version="1.6">samtools</requirement>
7 </requirements> 7 </requirements>
8 <version_command>minimap2 --version</version_command> 8 <version_command>minimap2 --version</version_command>
9 <command> 9 <command>
10 <![CDATA[ 10 <![CDATA[
11 #if $reference_source.reference_source_selector == 'history': 11 #if $reference_source.reference_source_selector == 'history':
12 ln -f -s '$reference_source.ref_file' reference.fa && 12 ln -f -s '$reference_source.ref_file' reference.fa &&
13 #else: 13 #else:
14 ln -f -s '$reference_source.ref_file.fields.path' reference.fa && 14 ln -f -s '$reference_source.ref_file.fields.path' reference.fa &&
15 #end if 15 #end if
60 #end if 60 #end if
61 #if $alignment_options.B: 61 #if $alignment_options.B:
62 -B $alignment_options.B 62 -B $alignment_options.B
63 #end if 63 #end if
64 #if $alignment_options.O: 64 #if $alignment_options.O:
65 -O $alignment_options.O 65 #if $alignment_options.O2:
66 #end if 66 -O $alignment_options.O,$alignment_options.O2
67 #end if
68 -O $alignment_options.O
69 #end if
67 #if $alignment_options.E: 70 #if $alignment_options.E:
68 -E $alignment_options.E 71 #if $alignment_options.E2:
72 -E $alignment_options.E,$alignment_options.E2
73 #else
74 -E $alignment_options
75 #end if
69 #end if 76 #end if
70 #if $alignment_options.z: 77 #if $alignment_options.z:
71 $alignment_options.z 78 $alignment_options.z
72 #end if 79 #end if
73 #if $alignment_options.s: 80 #if $alignment_options.s:
90 #if $fastq_input.fastq_input_selector in ['single', 'paired_iv']: 97 #if $fastq_input.fastq_input_selector in ['single', 'paired_iv']:
91 '$fastq_input.fastq_input1' 98 '$fastq_input.fastq_input1'
92 #else if $fastq_input.fastq_input_selector == 'paired': 99 #else if $fastq_input.fastq_input_selector == 'paired':
93 '$fastq_input.fastq_input1' '$fastq_input.fastq_input2' 100 '$fastq_input.fastq_input1' '$fastq_input.fastq_input2'
94 #else if $fastq_input.fastq_input_selector == 'paired_collection': 101 #else if $fastq_input.fastq_input_selector == 'paired_collection':
95 '$fastq_input.fastq_input1.forward' '$fastq_input.fastq_input2.reverse' 102 '$fastq_input.fastq_input1.forward' '$fastq_input.fastq_input1.reverse'
96 #end if 103 #end if
97 | samtools sort 104 | samtools sort
98 -@\${GALAXY_SLOTS:-2} 105 -@\${GALAXY_SLOTS:-2}
99 -O BAM 106 -O $io_options.output_format
100 #if $io_options.output_format == 'CRAM': 107 #if $io_options.output_format == 'CRAM':
101 -l 0| samtools view -T reference.fa -C 108 --reference reference.fa
102 #end if 109 #end if
103 > '$alignment_output' 110 -o '$alignment_output'
104 ]]> 111 ]]>
105 </command> 112 </command>
106 <inputs> 113 <inputs>
107 <conditional name="reference_source"> 114 <conditional name="reference_source">
108 <param name="reference_source_selector" type="select" label="Will you select a reference genome from your history or use a built-in index?" help="Built-ins were indexed using default options. See `Indexes` section of help below"> 115 <param name="reference_source_selector" type="select" label="Will you select a reference genome from your history or use a built-in index?" help="Built-ins were indexed using default options. See `Indexes` section of help below">
161 <option value="ava-pb">-Hk19 -w5 -Xp0 -m100 -g10000 --max-chain-skip 25 (PacBio read overlap)</option> 168 <option value="ava-pb">-Hk19 -w5 -Xp0 -m100 -g10000 --max-chain-skip 25 (PacBio read overlap)</option>
162 <option value="ava-ont">-k15 -w5 -Xp0 -m100 -g10000 --max-chain-skip 25 (ONT read overlap)</option> 169 <option value="ava-ont">-k15 -w5 -Xp0 -m100 -g10000 --max-chain-skip 25 (ONT read overlap)</option>
163 <option value="splice">long-read spliced alignment</option> 170 <option value="splice">long-read spliced alignment</option>
164 <option value="sr">short single-end reads without splicing</option> 171 <option value="sr">short single-end reads without splicing</option>
165 </param> 172 </param>
166 <section name="mapping_options" title="Set advanced mapping options" help="Sets -f, -g, -G, -F, -r, -n, -m, -X, -p, and -N options." expanded="False"> 173 <section name="mapping_options" title="Set advanced mapping options" help="Sets -f, -g, -G, -F, -r, -n, -m, -X, -p and -N options." expanded="False">
167 <param argument="-f" type="float" value="" optional="true" label="filter out top FLOAT fraction of repetitive minimizers" help="default=0.0002"/> 174 <param argument="-f" type="float" value="" optional="true" label="filter out top FLOAT fraction of repetitive minimizers" help="default=0.0002"/>
168 <param argument="-g" type="integer" value="" optional="true" label="stop chain enlongation if there are no minimizers in INT-bp" help="default=5000"/> 175 <param argument="-g" type="integer" value="" optional="true" label="stop chain enlongation if there are no minimizers in INT-bp" help="default=5000"/>
169 <param argument="-G" type="integer" value="" optional="true" label="max intron length in thousand (effective with -xsplice; changing -r)" help="default=200"/> 176 <param argument="-G" type="integer" value="" optional="true" label="max intron length in thousand (effective with -xsplice; changing -r)" help="default=200"/>
170 <param argument="-F" type="integer" value="" optional="true" label="max fragment length (effective with -xsr or in the fragment mode)" help="default=800" /> 177 <param argument="-F" type="integer" value="" optional="true" label="max fragment length (effective with -xsr or in the fragment mode)" help="default=800" />
171 <param argument="-r" type="integer" value="" optional="true" label="bandwidth used in chaining and DP-based alignment" help="default=500" /> 178 <param argument="-r" type="integer" value="" optional="true" label="bandwidth used in chaining and DP-based alignment" help="default=500" />
173 <param argument="-m" type="integer" value="" optional="true" label="minimal chaining score (matching bases minus log gap penalty)" help="default=40"/> 180 <param argument="-m" type="integer" value="" optional="true" label="minimal chaining score (matching bases minus log gap penalty)" help="default=40"/>
174 <param argument="-X" type="boolean" truevalue="-X" falsevalue="" optional="true" label="skip self and dual mappings (for the all-vs-all mode)"/> 181 <param argument="-X" type="boolean" truevalue="-X" falsevalue="" optional="true" label="skip self and dual mappings (for the all-vs-all mode)"/>
175 <param argument="-p" type="float" value="" max="1" optional="true" label="min secondary-to-primary score ratio" help="default=0.8"/> 182 <param argument="-p" type="float" value="" max="1" optional="true" label="min secondary-to-primary score ratio" help="default=0.8"/>
176 <param argument="-N" type="integer" min="0" optional="true" label="retain at most INT secondary alignments" help="default=5"/> 183 <param argument="-N" type="integer" min="0" optional="true" label="retain at most INT secondary alignments" help="default=5"/>
177 </section> 184 </section>
178 <section name="alignment_options" title="Set advanced alignment options" help="Sets -Q, -L, -R, -c, --cs, and -K options." expanded="False"> 185 <section name="alignment_options" title="Set advanced alignment options" help="Sets -A, -B, -O, -E, -z, -s and -u options." expanded="False">
179 <param argument="-A" type="integer" optional="true" label="Score for a sequence match" help="default=2"/> 186 <param argument="-A" type="integer" optional="true" label="Score for a sequence match" help="default=2"/>
180 <param argument="-B" type="integer" optional="true" label="Penalty for a mismatch" help="-B; default=4" /> 187 <param argument="-B" type="integer" optional="true" label="Penalty for a mismatch" help="-B; default=4" />
181 <param argument="-O" type="text" optional="true" label="Gap open penalties for deletions and insertions" help="-O; default=4,24"> 188 <param argument="-O" type="integer" min="0" optional="true" label="Gap open penalties for deletions" help="-O; default=4"/>
182 <sanitizer invalid_char=""> 189 <param name="-O2" type="integer" min="0" optional="true" label="Gap open penalties for insertions" help="-O; default=24"/>
183 <valid initial="string.digits"><add value=","/> </valid> 190 <param argument="-E" type="integer" min="0" optional="true" label="Gap extension penalties; a gap of size k cost &#39;-O + -E*k&#39;. If two numbers are specified, the first is the penalty of extending a deletion and the second for extending an insertion" help="-E; default=2"/>
184 </sanitizer> 191 <param name="E2" type="integer" min="0" optional="true" label="Gap extension penalty for extending an insertion; if left empty uses the value specified for Gap extension penalties above" help="-E; default=1"/>
185 </param>
186 <param argument="-E" type="text" optional="true" label="Gap extension penalties; a gap of size k cost &#39;-O + -E*k&#39;. If two numbers are specified, the first is the penalty of extending a deletion and the second for extending an insertion" help="-E; default=2,1">
187 <sanitizer invalid_char="">
188 <valid initial="string.digits"><add value=","/> </valid>
189 </sanitizer>
190 </param>
191 <param argument="-z" type="integer" optional="true" label="Z-drop score" help="default=400"/> 192 <param argument="-z" type="integer" optional="true" label="Z-drop score" help="default=400"/>
192 <param argument="-s" type="integer" optional="true" label="minimal peak DP alignment score" help="default=80"/> 193 <param argument="-s" type="integer" optional="true" label="minimal peak DP alignment score" help="default=80"/>
193 <param argument="-u" type="select" optional="true" label="how to find GT-AG"> 194 <param argument="-u" type="select" optional="true" label="how to find GT-AG">
194 <option value="n">don't match GT-AG</option> 195 <option value="n">don't match GT-AG</option>
195 <option value="f">transcript strand</option> 196 <option value="f">transcript strand</option>
196 <option value="b">both strands</option> 197 <option value="b">both strands</option>
197 </param> 198 </param>
198 </section> 199 </section>
199 <section name="io_options" title="Set advanced output options" help="Sets -T, -h, -a, -C, -V, -Y, and -M options." expanded="False"> 200 <section name="io_options" title="Set advanced output options" help="Sets -Q, -L, -R, -c, --cs and -K options." expanded="False">
200 <param name="output_format" type="select" label="Produce BAM or CRAM file?"> 201 <param name="output_format" type="select" label="Produce BAM or CRAM file?">
201 <option value="BAM">BAM</option> 202 <option value="BAM">BAM</option>
202 <option value="CRAM">CRAM</option> 203 <option value="CRAM">CRAM</option>
203 </param> 204 </param>
204 <param argument="-Q" type="boolean" truevalue="-Q" falsevalue="" optional="true" label="don't output base quality"/> 205 <param argument="-Q" type="boolean" truevalue="-Q" falsevalue="" optional="true" label="don't output base quality"/>
235 </change_format> 236 </change_format>
236 </data> 237 </data>
237 </outputs> 238 </outputs>
238 <tests> 239 <tests>
239 <test> 240 <test>
241 <!-- test single input -->
242 <param name="reference_source_selector" value="history" />
243 <param name="ref_file" ftype="fasta" value="bwa-mem-mt-genome.fa"/>
244 <param name="fastq_input_selector" value="single"/>
245 <param name="fastq_input1" ftype="fastqsanger" value="bwa-mem-fasta1.fa"/>
246 <param name="analysis_type_selector" value="sr"/>
247 <output name="alignment_output" ftype="bam" file="minimap2-test1-fasta.bam" lines_diff="2" />
248 </test>
249 <test>
250 <!-- test cram output -->
251 <param name="reference_source_selector" value="history" />
252 <param name="ref_file" ftype="fasta" value="bwa-mem-mt-genome.fa"/>
253 <param name="fastq_input_selector" value="single"/>
254 <param name="fastq_input1" ftype="fastqsanger" value="bwa-mem-fasta1.fa"/>
255 <param name="analysis_type_selector" value="sr"/>
256 <param name="output_format" value="CRAM"/>
257 <output name="alignment_output" ftype="cram" file="minimap2-test1-fasta.cram" compare="sim_size" />
258 </test>
259 <test>
260 <!-- test paired input -->
240 <param name="reference_source_selector" value="history" /> 261 <param name="reference_source_selector" value="history" />
241 <param name="ref_file" ftype="fasta" value="bwa-mem-mt-genome.fa"/> 262 <param name="ref_file" ftype="fasta" value="bwa-mem-mt-genome.fa"/>
242 <param name="fastq_input_selector" value="paired"/> 263 <param name="fastq_input_selector" value="paired"/>
243 <param name="fastq_input1" ftype="fastqsanger" value="bwa-mem-fastq1.fq"/> 264 <param name="fastq_input1" ftype="fastqsanger" value="bwa-mem-fastq1.fq"/>
244 <param name="fastq_input2" ftype="fastqsanger" value="bwa-mem-fastq2.fq"/> 265 <param name="fastq_input2" ftype="fastqsanger" value="bwa-mem-fastq2.fq"/>
245 <param name="analysis_type_selector" value="sr"/> 266 <param name="analysis_type_selector" value="sr"/>
246 <output name="alignment_output" ftype="bam" file="bwa-mem-test1.bam" lines_diff="2" /> 267 <output name="alignment_output" ftype="bam" file="minimap2-test1.bam" lines_diff="2" />
247 </test> 268 </test>
248 <test> 269 <test>
249 <param name="reference_source_selector" value="history" /> 270 <!-- test paired input with one pair compressed -->
250 <param name="ref_file" ftype="fasta" value="bwa-mem-mt-genome.fa"/>
251 <param name="fastq_input_selector" value="single"/>
252 <param name="fastq_input1" ftype="fastqsanger" value="bwa-mem-fasta1.fa"/>
253 <param name="analysis_type_selector" value="sr"/>
254 <output name="alignment_output" ftype="bam" file="bwa-mem-test1-fasta.bam" lines_diff="2" />
255 </test>
256 <test>
257 <param name="reference_source_selector" value="history" /> 271 <param name="reference_source_selector" value="history" />
258 <param name="ref_file" ftype="fasta" value="bwa-mem-mt-genome.fa"/> 272 <param name="ref_file" ftype="fasta" value="bwa-mem-mt-genome.fa"/>
259 <param name="fastq_input_selector" value="paired"/> 273 <param name="fastq_input_selector" value="paired"/>
260 <param name="fastq_input1" ftype="fastqsanger.gz" value="bwa-mem-fastq1.fq.gz"/> 274 <param name="fastq_input1" ftype="fastqsanger.gz" value="bwa-mem-fastq1.fq.gz"/>
261 <param name="fastq_input2" ftype="fastqsanger" value="bwa-mem-fastq2.fq"/> 275 <param name="fastq_input2" ftype="fastqsanger" value="bwa-mem-fastq2.fq"/>
262 <param name="analysis_type_selector" value="sr"/> 276 <param name="analysis_type_selector" value="sr"/>
263 <output name="alignment_output" ftype="bam" file="bwa-mem-test1.bam" lines_diff="2" /> 277 <output name="alignment_output" ftype="bam" file="minimap2-test1.bam" lines_diff="2" />
264 </test> 278 </test>
265 <test> 279 <test>
280 <!-- test collection input -->
266 <param name="reference_source_selector" value="history" /> 281 <param name="reference_source_selector" value="history" />
267 <param name="ref_file" ftype="fasta" value="bwa-mem-mt-genome.fa"/> 282 <param name="ref_file" ftype="fasta" value="bwa-mem-mt-genome.fa"/>
268 <param name="fastq_input_selector" value="paired"/> 283 <param name="fastq_input_selector" value="paired_collection"/>
269 <param name="fastq_input1" ftype="fastqsanger" value="bwa-mem-fastq1.fq"/> 284 <param name="fastq_input1">
270 <param name="fastq_input2" ftype="fastqsanger" value="bwa-mem-fastq2.fq"/> 285 <collection type="paired">
286 <element name="forward" value="bwa-mem-fastq1.fq" />
287 <element name="reverse" value="bwa-mem-fastq2.fq" />
288 </collection>
289 </param>
271 <param name="analysis_type_selector" value="sr"/> 290 <param name="analysis_type_selector" value="sr"/>
272 <output name="alignment_output" ftype="bam" file="bwa-mem-test2.bam" lines_diff="2" /> 291 <output name="alignment_output" ftype="bam" file="minimap2-test2.bam" lines_diff="2" />
292 </test>
293 <test>
294 <!-- test data table reference -->
295 <param name="reference_source_selector" value="cached" />
296 <param name="ref_file" value="bwa-mem-mt-genome"/>
297 <param name="fastq_input_selector" value="single"/>
298 <param name="fastq_input1" ftype="fastqsanger" value="bwa-mem-fasta1.fa"/>
299 <param name="analysis_type_selector" value="sr"/>
300 <output name="alignment_output" ftype="bam" file="minimap2-test1-fasta.bam" lines_diff="2" />
273 </test> 301 </test>
274 </tests> 302 </tests>
275 <help> 303 <help>
276 304
277 Users’ Guide 305 Users’ Guide
494 522
495 - Minimap2 may produce suboptimal alignments through long 523 - Minimap2 may produce suboptimal alignments through long
496 low-complexity regions where seed positions may be suboptimal. This 524 low-complexity regions where seed positions may be suboptimal. This
497 should not be a big concern because even the optimal alignment may be 525 should not be a big concern because even the optimal alignment may be
498 wrong in such regions. 526 wrong in such regions.
499
500 - Minimap2 requires SSE2 instructions to compile. It is possible to add
501 non-SSE2 support, but it would make minimap2 slower by several times.
502
503 In general, minimap2 is a young project with most code written since
504 June, 2017. It may have bugs and room for improvements. Bug reports and
505 suggestions are warmly welcomed.
506 </help> 527 </help>
507 <citations> 528 <citations>
508 <citation type="doi">10.1093/bioinformatics/btp324</citation> 529 <citation type="doi">10.1093/bioinformatics/btp324</citation>
509 <citation type="doi">10.1093/bioinformatics/btp698</citation> 530 <citation type="doi">10.1093/bioinformatics/btp698</citation>
510 <citation type="bibtex">@misc{1303.3997, 531 <citation type="bibtex">@misc{1303.3997,