Mercurial > repos > iuc > minimap2
comparison minimap2.xml @ 7:831dcb48efa1 draft
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/minimap2 commit 7cb87c310b34cb2af2547ad8a14679107fd86d5d
author | iuc |
---|---|
date | Sat, 04 Nov 2017 05:40:54 -0400 |
parents | 4d84d86b368e |
children | 6090793a47e8 |
comparison
equal
deleted
inserted
replaced
6:4d84d86b368e | 7:831dcb48efa1 |
---|---|
1 <?xml version="1.0"?> | 1 <?xml version="1.0"?> |
2 <tool id="minimap2" name="Map with minimap2" version="2.3" profile="17.01"> | 2 <tool id="minimap2" name="Map with minimap2" version="2.3" profile="17.01"> |
3 <description>- A fast pairwise aligner for genomic and spliced nucleotide sequences</description> | 3 <description>A fast pairwise aligner for genomic and spliced nucleotide sequences</description> |
4 <requirements> | 4 <requirements> |
5 <requirement type="package" version="2.3">minimap2</requirement> | 5 <requirement type="package" version="2.3">minimap2</requirement> |
6 <requirement type="package" version="1.6">samtools</requirement> | 6 <requirement type="package" version="1.6">samtools</requirement> |
7 </requirements> | 7 </requirements> |
8 <version_command>minimap2 --version</version_command> | 8 <version_command>minimap2 --version</version_command> |
9 <command> | 9 <command> |
10 <![CDATA[ | 10 <![CDATA[ |
11 #if $reference_source.reference_source_selector == 'history': | 11 #if $reference_source.reference_source_selector == 'history': |
12 ln -f -s '$reference_source.ref_file' reference.fa && | 12 ln -f -s '$reference_source.ref_file' reference.fa && |
13 #else: | 13 #else: |
14 ln -f -s '$reference_source.ref_file.fields.path' reference.fa && | 14 ln -f -s '$reference_source.ref_file.fields.path' reference.fa && |
15 #end if | 15 #end if |
60 #end if | 60 #end if |
61 #if $alignment_options.B: | 61 #if $alignment_options.B: |
62 -B $alignment_options.B | 62 -B $alignment_options.B |
63 #end if | 63 #end if |
64 #if $alignment_options.O: | 64 #if $alignment_options.O: |
65 -O $alignment_options.O | 65 #if $alignment_options.O2: |
66 #end if | 66 -O $alignment_options.O,$alignment_options.O2 |
67 #end if | |
68 -O $alignment_options.O | |
69 #end if | |
67 #if $alignment_options.E: | 70 #if $alignment_options.E: |
68 -E $alignment_options.E | 71 #if $alignment_options.E2: |
72 -E $alignment_options.E,$alignment_options.E2 | |
73 #else | |
74 -E $alignment_options | |
75 #end if | |
69 #end if | 76 #end if |
70 #if $alignment_options.z: | 77 #if $alignment_options.z: |
71 $alignment_options.z | 78 $alignment_options.z |
72 #end if | 79 #end if |
73 #if $alignment_options.s: | 80 #if $alignment_options.s: |
90 #if $fastq_input.fastq_input_selector in ['single', 'paired_iv']: | 97 #if $fastq_input.fastq_input_selector in ['single', 'paired_iv']: |
91 '$fastq_input.fastq_input1' | 98 '$fastq_input.fastq_input1' |
92 #else if $fastq_input.fastq_input_selector == 'paired': | 99 #else if $fastq_input.fastq_input_selector == 'paired': |
93 '$fastq_input.fastq_input1' '$fastq_input.fastq_input2' | 100 '$fastq_input.fastq_input1' '$fastq_input.fastq_input2' |
94 #else if $fastq_input.fastq_input_selector == 'paired_collection': | 101 #else if $fastq_input.fastq_input_selector == 'paired_collection': |
95 '$fastq_input.fastq_input1.forward' '$fastq_input.fastq_input2.reverse' | 102 '$fastq_input.fastq_input1.forward' '$fastq_input.fastq_input1.reverse' |
96 #end if | 103 #end if |
97 | samtools sort | 104 | samtools sort |
98 -@\${GALAXY_SLOTS:-2} | 105 -@\${GALAXY_SLOTS:-2} |
99 -O BAM | 106 -O $io_options.output_format |
100 #if $io_options.output_format == 'CRAM': | 107 #if $io_options.output_format == 'CRAM': |
101 -l 0| samtools view -T reference.fa -C | 108 --reference reference.fa |
102 #end if | 109 #end if |
103 > '$alignment_output' | 110 -o '$alignment_output' |
104 ]]> | 111 ]]> |
105 </command> | 112 </command> |
106 <inputs> | 113 <inputs> |
107 <conditional name="reference_source"> | 114 <conditional name="reference_source"> |
108 <param name="reference_source_selector" type="select" label="Will you select a reference genome from your history or use a built-in index?" help="Built-ins were indexed using default options. See `Indexes` section of help below"> | 115 <param name="reference_source_selector" type="select" label="Will you select a reference genome from your history or use a built-in index?" help="Built-ins were indexed using default options. See `Indexes` section of help below"> |
161 <option value="ava-pb">-Hk19 -w5 -Xp0 -m100 -g10000 --max-chain-skip 25 (PacBio read overlap)</option> | 168 <option value="ava-pb">-Hk19 -w5 -Xp0 -m100 -g10000 --max-chain-skip 25 (PacBio read overlap)</option> |
162 <option value="ava-ont">-k15 -w5 -Xp0 -m100 -g10000 --max-chain-skip 25 (ONT read overlap)</option> | 169 <option value="ava-ont">-k15 -w5 -Xp0 -m100 -g10000 --max-chain-skip 25 (ONT read overlap)</option> |
163 <option value="splice">long-read spliced alignment</option> | 170 <option value="splice">long-read spliced alignment</option> |
164 <option value="sr">short single-end reads without splicing</option> | 171 <option value="sr">short single-end reads without splicing</option> |
165 </param> | 172 </param> |
166 <section name="mapping_options" title="Set advanced mapping options" help="Sets -f, -g, -G, -F, -r, -n, -m, -X, -p, and -N options." expanded="False"> | 173 <section name="mapping_options" title="Set advanced mapping options" help="Sets -f, -g, -G, -F, -r, -n, -m, -X, -p and -N options." expanded="False"> |
167 <param argument="-f" type="float" value="" optional="true" label="filter out top FLOAT fraction of repetitive minimizers" help="default=0.0002"/> | 174 <param argument="-f" type="float" value="" optional="true" label="filter out top FLOAT fraction of repetitive minimizers" help="default=0.0002"/> |
168 <param argument="-g" type="integer" value="" optional="true" label="stop chain enlongation if there are no minimizers in INT-bp" help="default=5000"/> | 175 <param argument="-g" type="integer" value="" optional="true" label="stop chain enlongation if there are no minimizers in INT-bp" help="default=5000"/> |
169 <param argument="-G" type="integer" value="" optional="true" label="max intron length in thousand (effective with -xsplice; changing -r)" help="default=200"/> | 176 <param argument="-G" type="integer" value="" optional="true" label="max intron length in thousand (effective with -xsplice; changing -r)" help="default=200"/> |
170 <param argument="-F" type="integer" value="" optional="true" label="max fragment length (effective with -xsr or in the fragment mode)" help="default=800" /> | 177 <param argument="-F" type="integer" value="" optional="true" label="max fragment length (effective with -xsr or in the fragment mode)" help="default=800" /> |
171 <param argument="-r" type="integer" value="" optional="true" label="bandwidth used in chaining and DP-based alignment" help="default=500" /> | 178 <param argument="-r" type="integer" value="" optional="true" label="bandwidth used in chaining and DP-based alignment" help="default=500" /> |
173 <param argument="-m" type="integer" value="" optional="true" label="minimal chaining score (matching bases minus log gap penalty)" help="default=40"/> | 180 <param argument="-m" type="integer" value="" optional="true" label="minimal chaining score (matching bases minus log gap penalty)" help="default=40"/> |
174 <param argument="-X" type="boolean" truevalue="-X" falsevalue="" optional="true" label="skip self and dual mappings (for the all-vs-all mode)"/> | 181 <param argument="-X" type="boolean" truevalue="-X" falsevalue="" optional="true" label="skip self and dual mappings (for the all-vs-all mode)"/> |
175 <param argument="-p" type="float" value="" max="1" optional="true" label="min secondary-to-primary score ratio" help="default=0.8"/> | 182 <param argument="-p" type="float" value="" max="1" optional="true" label="min secondary-to-primary score ratio" help="default=0.8"/> |
176 <param argument="-N" type="integer" min="0" optional="true" label="retain at most INT secondary alignments" help="default=5"/> | 183 <param argument="-N" type="integer" min="0" optional="true" label="retain at most INT secondary alignments" help="default=5"/> |
177 </section> | 184 </section> |
178 <section name="alignment_options" title="Set advanced alignment options" help="Sets -Q, -L, -R, -c, --cs, and -K options." expanded="False"> | 185 <section name="alignment_options" title="Set advanced alignment options" help="Sets -A, -B, -O, -E, -z, -s and -u options." expanded="False"> |
179 <param argument="-A" type="integer" optional="true" label="Score for a sequence match" help="default=2"/> | 186 <param argument="-A" type="integer" optional="true" label="Score for a sequence match" help="default=2"/> |
180 <param argument="-B" type="integer" optional="true" label="Penalty for a mismatch" help="-B; default=4" /> | 187 <param argument="-B" type="integer" optional="true" label="Penalty for a mismatch" help="-B; default=4" /> |
181 <param argument="-O" type="text" optional="true" label="Gap open penalties for deletions and insertions" help="-O; default=4,24"> | 188 <param argument="-O" type="integer" min="0" optional="true" label="Gap open penalties for deletions" help="-O; default=4"/> |
182 <sanitizer invalid_char=""> | 189 <param name="-O2" type="integer" min="0" optional="true" label="Gap open penalties for insertions" help="-O; default=24"/> |
183 <valid initial="string.digits"><add value=","/> </valid> | 190 <param argument="-E" type="integer" min="0" optional="true" label="Gap extension penalties; a gap of size k cost '-O + -E*k'. If two numbers are specified, the first is the penalty of extending a deletion and the second for extending an insertion" help="-E; default=2"/> |
184 </sanitizer> | 191 <param name="E2" type="integer" min="0" optional="true" label="Gap extension penalty for extending an insertion; if left empty uses the value specified for Gap extension penalties above" help="-E; default=1"/> |
185 </param> | |
186 <param argument="-E" type="text" optional="true" label="Gap extension penalties; a gap of size k cost '-O + -E*k'. If two numbers are specified, the first is the penalty of extending a deletion and the second for extending an insertion" help="-E; default=2,1"> | |
187 <sanitizer invalid_char=""> | |
188 <valid initial="string.digits"><add value=","/> </valid> | |
189 </sanitizer> | |
190 </param> | |
191 <param argument="-z" type="integer" optional="true" label="Z-drop score" help="default=400"/> | 192 <param argument="-z" type="integer" optional="true" label="Z-drop score" help="default=400"/> |
192 <param argument="-s" type="integer" optional="true" label="minimal peak DP alignment score" help="default=80"/> | 193 <param argument="-s" type="integer" optional="true" label="minimal peak DP alignment score" help="default=80"/> |
193 <param argument="-u" type="select" optional="true" label="how to find GT-AG"> | 194 <param argument="-u" type="select" optional="true" label="how to find GT-AG"> |
194 <option value="n">don't match GT-AG</option> | 195 <option value="n">don't match GT-AG</option> |
195 <option value="f">transcript strand</option> | 196 <option value="f">transcript strand</option> |
196 <option value="b">both strands</option> | 197 <option value="b">both strands</option> |
197 </param> | 198 </param> |
198 </section> | 199 </section> |
199 <section name="io_options" title="Set advanced output options" help="Sets -T, -h, -a, -C, -V, -Y, and -M options." expanded="False"> | 200 <section name="io_options" title="Set advanced output options" help="Sets -Q, -L, -R, -c, --cs and -K options." expanded="False"> |
200 <param name="output_format" type="select" label="Produce BAM or CRAM file?"> | 201 <param name="output_format" type="select" label="Produce BAM or CRAM file?"> |
201 <option value="BAM">BAM</option> | 202 <option value="BAM">BAM</option> |
202 <option value="CRAM">CRAM</option> | 203 <option value="CRAM">CRAM</option> |
203 </param> | 204 </param> |
204 <param argument="-Q" type="boolean" truevalue="-Q" falsevalue="" optional="true" label="don't output base quality"/> | 205 <param argument="-Q" type="boolean" truevalue="-Q" falsevalue="" optional="true" label="don't output base quality"/> |
235 </change_format> | 236 </change_format> |
236 </data> | 237 </data> |
237 </outputs> | 238 </outputs> |
238 <tests> | 239 <tests> |
239 <test> | 240 <test> |
241 <!-- test single input --> | |
242 <param name="reference_source_selector" value="history" /> | |
243 <param name="ref_file" ftype="fasta" value="bwa-mem-mt-genome.fa"/> | |
244 <param name="fastq_input_selector" value="single"/> | |
245 <param name="fastq_input1" ftype="fastqsanger" value="bwa-mem-fasta1.fa"/> | |
246 <param name="analysis_type_selector" value="sr"/> | |
247 <output name="alignment_output" ftype="bam" file="minimap2-test1-fasta.bam" lines_diff="2" /> | |
248 </test> | |
249 <test> | |
250 <!-- test cram output --> | |
251 <param name="reference_source_selector" value="history" /> | |
252 <param name="ref_file" ftype="fasta" value="bwa-mem-mt-genome.fa"/> | |
253 <param name="fastq_input_selector" value="single"/> | |
254 <param name="fastq_input1" ftype="fastqsanger" value="bwa-mem-fasta1.fa"/> | |
255 <param name="analysis_type_selector" value="sr"/> | |
256 <param name="output_format" value="CRAM"/> | |
257 <output name="alignment_output" ftype="cram" file="minimap2-test1-fasta.cram" compare="sim_size" /> | |
258 </test> | |
259 <test> | |
260 <!-- test paired input --> | |
240 <param name="reference_source_selector" value="history" /> | 261 <param name="reference_source_selector" value="history" /> |
241 <param name="ref_file" ftype="fasta" value="bwa-mem-mt-genome.fa"/> | 262 <param name="ref_file" ftype="fasta" value="bwa-mem-mt-genome.fa"/> |
242 <param name="fastq_input_selector" value="paired"/> | 263 <param name="fastq_input_selector" value="paired"/> |
243 <param name="fastq_input1" ftype="fastqsanger" value="bwa-mem-fastq1.fq"/> | 264 <param name="fastq_input1" ftype="fastqsanger" value="bwa-mem-fastq1.fq"/> |
244 <param name="fastq_input2" ftype="fastqsanger" value="bwa-mem-fastq2.fq"/> | 265 <param name="fastq_input2" ftype="fastqsanger" value="bwa-mem-fastq2.fq"/> |
245 <param name="analysis_type_selector" value="sr"/> | 266 <param name="analysis_type_selector" value="sr"/> |
246 <output name="alignment_output" ftype="bam" file="bwa-mem-test1.bam" lines_diff="2" /> | 267 <output name="alignment_output" ftype="bam" file="minimap2-test1.bam" lines_diff="2" /> |
247 </test> | 268 </test> |
248 <test> | 269 <test> |
249 <param name="reference_source_selector" value="history" /> | 270 <!-- test paired input with one pair compressed --> |
250 <param name="ref_file" ftype="fasta" value="bwa-mem-mt-genome.fa"/> | |
251 <param name="fastq_input_selector" value="single"/> | |
252 <param name="fastq_input1" ftype="fastqsanger" value="bwa-mem-fasta1.fa"/> | |
253 <param name="analysis_type_selector" value="sr"/> | |
254 <output name="alignment_output" ftype="bam" file="bwa-mem-test1-fasta.bam" lines_diff="2" /> | |
255 </test> | |
256 <test> | |
257 <param name="reference_source_selector" value="history" /> | 271 <param name="reference_source_selector" value="history" /> |
258 <param name="ref_file" ftype="fasta" value="bwa-mem-mt-genome.fa"/> | 272 <param name="ref_file" ftype="fasta" value="bwa-mem-mt-genome.fa"/> |
259 <param name="fastq_input_selector" value="paired"/> | 273 <param name="fastq_input_selector" value="paired"/> |
260 <param name="fastq_input1" ftype="fastqsanger.gz" value="bwa-mem-fastq1.fq.gz"/> | 274 <param name="fastq_input1" ftype="fastqsanger.gz" value="bwa-mem-fastq1.fq.gz"/> |
261 <param name="fastq_input2" ftype="fastqsanger" value="bwa-mem-fastq2.fq"/> | 275 <param name="fastq_input2" ftype="fastqsanger" value="bwa-mem-fastq2.fq"/> |
262 <param name="analysis_type_selector" value="sr"/> | 276 <param name="analysis_type_selector" value="sr"/> |
263 <output name="alignment_output" ftype="bam" file="bwa-mem-test1.bam" lines_diff="2" /> | 277 <output name="alignment_output" ftype="bam" file="minimap2-test1.bam" lines_diff="2" /> |
264 </test> | 278 </test> |
265 <test> | 279 <test> |
280 <!-- test collection input --> | |
266 <param name="reference_source_selector" value="history" /> | 281 <param name="reference_source_selector" value="history" /> |
267 <param name="ref_file" ftype="fasta" value="bwa-mem-mt-genome.fa"/> | 282 <param name="ref_file" ftype="fasta" value="bwa-mem-mt-genome.fa"/> |
268 <param name="fastq_input_selector" value="paired"/> | 283 <param name="fastq_input_selector" value="paired_collection"/> |
269 <param name="fastq_input1" ftype="fastqsanger" value="bwa-mem-fastq1.fq"/> | 284 <param name="fastq_input1"> |
270 <param name="fastq_input2" ftype="fastqsanger" value="bwa-mem-fastq2.fq"/> | 285 <collection type="paired"> |
286 <element name="forward" value="bwa-mem-fastq1.fq" /> | |
287 <element name="reverse" value="bwa-mem-fastq2.fq" /> | |
288 </collection> | |
289 </param> | |
271 <param name="analysis_type_selector" value="sr"/> | 290 <param name="analysis_type_selector" value="sr"/> |
272 <output name="alignment_output" ftype="bam" file="bwa-mem-test2.bam" lines_diff="2" /> | 291 <output name="alignment_output" ftype="bam" file="minimap2-test2.bam" lines_diff="2" /> |
292 </test> | |
293 <test> | |
294 <!-- test data table reference --> | |
295 <param name="reference_source_selector" value="cached" /> | |
296 <param name="ref_file" value="bwa-mem-mt-genome"/> | |
297 <param name="fastq_input_selector" value="single"/> | |
298 <param name="fastq_input1" ftype="fastqsanger" value="bwa-mem-fasta1.fa"/> | |
299 <param name="analysis_type_selector" value="sr"/> | |
300 <output name="alignment_output" ftype="bam" file="minimap2-test1-fasta.bam" lines_diff="2" /> | |
273 </test> | 301 </test> |
274 </tests> | 302 </tests> |
275 <help> | 303 <help> |
276 | 304 |
277 Users’ Guide | 305 Users’ Guide |
494 | 522 |
495 - Minimap2 may produce suboptimal alignments through long | 523 - Minimap2 may produce suboptimal alignments through long |
496 low-complexity regions where seed positions may be suboptimal. This | 524 low-complexity regions where seed positions may be suboptimal. This |
497 should not be a big concern because even the optimal alignment may be | 525 should not be a big concern because even the optimal alignment may be |
498 wrong in such regions. | 526 wrong in such regions. |
499 | |
500 - Minimap2 requires SSE2 instructions to compile. It is possible to add | |
501 non-SSE2 support, but it would make minimap2 slower by several times. | |
502 | |
503 In general, minimap2 is a young project with most code written since | |
504 June, 2017. It may have bugs and room for improvements. Bug reports and | |
505 suggestions are warmly welcomed. | |
506 </help> | 527 </help> |
507 <citations> | 528 <citations> |
508 <citation type="doi">10.1093/bioinformatics/btp324</citation> | 529 <citation type="doi">10.1093/bioinformatics/btp324</citation> |
509 <citation type="doi">10.1093/bioinformatics/btp698</citation> | 530 <citation type="doi">10.1093/bioinformatics/btp698</citation> |
510 <citation type="bibtex">@misc{1303.3997, | 531 <citation type="bibtex">@misc{1303.3997, |