comparison maxbin2.xml @ 5:7160fa1ecb30 draft default tip

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/maxbin2/ commit 5efe64a2c3cb7495d708f539d341fa53fba07fe4
author iuc
date Fri, 03 Oct 2025 15:57:34 +0000
parents 9d11c2c0ff24
children
comparison
equal deleted inserted replaced
4:9d11c2c0ff24 5:7160fa1ecb30
1 <tool id="maxbin2" name="MaxBin2" version="@MAXBIN_VERSION@+galaxy3"> 1 <tool id="maxbin2" name="MaxBin2" version="@MAXBIN_VERSION@+galaxy6">
2 <description>clusters metagenomic contigs into bins</description> 2 <description>clusters metagenomic contigs into bins</description>
3 <xrefs>
4 <xref type="bio.tools">masigpro</xref>
5 </xrefs>
6 <macros> 3 <macros>
7 <token name="@MAXBIN_VERSION@">2.2.7</token> 4 <token name="@MAXBIN_VERSION@">2.2.7</token>
8 <xml name="contig"> 5 <xml name="contig">
9 <param argument="-contig" type="data" format="fasta,fasta.gz" label="Contig file"/> 6 <param argument="-contig" type="data" format="fasta,fasta.gz" label="Contig file"/>
10 </xml> 7 </xml>
17 <xml name="reads_extra_params"> 14 <xml name="reads_extra_params">
18 <param name="output_abundances" type="boolean" checked="false" label="Output abundances" help="" /> 15 <param name="output_abundances" type="boolean" checked="false" label="Output abundances" help="" />
19 <param argument="--reassembly" type="boolean" truevalue="-reassembly" falsevalue="" checked="false" label="Reassembly" help="Reassembly option is still highly experimental. To use this function, you need to feed MaxBin interleaved paired-end fastq or fasta file." /> 16 <param argument="--reassembly" type="boolean" truevalue="-reassembly" falsevalue="" checked="false" label="Reassembly" help="Reassembly option is still highly experimental. To use this function, you need to feed MaxBin interleaved paired-end fastq or fasta file." />
20 </xml> 17 </xml>
21 </macros> 18 </macros>
19 <xrefs>
20 <xref type="bio.tools">maxbin</xref>
21 </xrefs>
22 <requirements> 22 <requirements>
23 <requirement type="package" version="@MAXBIN_VERSION@">maxbin2</requirement> 23 <requirement type="package" version="@MAXBIN_VERSION@">maxbin2</requirement>
24 </requirements> 24 </requirements>
25 <version_command><![CDATA[run_MaxBin.pl -version | head -n 1]]></version_command> 25 <version_command><![CDATA[run_MaxBin.pl -version | head -n 1]]></version_command>
26 <command detect_errors="exit_code"><![CDATA[ 26 <command detect_errors="exit_code"><![CDATA[
27 ## generate read or abundance files 27 ## generate read or abundance files
28 #import re
28 #if $assembly.inputs.type == 'reads' 29 #if $assembly.inputs.type == 'reads'
29 #if $assembly.type == 'individual' 30 #if $assembly.type == 'individual'
30 echo '$assembly.inputs.reads' >> reads_list && 31 ## uncompress .gz reads files if necessary
32 #set $e = $assembly.inputs.reads
33 #set $identifier = re.sub('[^\w\-\\.]', '_', str($e.element_identifier))
34 #if $e.ext.endswith(".gz")
35 gunzip -c '$e' > '$identifier' &&
36 echo '$identifier' >> reads_list &&
37 #else
38 ln -s '$e' '$identifier' &&
39 echo '$identifier' >> reads_list &&
40 #end if
31 #else 41 #else
32 #for $r in $assembly.inputs.reads 42 #for $i, $r in enumerate($assembly.inputs.reads)
33 #if $r 43 #if $r
34 echo '$r' >> reads_list && 44 #set $identifier = re.sub('[^\w\-\\.]', '_', str($r.element_identifier))
45 #set $newid = $identifier + '_' + str($i)
46 #if $r.ext.endswith(".gz")
47 gunzip -c '$r' > '$newid' &&
48 echo '$newid' >> reads_list &&
49 #else
50 ln -s '$r' '$newid' &&
51 echo '$newid' >> reads_list &&
52 #end if
35 #end if 53 #end if
36 #end for 54 #end for
37 #end if 55 #end if
38 #else if $assembly.inputs.type == 'abund' 56 #else if $assembly.inputs.type == 'abund'
39 #if $assembly.type == 'individual' 57 #if $assembly.type == 'individual'
92 </param> 110 </param>
93 <when value="individual"> 111 <when value="individual">
94 <conditional name="inputs"> 112 <conditional name="inputs">
95 <expand macro="input_type"/> 113 <expand macro="input_type"/>
96 <when value="reads"> 114 <when value="reads">
97 <param argument="-reads" type="data" format="fasta,fastq" label="Reads file"/> 115 <param argument="-reads" type="data" format="fasta,fastq,fastq.gz,fasta.gz" label="Reads file"/>
98 <expand macro="reads_extra_params"/> 116 <expand macro="reads_extra_params"/>
99 </when> 117 </when>
100 <when value="abund"> 118 <when value="abund">
101 <param argument="-abund" type="data" format="tabular" label="Abundance file"/> 119 <param argument="-abund" type="data" format="tabular" label="Abundance file"/>
102 </when> 120 </when>
342 <has_text text="out.002.fasta"/> 360 <has_text text="out.002.fasta"/>
343 <has_text text="2878"/> 361 <has_text text="2878"/>
344 </assert_contents> 362 </assert_contents>
345 </output> 363 </output>
346 </test> 364 </test>
365 <!-- test w contigs and reads in fastqsanger format as input -->
366 <test expect_num_outputs="4">
367 <param name="contig" value="test4_contigs.fasta" ftype="fasta" />
368 <conditional name="assembly">
369 <param name="type" value="individual"/>
370 <conditional name="inputs">
371 <param name="type" value="reads"/>
372 <param name="reads" value="test4_reads.fastqsanger" ftype="fastqsanger"/>
373 <param name="output_abundances" value="false"/>
374 <param name="reassembly" value=""/>
375 </conditional>
376 </conditional>
377 <section name="adv">
378 <param name="min_contig_length" value="1000"/>
379 <param name="max_iteration" value="50"/>
380 <param name="prob_threshold" value="0.5"/>
381 </section>
382 <section name="output">
383 <param name="plotmarker" value=""/>
384 <param name="marker" value="false"/>
385 <param name="markers" value="false" />
386 <param name="log" value="false"/>
387 <param name="markerset" value="107"/>
388 </section>
389 <output_collection name="bins" type="list" count="2">
390 <element name="001" file="4/out.001.fasta" ftype="fasta"/>
391 <element name="002" file="4/out.002.fasta" ftype="fasta"/>
392 </output_collection>
393 <output name="summary" file="4/out.summary" ftype="tabular" />
394 <output name="noclass" file="4/out.noclass" ftype="fasta" />
395 <output name="toshort" file="4/out.tooshort" ftype="fasta" />
396 </test>
397 <!-- test w contigs and reads in fastqsanger format as input (and whitespace in reads filename)-->
398 <test expect_num_outputs="4">
399 <param name="contig" value="test4_contigs.fasta" ftype="fasta" />
400 <conditional name="assembly">
401 <param name="type" value="individual"/>
402 <conditional name="inputs">
403 <param name="type" value="reads"/>
404 <param name="reads" value="test4_reads 2.fastqsanger" ftype="fastqsanger"/>
405 <param name="output_abundances" value="false"/>
406 <param name="reassembly" value=""/>
407 </conditional>
408 </conditional>
409 <section name="adv">
410 <param name="min_contig_length" value="1000"/>
411 <param name="max_iteration" value="50"/>
412 <param name="prob_threshold" value="0.5"/>
413 </section>
414 <section name="output">
415 <param name="plotmarker" value=""/>
416 <param name="marker" value="false"/>
417 <param name="markers" value="false" />
418 <param name="log" value="false"/>
419 <param name="markerset" value="107"/>
420 </section>
421 <output_collection name="bins" type="list" count="2">
422 <element name="001" file="4/out.001.fasta" ftype="fasta"/>
423 <element name="002" file="4/out.002.fasta" ftype="fasta"/>
424 </output_collection>
425 <output name="summary" file="4/out.summary" ftype="tabular" />
426 <output name="noclass" file="4/out.noclass" ftype="fasta" />
427 <output name="toshort" file="4/out.tooshort" ftype="fasta" />
428 </test>
429 <!-- test w contigs and reads in fastqsanger.gz format as input -->
430 <test expect_num_outputs="4">
431 <param name="contig" value="test4_contigs.fasta" ftype="fasta" />
432 <conditional name="assembly">
433 <param name="type" value="individual"/>
434 <conditional name="inputs">
435 <param name="type" value="reads"/>
436 <param name="reads" value="test4_reads.fastqsanger.gz" ftype="fastqsanger.gz"/>
437 <param name="output_abundances" value="false"/>
438 <param name="reassembly" value=""/>
439 </conditional>
440 </conditional>
441 <section name="adv">
442 <param name="min_contig_length" value="1000"/>
443 <param name="max_iteration" value="50"/>
444 <param name="prob_threshold" value="0.5"/>
445 </section>
446 <section name="output">
447 <param name="plotmarker" value=""/>
448 <param name="marker" value="false"/>
449 <param name="markers" value="false" />
450 <param name="log" value="false"/>
451 <param name="markerset" value="107"/>
452 </section>
453 <output_collection name="bins" type="list" count="2">
454 <element name="001" file="4/out.001.fasta" ftype="fasta"/>
455 <element name="002" file="4/out.002.fasta" ftype="fasta"/>
456 </output_collection>
457 <output name="summary" file="4/out.summary" ftype="tabular" />
458 <output name="noclass" file="4/out.noclass" ftype="fasta" />
459 <output name="toshort" file="4/out.tooshort" ftype="fasta" />
460 </test>
461 <!-- test w co-assembled contigs and multiple reads as .gz and optional outputs -->
462 <test expect_num_outputs="9">
463 <param name="contig" value="test4_contigs.fasta" ftype="fasta" />
464 <conditional name="assembly">
465 <param name="type" value="coassembly"/>
466 <conditional name="inputs">
467 <param name="type" value="reads"/>
468 <param name="reads" value="test4_reads.fastqsanger.gz,test4_reads.fastqsanger.gz" ftype="fasta"/>
469 <param name="output_abundances" value="true"/>
470 <param name="reassembly" value=""/>
471 </conditional>
472 </conditional>
473 <section name="adv">
474 <param name="min_contig_length" value="1000"/>
475 <param name="max_iteration" value="50"/>
476 <param name="prob_threshold" value="0.5"/>
477 </section>
478 <section name="output">
479 <param name="plotmarker" value="true"/>
480 <param name="marker" value="true"/>
481 <param name="markers" value="true" />
482 <param name="log" value="true"/>
483 <param name="markerset" value="107"/>
484 </section>
485 <output_collection name="bins" type="list" count="2">
486 <element name="001" file="4/out.001.fasta" ftype="fasta"/>
487 <element name="002" file="4/out.002.fasta" ftype="fasta"/>
488 </output_collection>
489 <output name="summary" ftype="tabular">
490 <assert_contents>
491 <has_text text="Completeness"/>
492 <has_text text="out.001.fasta"/>
493 </assert_contents>
494 </output>
495 <output name="noclass" file="4/out.noclass" ftype="fasta" />
496 <output name="toshort" file="4/out.tooshort" ftype="fasta" />
497 <output name="log" ftype="txt" >
498 <assert_contents>
499 <has_text text="Input contig"/>
500 <has_text text="Elapsed time"/>
501 <has_text text="Yielded 2 bins for contig (scaffold) file"/>
502 </assert_contents>
503 </output>
504 <output name="abundout" file="4/out.abund1" ftype="tabular" />
505 <output name="marker" file="4/out.marker" ftype="tabular" />
506 <output name="plot" file="4/out.marker.pdf" ftype="pdf" compare="sim_size" />
507 <output_collection name="markers" type="list" count="2">
508 <element name="001" ftype="fasta">
509 <assert_contents>
510 <has_text text=">out.001.Methyltransf_5"/>
511 </assert_contents>
512 </element>
513 <element name="002" ftype="fasta">
514 <assert_contents>
515 <has_text text=">out.002.Methyltransf_5"/>
516 </assert_contents>
517 </element>
518 </output_collection>
519 </test>
347 </tests> 520 </tests>
348 <help><![CDATA[ 521 <help><![CDATA[
349 MaxBin is a software that clusters metagenomic contigs into different bins, 522 MaxBin is a software that clusters metagenomic contigs into different bins,
350 each consists (hopefully) of contigs from one species. MaxBin uses the 523 each consists (hopefully) of contigs from one species. MaxBin uses the
351 nucleotide composition information and contig abundance information to do 524 nucleotide composition information and contig abundance information to do
362 535
363 The abundance information can be provided as tabular file: 536 The abundance information can be provided as tabular file:
364 537
365 For example, assume I have three contigs named A0001, A0002, and A0003, then my abundance file will look like 538 For example, assume I have three contigs named A0001, A0002, and A0003, then my abundance file will look like
366 539
367 A0001 30.89 540 ===== =====
368 A0002 20.02 541 A0001 30.89
369 A0003 78.93 542 A0002 20.02
543 A0003 78.93
544 ===== =====
545
370 546
371 Reads/Abundundance files can be given in multiple files. 547 Reads/Abundundance files can be given in multiple files.
372 548
373 By default MaxBin will look for 107 marker genes present in >95% of bacteria. 549 By default MaxBin will look for 107 marker genes present in >95% of bacteria.
374 Alternatively you can also choose 40 marker gene sets that are universal among 550 Alternatively you can also choose 40 marker gene sets that are universal among