annotate circlator.xml @ 2:c27229938e09 draft default tip

planemo upload
author leomrtns
date Mon, 20 May 2019 05:20:53 -0400
parents 34810a7283ba
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
1 <tool id="circlator" name="A tool to circularize genome assemblies" version="0.1.0">
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
2 <description>
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
3 This task runs the complete Circlator pipeline. It runs the tasks: progcheck, mapreads, bam2reads, assemble, merge, clean, fixstart.
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
4 </description>
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
5 <requirements>
1
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
6 <requirement type="package" version="1.5.5=py_2">circlator</requirement>
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
7 <requirement type="package" version="3.23">mummer</requirement>
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
8 <requirement type="package" version="1.6">canu</requirement>
0
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
9 </requirements>
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
10 <command detect_errors="exit_code"><![CDATA[
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
11 circlator all
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
12 --threads \${GALAXY_SLOTS:-4}
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
13 #if str($assembly.canu_or_spades.assembler) == "spades"
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
14 --assembler spades
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
15 ${assembly.canu_or_spades.not_careful}
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
16 ${assembly.canu_or_spades.not_only_assembler}
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
17 #else if str($assembly.canu_or_spades.assembler) == "canu"
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
18 --assembler canu
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
19 --data_type ${assembly.canu_or_spades.datatype}
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
20 #end if
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
21 ${assembly.split_all_reads}
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
22 ${assembly.assemble_spades_use_first}
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
23 #if str($mapreads.bwa_opts) != ""
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
24 --bwa_opts "$mapreads.bwa_opts"
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
25 #end if
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
26 ${bam2read.b2r_discard}
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
27 #if str($bam2read.b2r_length_cutoff) != ""
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
28 --b2r_length_cutoff ${bam2read.b2r_length_cutoff}
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
29 #end if
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
30 #if str($bam2read.b2r_min_read_length) != ""
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
31 --b2r_min_read_length ${bam2read.b2r_min_read_length}
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
32 #end if
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
33 #if str($fix.fixstart_mincluster) != ""
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
34 --fixstart_mincluster $fix.fixstart_mincluster
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
35 #end if
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
36 #if str($fix.fixstart_min_id) != ""
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
37 --fixstart_min_id $fix.fixstart_min_id
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
38 #end if
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
39 $file_contigs $file_reads outdir
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
40 ]]></command>
1
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
41 <environment_variables>
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
42 <environment_variable name="LC_ALL">C</environment_variable>
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
43 </environment_variables>
0
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
44 <inputs>
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
45 <param type="data" name="file_reads" label="Reads to be mapped to contig, in any format BWA MEM accepts" format="fastqsanger,fastqsanger.gz,fasta, fasta.gz" />
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
46 <param type="data" name="file_contigs" label="Assembly (contigs)" format="fasta" />
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
47
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
48 <section name="assembly" title="Assembly">
1
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
49 <conditional name="canu_or_spades">
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
50 <param name="assembler" type="select" label="Assembler to use for reassemblies" >
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
51 <option value="spades" selected="true">SPAdes</option>
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
52 <option value="canu">Canu</option>
0
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
53 </param>
1
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
54 <when value="canu">
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
55 <param name="datatype" type="select" label="one of the 4 types of data analysed" >
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
56 <option value="pacbio-corrected" selected="true">pacbio corrected</option>
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
57 <option value="pacbio-raw">pacbio raw</option>
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
58 <option value="nanopore-corrected">nanopore corrected</option>
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
59 <option value="nanopore-raw">nanopore raw</option>
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
60 </param>
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
61 </when>
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
62 <when value="spades">
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
63 <param name="not_careful" argument="--assemble_not_careful" type="boolean" truevalue="--assemble_not_careful" falsevalue="" checked="false"
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
64 label="Do not use the --careful option with SPAdes" help="note that this circlator option is to NOT use an option from SPAdes; if unsure, leave it unchekced" />
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
65 <param name="not_only_assembler" argument="--assemble_not_only_assembler" truevalue="--assemble_not_only_assembler" falsevalue=""
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
66 type="boolean" checked="false" label="Do not use the --assemble-only option with SPAdes. Important: with this option, the input reads must
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
67 be in FASTQ format, otherwise SPAdes will crash because it needs quality scores to correct the reads."
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
68 help="note that this circlator option is to NOT use an option from SPAdes; if unsure, leave it unchecked"/>
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
69 </when>
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
70 </conditional>
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
71 <param name="split_all_reads" argument="--split_all_reads" type="boolean" truevalue="--split_all_reads" falsevalue="" checked="false"
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
72 label="By default, reads mapped to shorter contigs are left unchanged. This option splits them into two, broken at the middle of the
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
73 contig to try to force circularization. May help if the assembler does not detect circular contigs (eg canu)" />
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
74 <param name="assemble_spades_use_first" argument="--assemble_spades_use_first" truevalue="--assemble_spades_use_first" falsevalue=""
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
75 checked="false" type="boolean" label="Use the first successful SPAdes assembly. Default is to try all kmers and use the assembly with
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
76 the largest N50" />
0
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
77
1
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
78 </section>
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
79 <section name="mapreads" title="mapreads options">
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
80 <param name="bwa_opts" type="text" label="text with BWA options (exactly as used by BWA MEM)"/>
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
81 </section>
0
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
82
1
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
83 <section name="bam2read" title="bam2reads options">
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
84 <param name="b2r_discard" argument="--b2r_discard_unmapped" truevalue="--b2r_discard_unmapped" falsevalue="" checked="false" type="boolean"
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
85 label="Check this to not keep unmapped reads" />
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
86 <param name="b2r_length_cutoff" type="integer" label="All reads mapped to contigs shorter than this will be kept (default=100000)" optional="true"/>
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
87 <param name="b2r_min_read_length" type="integer" label="Minimum length of read to output (defaul=250)" optional="true"/>
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
88 </section>
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
89
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
90 <section name="fix" title="fixstart options">
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
91 <param name="fixstart_mincluster" type="integer" label="The -c|mincluster option of promer. Overrides promer's default value" optional="true"/>
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
92 <param name="fixstart_min_id" type="float" label="Minimum percent identity of promer match between contigs and gene(s) to use as start point (dafault=70)" optional="true"/>
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
93 </section>
0
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
94
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
95 </inputs>
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
96 <outputs>
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
97 <data name="output_fasta" label="Output file of rearranged contigs" format="fasta" from_work_dir="outdir/06.fixstart.fasta" />
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
98 <data name="output_log" label="Log information" format="tabular" from_work_dir="outdir/06.fixstart.log" />
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
99 </outputs>
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
100 <tests>
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
101 <test>
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
102 <param name="file_contigs" value="test_contigs.fa"/>
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
103 <param name="file_reads" value="test_reads.fq.gz"/>
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
104 <output name="output_log" file="06.fixstart.log"/>
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
105 </test>
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
106 </tests>
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
107 <help><![CDATA[
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
108 The input is a genome assembly in FASTA format and corrected PacBio or nanopore reads in FASTA or FASTQ format.
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
109 Circlator will attempt to identify each circular sequence and output a linearised version of it.
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
110 It does this by assembling all reads that map to contig ends and comparing the resulting contigs with the input assembly.
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
111
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
112 The input assembly must not be too fragmented. Although Circlator will join contigs together, whenever it can identify contigs that can be
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
113 unambiguously joined, its main aim is to circularize the core genome and plasmids.
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
114
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
115 Any contigs that were identified as circular then have their start position changed.
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
116
1
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
117 Currently it does not download the uniprot database and it does not run the minimus2 pipeline. Even when running canu it may give warning messages about the SPAdes version,
34810a7283ba planemo upload
leomrtns
parents: 0
diff changeset
118 you can safely ignore those.
0
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
119 ]]></help>
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
120 <citations>
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
121 <citation type="bibtex">
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
122 @misc{github,
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
123 publisher = {GitHub},
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
124 journal = {GitHub repository},
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
125 url = {https://github.com/sanger-pathogens/circlator/},
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
126 }</citation>
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
127 </citations>
7b25bfc2606f planemo upload
leomrtns
parents:
diff changeset
128 </tool>