comparison ectyper.xml @ 0:954b1b1ef3fb draft

planemo upload for repository https://github.com/phac-nml/galaxy_tools/tree/master/tools/ectyper commit f574c20c5f06498727d186afc4d1a92f5344eb59
author nml
date Wed, 18 Dec 2024 22:36:31 +0000
parents
children 4b4a7d9f7c9e
comparison
equal deleted inserted replaced
-1:000000000000 0:954b1b1ef3fb
1 <tool id="ectyper" name="ectyper" version="1.0.0">
2 <description>ectyper is a standalone serotyping module for Escherichia coli. It supports fasta and fastq file formats.</description>
3 <xrefs>
4 <xref type="bio.tools">ectyper</xref>
5 </xrefs>
6 <requirements>
7 <requirement type="package" version="1.0.0">ectyper</requirement>
8 </requirements>
9 <command detect_errors="exit_code">
10 <![CDATA[
11 #set $genomes = ''
12 #if hasattr($input, '__iter__')
13 #for $i in $input
14 ln -s "${i}" "${i.element_identifier}" &&
15 #if len($genomes) > 0
16 #set $genomes = $genomes + ',' + str($i.element_identifier)
17 #else
18 #set $genomes = str($i.element_identifier)
19 #end if
20 #end for
21 #else
22 ln -s "${input}" "${input.element_identifier}" &&
23 #set $genomes = $input.element_identifier
24 #end if
25
26 #if $adv_param.mash_input
27 ln -s "${adv_param.mash_input}" mash_sketch.msh &&
28 #end if
29
30
31 #if $adv_param.db_input
32 ln -s "${adv_param.db_input}" custom_db.json &&
33 #end if
34
35
36 ectyper --cores \${GALAXY_SLOTS:-4}
37 --input "${genomes}"
38 -opid '$adv_param.opid'
39 -opcov '$adv_param.opcov'
40 -hpid '$adv_param.hpid'
41 -hpcov '$adv_param.hpcov'
42
43 #if $adv_param.verifyEcoli
44 --verify
45 #end if
46
47 #if $adv_param.mash_input
48 --refseq mash_sketch.msh
49 #end if
50
51 #if $adv_param.db_input
52 --dbpath custom_db.json
53 #end if
54
55 --output '.'
56 ]]>
57 </command>
58 <inputs>
59 <param name="input" type="data" format="fastq,fasta" label="Genome(s) input(s)" help="FASTA or FASTQ file(s)"/>
60 <section name="adv_param" title="Advanced parameters" expanded="False">
61 <param name="opid" label="O antigen minimum %identity" type="integer" value="90" min="1" max="100"/>
62 <param name="opcov" label="O antigen minimum %coverage" type="integer" value="90" min="1" max="100"/>
63 <param name="hpid" label="H antigen minimum %identity" type="integer" value="95" min="1" max="100"/>
64 <param name="hpcov" label="H antigen minimum %coverage" type="integer" value="50" min="1" max="100"/>
65 <param name="verifyEcoli" type="boolean" checked="true" label="Enable E. coli species verification"/>
66 <param name="blastresults" type="boolean" checked="false" label="Include BLAST allele alignment results tab-delim file in the outputs?" />
67 <param name="logging" type="boolean" checked="false" label="Include log file in the run outputs?" />
68 <param name="mash_input" type="data" optional="true" format="binary" label="Mash genome sketches (Optional)" help="Optionally provide custom MASH genome sketch to help with species identification (otherwise default RefSeq sketch is used)"/>
69 <param name="db_input" type="data" optional="true" format="json" label="Custom database of alleles (Optional)" help="Optionally provide custom database of alleles in JSON format"/>
70 </section>
71 </inputs>
72 <outputs>
73 <data name="output_result" format="tabular" from_work_dir="output.tsv" label="${tool.name} serotype report on ${input.element_identifier}"> </data>
74 <data name="output_log" format="txt" from_work_dir="ectyper.log" label="${tool.name} log file on ${input.element_identifier}">
75 <filter>adv_param['logging']==True</filter>
76 </data>
77 <data name="output_blast" format="tabular" from_work_dir="blast_output_alleles.txt" label="${tool.name} BLAST results file on ${input.element_identifier}">
78 <filter>adv_param['blastresults']==True</filter>
79 </data>
80 </outputs>
81 <tests>
82 <test expect_num_outputs="1">
83 <param name="input" value="Escherichia2.fastq"/>
84 <assert_stderr>
85 <has_text text="O22"/>
86 <has_text text="H8"/>
87 </assert_stderr>
88 <output name="output_result" ftype="tabular" >
89 <assert_contents>
90 <has_text_matching expression="O22"/>
91 </assert_contents>
92 </output>
93 </test>
94 </tests>
95
96 <help>
97 **Syntax**
98
99
100 This tool identifies the serotype of both assembled or assembly-free Escherichia coli genome samples based on a set of the key O and H antigen determinant genes including *wzm/wzt* or *wzx/wzy* and *fliC/flkA/flmA*.
101 Unique to the tool, species identification module allows for non-E.coli genomes identification including other Escherichia genus species.
102 This version improves antigen call rates on "difficult samples" by use of an adaptive threshold. This is especially useful when antigen genes are truncated or poorly covered by raw reads.
103 If no antigen call is being predicted by the tool, try to lower %coverage parameter first. For more information on the new Quality Control module and running parameter details please visit https://github.com/phac-nml/ecoli_serotyping.
104
105
106 -----
107
108 **Input:**
109
110 Accepts a variety of inputs including both single and/or multiple FASTQ and/or FASTA file(s). Inputs might contain pure raw reads, but for more accurate results, draft assemblies are recommended.
111
112
113 The default MASH RefSeq genome sketch (https://gembox.cbcb.umd.edu/mash/refseq.genomes.k21s1000.msh) containing approximately 91K genomes is included and automatically updated every 6 months.
114
115
116
117 **Output:**
118
119 Tab-delimited report listing identified O and H antigens together with corresponding the highest-scoring alleles and normalized BLAST score defined as (%identity x %coverage) / 1e4.
120 If *verifyEcoli* parameter is enabled, final report will contain allele quality control information on results for reporting purposes. PASS (REPORTABLE) QC flag means that O and H antigen calls are of sufficient to unambiguously resolve them from all other antigens.
121
122 -----
123
124 **Parameters (Optional):**
125 - **Enable E. coli species verification:** for species verification in case samples are of non-E.coli origin
126 - **Include BLAST allele alignment results tab-delim file in the outputs?** Get reference allele sequences and detailed BLAST output
127 - **Include log file in the run outputs?:** Get optional logs of the ectyper run for a more detailed results assessment and troubleshooting
128
129 </help>
130 <citations>
131 <citation type="bibtex">
132 @misc{githubectyper,
133 author = {Laing Chad},
134 title = {ECtyper - serotyping module for Escherichia coli},
135 publisher = {GitHub},
136 journal = {GitHub repository},
137 url = {https://github.com/phac-nml/ecoli_serotyping}
138 }</citation>
139 </citations>
140 </tool>