comparison checkm_lineage_wf.xml @ 0:cb30bd36bfd0 draft default tip

planemo upload
author leomrtns
date Wed, 02 Oct 2019 10:51:58 -0400
parents
children
comparison
equal deleted inserted replaced
-1:000000000000 0:cb30bd36bfd0
1 <tool id="checkm_lineage_wf" name="checkm lineage_wf" version="@TOOL_VERSION@">
2 <description>Runs tree, lineage_set, analyze, qa</description>
3 <macros>
4 <import>macros.xml</import>
5 <import>plot_macros.xml</import>
6 <import>tool-macros.xml</import>
7 </macros>
8 <expand macro="requirements"/>
9 <expand macro="stdio"/>
10 <expand macro="version_command"/>
11 <command><![CDATA[
12 echo {\"dataRoot\": \"$checkm_databases.fields.path\", \"remoteManifestURL\": \"https://data.ace.uq.edu.au/public/CheckM_databases/\", \"manifestType\": \"CheckM\", \"localManifestName\": \".dmanifest\", \"remoteManifestName\": \".dmanifest\"} > \${CONDA_PREFIX}/lib/python2.7/site-packages/checkm/DATA_CONFIG &&
13 mkdir bin_folder &&
14 #for $k, $f in enumerate($bin_folder)
15 #if $f
16 ln -s "${f}" bin_folder/${k}.fna &&
17 #end if
18 #end for
19
20 checkm lineage_wf
21 bin_folder
22 '$output.extra_files_path'
23 $reduced_tree
24 $ali
25 $nt
26 $genes
27 #if $unique and $unique is not None:
28 --unique $unique
29 #end if
30 #if $multi and $multi is not None:
31 --multi $multi
32 #end if
33 $force_domain
34 $no_refinement
35 $individual_markers
36 $skip_adj_correction
37 $skip_pseudogene_correction
38 #if $aai_strain and $aai_strain is not None:
39 --aai_strain $aai_strain
40 #end if
41 #if $alignment_file == "true":
42 --alignment_file $alignment_file_output
43 #end if
44 $ignore_thresholds
45 #if $e_value and $e_value is not None:
46 --e_value $e_value
47 #end if
48 #if $length and $length is not None:
49 --length $length
50 #end if
51 --tab_table
52 --threads \${GALAXY_SLOTS:-1}
53 > '$output'
54 #if str($ali) == "--ali" or str($nt) == "--nt":
55 &&if [ -d '$output.extra_files_path' ]; then
56 cp -r '$output.extra_files_path' out_folder;
57 fi
58 #end if
59
60 ## link hmmer alignments per bin in one dir to make them discoverable
61 #if str($ali) == "--ali":
62 && for k in `ls out_folder/bins/`; do
63 if [ -f out_folder/bins/\$k/hmmer.tree.txt ]; then
64 ln -s \$k/hmmer.tree.txt out_folder/bins/hmmer.tree.\$k.txt;
65 fi;
66 if [ -f out_folder/bins/\$k/hmmer.analyze.txt ]; then
67 ln -s \$k/hmmer.analyze.txt out_folder/bins/hmmer.analyze.\$k.txt;
68 fi;
69 done
70 #end if## link nucleotide sequences per bin in one dir to make them discoverable
71 #if str($nt) == "--nt":
72 && for k in `ls out_folder/bins/`; do
73 if [ -f out_folder/bins/\$k/genes.fna ]; then
74 ln -s \$k/genes.fna out_folder/bins/\$k.genes.fna;
75 fi;
76 done
77 #end if]]></command>
78 <inputs>
79 <param name="bin_folder" type="data" label="bins" multiple="true" format="fasta"/>
80 <param argument="--reduced_tree" checked="false" label="use reduced tree (requires &lt;16GB of memory) for determining lineage of each bin" name="reduced_tree" type="boolean" truevalue="--reduced_tree" falsevalue=""/>
81 <param argument="--ali" checked="false" label="generate HMMER alignment file for each bin" name="ali" type="boolean" truevalue="--ali" falsevalue=""/>
82 <param argument="--nt" checked="false" label="generate nucleotide gene sequences for each bin" name="nt" type="boolean" truevalue="--nt" falsevalue=""/>
83 <param argument="--genes" checked="false" label="bins contain genes as amino acids instead of nucleotide contigs" name="genes" type="boolean" truevalue="--genes" falsevalue=""/>
84 <param argument="--unique" label="minimum number of unique phylogenetic markers required to use lineage-specific marker set" name="unique" optional="true" type="integer" value="10"/>
85 <param argument="--multi" label="maximum number of multi-copy phylogenetic markers before defaulting to domain-level marker set" name="multi" optional="true" type="integer" value="10"/>
86 <param argument="--force_domain" checked="false" label="use domain-level sets for all bins" name="force_domain" type="boolean" truevalue="--force_domain" falsevalue=""/>
87 <param argument="--no_refinement" checked="false" label="do not perform lineage-specific marker set refinement" name="no_refinement" type="boolean" truevalue="--no_refinement" falsevalue=""/>
88 <param argument="--individual_markers" checked="false" label="treat marker as independent (i.e., ignore co-located set structure)" name="individual_markers" type="boolean" truevalue="--individual_markers" falsevalue=""/>
89 <param argument="--skip_adj_correction" checked="false" label="do not exclude adjacent marker genes when estimating contamination" name="skip_adj_correction" type="boolean" truevalue="--skip_adj_correction" falsevalue=""/>
90 <param argument="--skip_pseudogene_correction" checked="false" label="skip identification and filtering of pseudogenes" name="skip_pseudogene_correction" type="boolean" truevalue="--skip_pseudogene_correction" falsevalue=""/>
91 <param argument="--aai_strain" label="AAI threshold used to identify strain heterogeneity" name="aai_strain" optional="true" type="float" value="0.9"/>
92 <param argument="--alignment_file" label="produce file showing alignment of multi-copy genes and their AAI identity" name="alignment_file" type="boolean" truevalue="true" falsevalue="false" checked="false" />
93 <param argument="--ignore_thresholds" checked="false" label="ignore model-specific score thresholds" name="ignore_thresholds" type="boolean" truevalue="--ignore_thresholds" falsevalue=""/>
94 <param argument="--e_value" label="e-value cut off" name="e_value" optional="true" type="float" value="1e-10"/>
95 <param argument="--length" label="percent overlap between target and query" name="length" optional="true" type="float" value="0.7"/>
96
97 <param label="Select a database" name="checkm_databases" type="select">
98 <options from_data_table="checkm_databases">
99 <validator message="No database is available" type="no_options" />
100 </options>
101 </param>
102
103
104 </inputs>
105 <outputs>
106 <data name="alignment_file_output" format="txt" hidden="false" label="${tool.name} on ${on_string} (alignment)"><filter>alignment_file</filter></data>
107 <collection name="hmmer_nucleotide_per_bin" type="list" label="${tool.name} on ${on_string} (nucleotide gene sequences per bin)">
108 <filter>nt</filter>
109 <discover_datasets directory="out_folder/bins/" pattern="(?P&lt;designation&gt;.+).genes.fna" ext="fasta" />
110 </collection>
111 <collection name="hmmer_alignment_per_bin" type="list" label="${tool.name} on ${on_string} (HMMER alignments per bin)">
112 <filter>ali</filter>
113 <discover_datasets directory="out_folder/bins/" pattern="hmmer.(?P&lt;designation&gt;.+).txt" ext="txt" />
114 </collection>
115 <data name="output" format="tabular" hidden="false" label="${tool.name} on ${on_string}"/>
116 </outputs>
117 <tests>
118 <expand macro="tests"/>
119 </tests>
120 <help><![CDATA[Example: checkm lineage_wf ./bins ./output]]></help>
121 <expand macro="citations"/>
122 </tool>