comparison assembly_post_processor.xml @ 0:cecea7fdccf8 draft

Uploaded
author greg
date Fri, 09 Dec 2016 08:42:22 -0500
parents
children 974edd8437e2
comparison
equal deleted inserted replaced
-1:000000000000 0:cecea7fdccf8
1 <tool id="plant_tribes_assembly_post_processor" name="PlantTribes AssemblyPostProcessor" version="1.0.0">
2 <description>pipeline</description>
3 <requirements>
4 <requirement type="package" version="0.2">plant_tribes_assembly_post_processor</requirement>
5 </requirements>
6 <stdio>
7 <!-- Anything other than zero is an error -->
8 <exit_code range="1:" />
9 <!-- In case the return code has not been set properly check stderr too -->
10 <regex match="Error:" />
11 <regex match="Exception:" />
12 </stdio>
13 <command>
14 <![CDATA[
15 AssemblyPostProcesser
16 --transcripts "$input"
17 --prediction_method $prediction_method_cond.prediction_method
18 #if str($prediction_method_cond.prediction_method) == 'estscan':
19 --score_matrices "$score_matrices"
20 #end if
21 #if str($options_type.options_type_selector) == 'advanced':
22 #if str($options_type.target_gene_family_assembly_cond.target_gene_family_assembly) == 'yes':
23 --gene_family_search "$options_type.target_gene_family_assembly_cond.orthogroups"
24 --scaffold "$options_type.target_gene_family_assembly_cond.scaffold"
25 --method "$options_type.target_gene_family_assembly_cond.method"
26 #end if
27 --gap_trimming $options_type.gap_trimming
28 #if str($options_type.strand_specific) == 'yes':
29 --strand_specific
30 #end if
31 #if str($options_type.dereplicate) == 'yes':
32 --dereplicate
33 #end if
34 --min_length $options_type.min_length
35 #end if
36 --num_threads \${GALAXY_SLOTS:-4}
37 ]]>
38 </command>
39 <inputs>
40 <param name="input" format="fasta" type="data" label="De novo transcriptome assembly fasta file"/>
41 <conditional name="prediction_method_cond">
42 <param name="prediction_method" type="select" label="Prediction method for coding regions">
43 <option value="transdecoder" selected="true">TransDecoder</option>
44 <option value="estscan">ESTScan</option>
45 </param>
46 <when value="transdecoder" />
47 <when value="estscan">
48 <param name="score_matrices" format="smat" type="data" label="Scores matrices"/>
49 </when>
50 </conditional>
51 <conditional name="options_type">
52 <param name="options_type_selector" type="select" label="Options Configuration">
53 <option value="basic" selected="true">Basic</option>
54 <option value="advanced">Advanced</option>
55 </param>
56 <when value="basic" />
57 <when value="advanced">
58 <conditional name="target_gene_family_assembly_cond">
59 <param name="target_gene_family_assembly" type="select" label="Target gene family assembly?">
60 <option value="no" selected="true">No</option>
61 <option value="yes">Yes</option>
62 </param>
63 <when value="no" />
64 <when value="yes">
65 <param name="orthogroups" format="tabular" type="data" label="List of orthogroup identifiers for target gene families to assemble"/>
66 <param name="scaffold" type="select" label="Orthogroups or gene families proteins scaffold">
67 <options from_data_table="plant_tribes_scaffolds" />
68 <validator type="no_options" message="No PlantTribes scaffolds are available. Use the PlantTribes Scaffolds Download Data Manager tool to install and populate the PlantTribes scaffolds data table."/>
69 </param>
70 <param name="method" type="select" label="Protein clustering method">
71 <option value="gfam" selected="true">GFam</option>
72 <option value="orthofinder">OrthoFinder</option>
73 <option value="orthomcl">OrthoMCL</option>
74 </param>
75 </when>
76 </conditional>
77 <param name="gap_trimming" type="float" value="0.1" min="0" max="1.0" label="Remove gappy sites in alignments" help="0.1 removes sites with 90% gaps"/>
78 <param name="strand_specific" type="select" label="De novo transcriptome assembly was performed with strand-specific library?">
79 <option value="no" selected="true">No</option>
80 <option value="yes">Yes</option>
81 </param>
82 <param name="dereplicate" type="select" label="Remove repeated sequences in predicted coding regions?">
83 <option value="no" selected="true">No</option>
84 <option value="yes">Yes</option>
85 </param>
86 <param name="min_length" type="integer" value="200" label="Minimum sequence length of predicted coding regions"/>
87 </when>
88 </conditional>
89 </inputs>
90 <outputs>
91 <collection name="transcripts" type="list">
92 <discover_datasets pattern="__name__" directory="assemblyPostProcessing_dir" visible="false" ext="fasta" />
93 </collection>
94 </outputs>
95 <tests>
96 <test>
97 <param name="input" value="assembly.fasta" ftype="fasta" />
98 <param name="prediction_method" value="transdecoder" />
99 <param name="options_type_selector" value="advanced" />
100 <param name="strand_specific" value="yes" />
101 <param name="dereplicate" value="yes" />
102 <output_collection name="transcripts" type="list">
103 <element name="transcripts.cds" file="transcripts.cds" ftype="fasta" />
104 <element name="transcripts.cleaned.cds" file="transcripts.cleaned.cds" ftype="fasta" />
105 <element name="transcripts.cleaned.nr.cds" file="transcripts.cleaned.nr.cds" ftype="fasta" />
106 <element name="transcripts.cleaned.nr.pep" file="transcripts.cleaned.nr.pep" ftype="fasta" />
107 <element name="transcripts.cleaned.pep" file="transcripts.cleaned.pep" ftype="fasta" />
108 <element name="transcripts.pep" file="transcripts.pep" ftype="fasta" />
109 </output_collection>
110 </test>
111 </tests>
112 <help>
113 This tool is one of the PlantTribes' collection of automated modular analysis pipelines that utilize objective classifications of
114 complete protein sequences from sequenced plant genomes to perform comparative evolutionary studies. It post-processes de novo assembly
115 transcripts into putative coding sequences and their corresponding amino acid translations.
116
117 -----
118
119 **Options**
120
121 * **Prediction method for coding regions** - The prediction method for coding regions; one of ESTScan or TransDecoder.
122 * **Scores matrices** - Scores matrices that reflect the codons preferences in the studied organisms.
123 * **Target gene family assembly?** - Select yes to target gene families to assemble.
124 * **List of orthogroup identifiers for target gene families to assemble** - History item with a list of orthogroup identifiers for target gene families to assemble. The next version of this tool will use a dynamic select list for this feature.
125 * **Orthogroups or gene families proteins scaffold** - PlantTribes scaffolds data.
126 * **Protein clustering method** - One of GFam, OrthoFinder or OrthoMCL.
127 * **Remove gappy sites in alignments** - Removes gappy sites in alignments (i.e. 0.1 removes sites with 90% gaps): [0.0 to 1.0]
128 * **De novo transcriptome assembly was performed with strand-specific library?** - Select yes if de novo transcriptome assembly was performed with strand-specific library.
129 * **Remove repeated sequences in predicted coding regions?** - Select yes to remove repeated sequences in predicted coding regions.
130 * **Minimum sequence length of predicted coding regions** - Set the minimum sequence length of predicted coding regions.
131
132 </help>
133 <citations>
134 <citation type="bibtex">
135 @unpublished{None,
136 author = {None},
137 title = {None},
138 year = {None},
139 eprint = {None},
140 url = {None}
141 }</citation>
142 </citations>
143 </tool>