Mercurial > repos > greg > assembly_post_processor
comparison assembly_post_processor.xml @ 0:cecea7fdccf8 draft
Uploaded
author | greg |
---|---|
date | Fri, 09 Dec 2016 08:42:22 -0500 |
parents | |
children | 974edd8437e2 |
comparison
equal
deleted
inserted
replaced
-1:000000000000 | 0:cecea7fdccf8 |
---|---|
1 <tool id="plant_tribes_assembly_post_processor" name="PlantTribes AssemblyPostProcessor" version="1.0.0"> | |
2 <description>pipeline</description> | |
3 <requirements> | |
4 <requirement type="package" version="0.2">plant_tribes_assembly_post_processor</requirement> | |
5 </requirements> | |
6 <stdio> | |
7 <!-- Anything other than zero is an error --> | |
8 <exit_code range="1:" /> | |
9 <!-- In case the return code has not been set properly check stderr too --> | |
10 <regex match="Error:" /> | |
11 <regex match="Exception:" /> | |
12 </stdio> | |
13 <command> | |
14 <![CDATA[ | |
15 AssemblyPostProcesser | |
16 --transcripts "$input" | |
17 --prediction_method $prediction_method_cond.prediction_method | |
18 #if str($prediction_method_cond.prediction_method) == 'estscan': | |
19 --score_matrices "$score_matrices" | |
20 #end if | |
21 #if str($options_type.options_type_selector) == 'advanced': | |
22 #if str($options_type.target_gene_family_assembly_cond.target_gene_family_assembly) == 'yes': | |
23 --gene_family_search "$options_type.target_gene_family_assembly_cond.orthogroups" | |
24 --scaffold "$options_type.target_gene_family_assembly_cond.scaffold" | |
25 --method "$options_type.target_gene_family_assembly_cond.method" | |
26 #end if | |
27 --gap_trimming $options_type.gap_trimming | |
28 #if str($options_type.strand_specific) == 'yes': | |
29 --strand_specific | |
30 #end if | |
31 #if str($options_type.dereplicate) == 'yes': | |
32 --dereplicate | |
33 #end if | |
34 --min_length $options_type.min_length | |
35 #end if | |
36 --num_threads \${GALAXY_SLOTS:-4} | |
37 ]]> | |
38 </command> | |
39 <inputs> | |
40 <param name="input" format="fasta" type="data" label="De novo transcriptome assembly fasta file"/> | |
41 <conditional name="prediction_method_cond"> | |
42 <param name="prediction_method" type="select" label="Prediction method for coding regions"> | |
43 <option value="transdecoder" selected="true">TransDecoder</option> | |
44 <option value="estscan">ESTScan</option> | |
45 </param> | |
46 <when value="transdecoder" /> | |
47 <when value="estscan"> | |
48 <param name="score_matrices" format="smat" type="data" label="Scores matrices"/> | |
49 </when> | |
50 </conditional> | |
51 <conditional name="options_type"> | |
52 <param name="options_type_selector" type="select" label="Options Configuration"> | |
53 <option value="basic" selected="true">Basic</option> | |
54 <option value="advanced">Advanced</option> | |
55 </param> | |
56 <when value="basic" /> | |
57 <when value="advanced"> | |
58 <conditional name="target_gene_family_assembly_cond"> | |
59 <param name="target_gene_family_assembly" type="select" label="Target gene family assembly?"> | |
60 <option value="no" selected="true">No</option> | |
61 <option value="yes">Yes</option> | |
62 </param> | |
63 <when value="no" /> | |
64 <when value="yes"> | |
65 <param name="orthogroups" format="tabular" type="data" label="List of orthogroup identifiers for target gene families to assemble"/> | |
66 <param name="scaffold" type="select" label="Orthogroups or gene families proteins scaffold"> | |
67 <options from_data_table="plant_tribes_scaffolds" /> | |
68 <validator type="no_options" message="No PlantTribes scaffolds are available. Use the PlantTribes Scaffolds Download Data Manager tool to install and populate the PlantTribes scaffolds data table."/> | |
69 </param> | |
70 <param name="method" type="select" label="Protein clustering method"> | |
71 <option value="gfam" selected="true">GFam</option> | |
72 <option value="orthofinder">OrthoFinder</option> | |
73 <option value="orthomcl">OrthoMCL</option> | |
74 </param> | |
75 </when> | |
76 </conditional> | |
77 <param name="gap_trimming" type="float" value="0.1" min="0" max="1.0" label="Remove gappy sites in alignments" help="0.1 removes sites with 90% gaps"/> | |
78 <param name="strand_specific" type="select" label="De novo transcriptome assembly was performed with strand-specific library?"> | |
79 <option value="no" selected="true">No</option> | |
80 <option value="yes">Yes</option> | |
81 </param> | |
82 <param name="dereplicate" type="select" label="Remove repeated sequences in predicted coding regions?"> | |
83 <option value="no" selected="true">No</option> | |
84 <option value="yes">Yes</option> | |
85 </param> | |
86 <param name="min_length" type="integer" value="200" label="Minimum sequence length of predicted coding regions"/> | |
87 </when> | |
88 </conditional> | |
89 </inputs> | |
90 <outputs> | |
91 <collection name="transcripts" type="list"> | |
92 <discover_datasets pattern="__name__" directory="assemblyPostProcessing_dir" visible="false" ext="fasta" /> | |
93 </collection> | |
94 </outputs> | |
95 <tests> | |
96 <test> | |
97 <param name="input" value="assembly.fasta" ftype="fasta" /> | |
98 <param name="prediction_method" value="transdecoder" /> | |
99 <param name="options_type_selector" value="advanced" /> | |
100 <param name="strand_specific" value="yes" /> | |
101 <param name="dereplicate" value="yes" /> | |
102 <output_collection name="transcripts" type="list"> | |
103 <element name="transcripts.cds" file="transcripts.cds" ftype="fasta" /> | |
104 <element name="transcripts.cleaned.cds" file="transcripts.cleaned.cds" ftype="fasta" /> | |
105 <element name="transcripts.cleaned.nr.cds" file="transcripts.cleaned.nr.cds" ftype="fasta" /> | |
106 <element name="transcripts.cleaned.nr.pep" file="transcripts.cleaned.nr.pep" ftype="fasta" /> | |
107 <element name="transcripts.cleaned.pep" file="transcripts.cleaned.pep" ftype="fasta" /> | |
108 <element name="transcripts.pep" file="transcripts.pep" ftype="fasta" /> | |
109 </output_collection> | |
110 </test> | |
111 </tests> | |
112 <help> | |
113 This tool is one of the PlantTribes' collection of automated modular analysis pipelines that utilize objective classifications of | |
114 complete protein sequences from sequenced plant genomes to perform comparative evolutionary studies. It post-processes de novo assembly | |
115 transcripts into putative coding sequences and their corresponding amino acid translations. | |
116 | |
117 ----- | |
118 | |
119 **Options** | |
120 | |
121 * **Prediction method for coding regions** - The prediction method for coding regions; one of ESTScan or TransDecoder. | |
122 * **Scores matrices** - Scores matrices that reflect the codons preferences in the studied organisms. | |
123 * **Target gene family assembly?** - Select yes to target gene families to assemble. | |
124 * **List of orthogroup identifiers for target gene families to assemble** - History item with a list of orthogroup identifiers for target gene families to assemble. The next version of this tool will use a dynamic select list for this feature. | |
125 * **Orthogroups or gene families proteins scaffold** - PlantTribes scaffolds data. | |
126 * **Protein clustering method** - One of GFam, OrthoFinder or OrthoMCL. | |
127 * **Remove gappy sites in alignments** - Removes gappy sites in alignments (i.e. 0.1 removes sites with 90% gaps): [0.0 to 1.0] | |
128 * **De novo transcriptome assembly was performed with strand-specific library?** - Select yes if de novo transcriptome assembly was performed with strand-specific library. | |
129 * **Remove repeated sequences in predicted coding regions?** - Select yes to remove repeated sequences in predicted coding regions. | |
130 * **Minimum sequence length of predicted coding regions** - Set the minimum sequence length of predicted coding regions. | |
131 | |
132 </help> | |
133 <citations> | |
134 <citation type="bibtex"> | |
135 @unpublished{None, | |
136 author = {None}, | |
137 title = {None}, | |
138 year = {None}, | |
139 eprint = {None}, | |
140 url = {None} | |
141 }</citation> | |
142 </citations> | |
143 </tool> |