comparison phylogenomics_analysis.xml @ 41:6b547036c627 draft

Uploaded
author greg
date Thu, 02 Feb 2017 14:41:59 -0500
parents 0bf214a0646a
children 7e92ab9ee98a
comparison
equal deleted inserted replaced
40:0bf214a0646a 41:6b547036c627
18 18
19 #set scaffold_path = $scaffold.fields.path 19 #set scaffold_path = $scaffold.fields.path
20 #set scaffold_dir = $os.path.split($scaffold_path)[0] 20 #set scaffold_dir = $os.path.split($scaffold_path)[0]
21 #set scaffold_selection = $os.path.split($scaffold_path)[1] 21 #set scaffold_selection = $os.path.split($scaffold_path)[1]
22 #set src_fasta_dir = $os.path.join('phylogenomicsAnalysis_dir', 'orthogroups_fasta') 22 #set src_fasta_dir = $os.path.join('phylogenomicsAnalysis_dir', 'orthogroups_fasta')
23 #set dest_fasta_dir = $output_fasta.extra_files_path 23 #if str($input.ext) == 'ptcgf':
24 #set dest_fasta_dir = $output_fasta_ptcgf.extra_files_path
25 else:
26 #set dest_fasta_dir =$output_fasta_ptcgfcs.extra_files_path
27 #end if
24 28
25 #if str($options_type.options_type_selector) == 'advanced' and str($options_type.multiple_sequence_alignments_cond.multiple_sequence_alignments) == 'yes': 29 #if str($options_type.options_type_selector) == 'advanced' and str($options_type.multiple_sequence_alignments_cond.multiple_sequence_alignments) == 'yes':
26 #set generate_output_aln = True 30 #set generate_output_aln = True
27 #set src_aln_dir = $os.path.join('phylogenomicsAnalysis_dir', 'orthogroups_aln') 31 #set src_aln_dir = $os.path.join('phylogenomicsAnalysis_dir', 'orthogroups_aln')
28 #set dest_aln_dir = $output_aln.extra_files_path 32 #set dest_aln_dir = $output_aln.extra_files_path
89 93
90 #if str($input_includes_coding_sequences) == 'yes': 94 #if str($input_includes_coding_sequences) == 'yes':
91 #if str($multiple_codon_alignments) == 'yes': 95 #if str($multiple_codon_alignments) == 'yes':
92 --codon_alignments 96 --codon_alignments
93 #if str($use_corresponding_coding_sequences) == 'yes': 97 #if str($use_corresponding_coding_sequences) == 'yes':
94 #if str($input.ext) == 'pgfccs): 98 #if str($input.ext) == 'ptcgfcs):
95 --orthogroup_fna 99 --orthogroup_fna
96 #else: 100 #else:
97 raise Exception("Selected input does not include corresponding coding sequences") 101 raise Exception("Selected input does not include corresponding coding sequences")
98 #end if 102 #end if
99 #end if 103 #end if
131 #end if 135 #end if
132 #end if 136 #end if
133 #end if 137 #end if
134 #end if 138 #end if
135 139
136 && echo "Sequence alignments and corresponding phylogenies: `ls $src_fasta_dir | grep f | wc -l` files" > $output_fasta 140 #if str($input.ext) == 'ptcgf':
137 && ls -al $src_fasta_dir | grep f >> $output_fasta 141 && echo "Sequence alignments and corresponding phylogenies: `ls $src_fasta_dir | grep f | wc -l` files" > $output_fasta_ptcgf
142 && ls -al $src_fasta_dir | grep f >> $output_fasta_ptcgf
143 #else:
144 && echo "Sequence alignments and corresponding phylogenies: `ls $src_fasta_dir | grep f | wc -l` files" > $output_fasta_ptcgfcs
145 && ls -al $src_fasta_dir | grep f >> $output_fasta_ptcgfcs
146 #end if
138 && mv $src_fasta_dir/* $dest_fasta_dir || true 147 && mv $src_fasta_dir/* $dest_fasta_dir || true
139 148
140 #if $generate_output_aln: 149 #if $generate_output_aln:
141 && echo "Multiple sequence alignments using method '$multiple_sequence_alignments_option' (note that some files may be empty): `ls $src_aln_dir | grep f | wc -l` files" > $output_aln 150 && echo "Multiple sequence alignments using method '$multiple_sequence_alignments_option' (note that some files may be empty): `ls $src_aln_dir | grep f | wc -l` files" > $output_aln
142 && ls -al $src_aln_dir | grep f >> $output_aln 151 && ls -al $src_aln_dir | grep f >> $output_aln
149 && mv $src_tree_dir/* $dest_tree_dir || true 158 && mv $src_tree_dir/* $dest_tree_dir || true
150 #end if 159 #end if
151 ]]> 160 ]]>
152 </command> 161 </command>
153 <inputs> 162 <inputs>
154 <param name="input" format="pgfc,pgfccs" type="data" label="Select gene family clusters" help="Selection may optionally include corresponding coding sequences"/> 163 <param name="input" format="ptcgf,ptcgfcs" type="data" label="Select gene family clusters" help="Selection may optionally include corresponding coding sequences"/>
155 <param name="scaffold" type="select" label="Orthogroups or gene families proteins scaffold"> 164 <param name="scaffold" type="select" label="Orthogroups or gene families proteins scaffold">
156 <options from_data_table="plant_tribes_scaffolds" /> 165 <options from_data_table="plant_tribes_scaffolds" />
157 <validator type="no_options" message="No PlantTribes scaffolds are available. Use the PlantTribes Scaffolds Download Data Manager tool to install and populate the PlantTribes scaffolds data table."/> 166 <validator type="no_options" message="No PlantTribes scaffolds are available. Use the PlantTribes Scaffolds Download Data Manager tool to install and populate the PlantTribes scaffolds data table."/>
158 </param> 167 </param>
159 <param name="method" type="select" label="Protein clustering method"> 168 <param name="method" type="select" label="Protein clustering method">
281 </conditional> 290 </conditional>
282 </when> 291 </when>
283 </conditional> 292 </conditional>
284 </inputs> 293 </inputs>
285 <outputs> 294 <outputs>
286 <data name="output_fasta" format="txt" label="Sequence alignments and corresponding phylogenies on ${on_string}"/> 295 <data name="output_fasta_ptcgf" format="ptcgf" label="Sequence alignments and corresponding phylogenies on ${on_string}">
296 <filter>input.ext == 'ptcgf'</filter>
297 </data>
298 <data name="output_fasta_ptcgfcs" format="ptcgfcs" label="Sequence alignments and corresponding phylogenies on ${on_string}">
299 <filter>input.ext == 'ptcgfcs'</filter>
300 </data>
287 <data name="output_aln" format="txt" label="Multiple alignments on ${on_string}"> 301 <data name="output_aln" format="txt" label="Multiple alignments on ${on_string}">
288 <filter>options_type['options_type_selector'] == 'advanced' and options_type['multiple_sequence_alignments_cond']['multiple_sequence_alignments'] == 'yes'</filter> 302 <filter>options_type['options_type_selector'] == 'advanced' and options_type['multiple_sequence_alignments_cond']['multiple_sequence_alignments'] == 'yes'</filter>
289 </data> 303 </data>
290 <data name="output_tree" format="txt" label="Phylogenetic trees on ${on_string}"> 304 <data name="output_tree" format="ptpt" label="Phylogenetic trees on ${on_string}">
291 <filter>options_type['options_type_selector'] == 'advanced' and options_type['phylogenetic_trees_cond']['phylogenetic_trees'] == 'yes'</filter> 305 <filter>options_type['options_type_selector'] == 'advanced' and options_type['phylogenetic_trees_cond']['phylogenetic_trees'] == 'yes'</filter>
292 </data> 306 </data>
293 </outputs> 307 </outputs>
294 <tests> 308 <tests>
295 <test> 309 <test>
312 - **Protein clustering method** - One of GFam (domain architecture based clustering), OrthoFinder (broadly defined clusters) or OrthoMCL (narrowly defined clusters). 326 - **Protein clustering method** - One of GFam (domain architecture based clustering), OrthoFinder (broadly defined clusters) or OrthoMCL (narrowly defined clusters).
313 327
314 * **Multiple sequence alignments options** 328 * **Multiple sequence alignments options**
315 329
316 - **Select method for multiple sequence alignments** - Method used for setting multiple sequence alignments. 330 - **Select method for multiple sequence alignments** - Method used for setting multiple sequence alignments.
317 - **Input sequences include corresponding coding sequences?** - Selecting 'Yes' for this option requires that the selected input data format is 'pgfccs'. 331 - **Input sequences include corresponding coding sequences?** - Selecting 'Yes' for this option requires that the selected input data format is 'ptcgfcs'.
318 - **Construct orthogroup multiple codon alignments?** - Construct orthogroup multiple codon alignments. 332 - **Construct orthogroup multiple codon alignments?** - Construct orthogroup multiple codon alignments.
319 - **Sequence type used in the phylogenetic inference** - Sequence type (dna or amino acid) used in the phylogenetic inference. 333 - **Sequence type used in the phylogenetic inference** - Sequence type (dna or amino acid) used in the phylogenetic inference.
320 - **Use corresponding coding sequences?** - Selecting 'Yes' for this option requires that the selected input data format is 'pgfccs' or this tool will produce an error. 334 - **Use corresponding coding sequences?** - Selecting 'Yes' for this option requires that the selected input data format is 'ptcgfcs' or this tool will produce an error.
321 335
322 * **Phylogenetic trees options** 336 * **Phylogenetic trees options**
323 337
324 - **Phylogenetic trees inference method** - Phylogenetic trees inference method. 338 - **Phylogenetic trees inference method** - Phylogenetic trees inference method.
325 - **Select history item containing strings matching sequence identifiers of species for determining the most basal taxa in the orthogroups for rooting trees?** - If 'No' is selected, trees will be rooted using the most distant taxon present in the orthogroup. 339 - **Select history item containing strings matching sequence identifiers of species for determining the most basal taxa in the orthogroups for rooting trees?** - If 'No' is selected, trees will be rooted using the most distant taxon present in the orthogroup.