comparison phylogenomics_analysis.xml @ 51:32c3bf33cad7 draft

Uploaded
author greg
date Fri, 10 Feb 2017 09:05:32 -0500
parents ba0315c7b28b
children ebc846754dcb
comparison
equal deleted inserted replaced
50:ba0315c7b28b 51:32c3bf33cad7
1 <tool id="plant_tribes_phylogenomics_analysis" name="Create multiple sequence alignments" version="0.3"> 1 <tool id="plant_tribes_phylogenomics_analysis" name="Create multiple sequence alignments" version="0.3">
2 <description>and inferred maximum likelihood phylogenies</description> 2 <description>and inferred maximum likelihood phylogenies</description>
3 <requirements> 3 <requirements>
4 <requirement type="package" version="0.3">plant_tribes_phylogenomics_analysis</requirement> 4 <requirement type="package" version="0.3">plant_tribes_phylogenomics_analysis
5 </requirement>
5 </requirements> 6 </requirements>
6 <stdio> 7 <stdio>
7 <!-- Anything other than zero is an error --> 8 <!-- Anything other than zero is an error -->
8 <exit_code range="1:" /> 9 <exit_code range="1:" />
9 <exit_code range=":-1" /> 10 <exit_code range=":-1" />
23 #set scaffold_selection = $os.path.split($scaffold_path)[1] 24 #set scaffold_selection = $os.path.split($scaffold_path)[1]
24 #set src_aln_dir = $os.path.join($pipeline_output_dir, 'orthogroups_aln') 25 #set src_aln_dir = $os.path.join($pipeline_output_dir, 'orthogroups_aln')
25 #set src_fasta_dir = $os.path.join($pipeline_output_dir, 'orthogroups_fasta') 26 #set src_fasta_dir = $os.path.join($pipeline_output_dir, 'orthogroups_fasta')
26 #set src_tree_dir = $os.path.join($pipeline_output_dir, 'orthogroups_tree') 27 #set src_tree_dir = $os.path.join($pipeline_output_dir, 'orthogroups_tree')
27 28
28 #if str($input_format) == 'ptcgf': 29 #if str($input_format) == 'ptortho':
29 #set dest_fasta_dir = $output_fasta_ptcgf.extra_files_path 30 #set dest_fasta_dir = $output_fasta_ptortho.extra_files_path
30 #set multiple_codon_alignments = 'no' 31 #set multiple_codon_alignments = 'no'
31 #set use_corresponding_coding_sequences = 'no' 32 #set use_corresponding_coding_sequences = 'no'
32 #else: 33 #else:
33 #set dest_fasta_dir = $output_fasta_ptcgfcs.extra_files_path 34 #set dest_fasta_dir = $output_fasta_ptorthocs.extra_files_path
34 #set multiple_codon_alignments_cond = $input_format_cond.multiple_codon_alignments_cond 35 #set multiple_codon_alignments_cond = $input_format_cond.multiple_codon_alignments_cond
35 #set multiple_codon_alignments = $multiple_codon_alignments_cond.multiple_codon_alignments 36 #set multiple_codon_alignments = $multiple_codon_alignments_cond.multiple_codon_alignments
36 #if str($multiple_codon_alignments) == 'yes': 37 #if str($multiple_codon_alignments) == 'yes':
37 #set use_corresponding_coding_sequences_cond = $multiple_codon_alignments_cond.use_corresponding_coding_sequences_cond 38 #set use_corresponding_coding_sequences_cond = $multiple_codon_alignments_cond.use_corresponding_coding_sequences_cond
38 #set use_corresponding_coding_sequences = $use_corresponding_coding_sequences_cond.use_corresponding_coding_sequences 39 #set use_corresponding_coding_sequences = $use_corresponding_coding_sequences_cond.use_corresponding_coding_sequences
66 #set generate_output_tree = False 67 #set generate_output_tree = False
67 #end if 68 #end if
68 69
69 PhylogenomicsAnalysis 70 PhylogenomicsAnalysis
70 --num_threads \${GALAXY_SLOTS:-4} 71 --num_threads \${GALAXY_SLOTS:-4}
71 #if str($input_format) == 'ptcgf': 72 #if str($input_format) == 'ptortho':
72 --orthogroup_faa '$input_format_cond.input_ptcgf.extra_files_path' 73 --orthogroup_faa '$input_format_cond.input_ptortho.extra_files_path'
73 #else: 74 #else:
74 --orthogroup_faa '$input_format_cond.input_ptcgfcs.extra_files_path' 75 --orthogroup_faa '$input_format_cond.input_ptorthocs.extra_files_path'
75 #end if 76 #end if
76 --scaffold_dir '$scaffold_dir' 77 --scaffold_dir '$scaffold_dir'
77 --scaffold '$scaffold_selection' 78 --scaffold '$scaffold_selection'
78 --method $method 79 --method $method
79 80
119 #end if 120 #end if
120 #end if 121 #end if
121 #end if 122 #end if
122 #end if 123 #end if
123 124
124 #if str($input_format) == 'ptcgf': 125 && echo "Sequence alignments and corresponding phylogenies"
125 && echo "Sequence alignments and corresponding phylogenies: `ls $src_fasta_dir | grep f | wc -l` files" > $output_fasta_ptcgf 126 #if str($input_format) == 'ptortho':
126 && ls -al $src_fasta_dir | grep f >> $output_fasta_ptcgf 127 && echo -e "#Size\tName" > $output_fasta_ptortho
127 #else: 128 && ls -l $src_fasta_dir | grep f | awk -F ' ' '{print $5"\t"$9}' >> $output_fasta_ptortho
128 && echo "Sequence alignments and corresponding phylogenies: `ls $src_fasta_dir | grep f | wc -l` files" > $output_fasta_ptcgfcs 129 #else:
129 && ls -al $src_fasta_dir | grep f >> $output_fasta_ptcgfcs 130 && echo -e "#Size\tName" > $output_fasta_ptorthocs
130 #end if 131 && ls -l $src_fasta_dir | grep f | awk -F ' ' '{print $5"\t"$9}' >> $output_fasta_ptorthocs
131 132 #end if
132 && mv $src_fasta_dir/* $dest_fasta_dir || true 133 && mv $src_fasta_dir/* $dest_fasta_dir || true
133 134
134 #if $generate_output_aln: 135 #if $generate_output_aln:
135 && echo "Multiple sequence alignments using method '$multiple_sequence_alignments_option' (note that some files may be empty): `ls $src_aln_dir | grep f | wc -l` files" > $output_aln 136 && echo -e "#Size\tName" > $output_aln
136 && ls -al $src_aln_dir | grep f >> $output_aln 137 && ls -l $src_aln_dir | grep f | awk -F ' ' '{print $5"\t"$9}' >> $output_aln
137 && mv $src_aln_dir/* $dest_aln_dir || true 138 && mv $src_aln_dir/* $dest_aln_dir || true
138 #end if 139 #end if
139 140
140 #if $generate_output_tree: 141 #if $generate_output_tree:
141 && echo "Phylogenetic trees (note that some files may be empty): `ls $src_tree_dir | grep f | wc -l` files" > $output_tree 142 && echo -e "#Size\tName" > $output_tree
142 && ls -al $src_tree_dir | grep f >> $output_tree 143 && ls -l $src_tree_dir | grep f | awk -F ' ' '{print $5"\t"$9}' >> $output_tree
143 && mv $src_tree_dir/* $dest_tree_dir || true 144 && mv $src_tree_dir/* $dest_tree_dir || true
144 #end if 145 #end if
145 ]]> 146 ]]>
146 </command> 147 </command>
147 <inputs> 148 <inputs>
148 <conditional name="input_format_cond"> 149 <conditional name="input_format_cond">
149 <param name="input_format" type="select" label="Select type of data to sub sample"> 150 <param name="input_format" type="select" label="Select type of data to sub sample">
150 <option value="ptcgf">Gene family clusters</option> 151 <option value="ptortho">Gene family clusters</option>
151 <option value="ptcgfcs">Gene family clusters and corresponding coding sequences</option> 152 <option value="ptorthocs">Gene family clusters and corresponding coding sequences</option>
152 </param> 153 </param>
153 <when value="ptcgf"> 154 <when value="ptortho">
154 <param name="input_ptcgf" format="ptcgf" type="data" label="Gene family clusters"/> 155 <param name="input_ptortho" format="ptortho" type="data" label="Precomputed orthologous gene family clusters" />
155 </when> 156 </when>
156 <when value="ptcgfcs"> 157 <when value="ptorthocs">
157 <param name="input_ptcgfcs" format="ptcgfcs" type="data" label="Gene family clusters with corresponding coding sequences"/> 158 <param name="input_ptorthocs" format="ptorthocs" type="data" label="Precomputed orthologous gene family clusters with corresponding coding sequences" />
158 <conditional name="multiple_codon_alignments_cond"> 159 <conditional name="multiple_codon_alignments_cond">
159 <param name="multiple_codon_alignments" type="select" label="Construct orthogroup multiple codon alignments?"> 160 <param name="multiple_codon_alignments" type="select" label="Construct orthogroup multiple codon alignments?">
160 <option value="no" selected="True">No</option> 161 <option value="no" selected="True">No</option>
161 <option value="yes">Yes</option> 162 <option value="yes">Yes</option>
162 </param> 163 </param>
163 <when value="no"/> 164 <when value="no" />
164 <when value="yes"> 165 <when value="yes">
165 <param name="sequence_type" type="select" label="Sequence type used in the phylogenetic inference - (dna)"> 166 <param name="sequence_type" type="select" label="Sequence type used in the phylogenetic inference (dna)">
166 <option value="protein" selected="true">Amino acid based</option> 167 <option value="protein" selected="true">Amino acid based</option>
167 <option value="dna">Nucleotide based</option> 168 <option value="dna">Nucleotide based</option>
168 </param> 169 </param>
169 <conditional name="use_corresponding_coding_sequences_cond"> 170 <conditional name="use_corresponding_coding_sequences_cond">
170 <param name="use_corresponding_coding_sequences" type="select" label="Use corresponding coding sequences?"> 171 <param name="use_corresponding_coding_sequences" type="select" label="Use corresponding coding sequences?">
178 </conditional> 179 </conditional>
179 </when> 180 </when>
180 </conditional> 181 </conditional>
181 <param name="scaffold" type="select" label="Orthogroups or gene families proteins scaffold"> 182 <param name="scaffold" type="select" label="Orthogroups or gene families proteins scaffold">
182 <options from_data_table="plant_tribes_scaffolds" /> 183 <options from_data_table="plant_tribes_scaffolds" />
183 <validator type="no_options" message="No PlantTribes scaffolds are available. Use the PlantTribes Scaffolds Download Data Manager tool in Galaxy to install and populate the PlantTribes scaffolds data table."/> 184 <validator type="no_options" message="No PlantTribes scaffolds are available. Use the PlantTribes Scaffolds Download Data Manager tool in Galaxy to install and populate the PlantTribes scaffolds data table." />
184 </param> 185 </param>
185 <param name="method" type="select" label="Protein clustering method"> 186 <param name="method" type="select" label="Protein clustering method">
186 <option value="gfam" selected="true">GFam</option> 187 <option value="gfam" selected="true">GFam</option>
187 <option value="orthofinder">OrthoFinder</option> 188 <option value="orthofinder">OrthoFinder</option>
188 <option value="orthomcl">OrthoMCL</option> 189 <option value="orthomcl">OrthoMCL</option>
200 <option value="yes">Yes</option> 201 <option value="yes">Yes</option>
201 </param> 202 </param>
202 <when value="no" /> 203 <when value="no" />
203 <when value="yes"> 204 <when value="yes">
204 <conditional name="multiple_sequence_alignments_option_cond"> 205 <conditional name="multiple_sequence_alignments_option_cond">
205 <param name="multiple_sequence_alignments_option" label="Select method for multiple sequence alignments" type="select" force_select="True"> 206 <param name="multiple_sequence_alignments_option" label="Select method for multiple sequence alignments" type="select"
207 force_select="True">
206 <option value="create_alignments">Create orthogroup protein multiple sequence alignments including scaffold backbone proteins (MAFFT algorithm)</option> 208 <option value="create_alignments">Create orthogroup protein multiple sequence alignments including scaffold backbone proteins (MAFFT algorithm)</option>
207 <option value="add_alignments">Add unaligned orthogroup proteins to scaffold backbone multiple sequence alignments (MAFFT algorithm)</option> 209 <option value="add_alignments">Add unaligned orthogroup proteins to scaffold backbone multiple sequence alignments (MAFFT algorithm)</option>
208 <option value="pasta_alignments">Create orthogroup protein multiple sequence alignments including scaffold backbone proteins (PASTA algorithm)</option> 210 <option value="pasta_alignments">Create orthogroup protein multiple sequence alignments including scaffold backbone proteins (PASTA algorithm)</option>
209 </param> 211 </param>
210 <when value="create_alignments"/> 212 <when value="create_alignments" />
211 <when value="add_alignments"/> 213 <when value="add_alignments" />
212 <when value="pasta_alignments"> 214 <when value="pasta_alignments">
213 <param name="pasta_iter_limit" type="integer" value="3" min="0" label="Maximum number of iteration that the PASTA algorithm will run"/> 215 <param name="pasta_iter_limit" type="integer" value="3" min="0" label="Maximum number of iteration that the PASTA algorithm will run" />
214 </when> 216 </when>
215 </conditional> 217 </conditional>
216 </when> 218 </when>
217 </conditional> 219 </conditional>
218 <conditional name="phylogenetic_trees_cond"> 220 <conditional name="phylogenetic_trees_cond">
231 <conditional name="rooting_order_file_cond"> 233 <conditional name="rooting_order_file_cond">
232 <param name="rooting_order_file" type="select" label="Select history item containing strings matching sequence identifiers of species for determining the most basal taxa in the orthogroups for rooting trees?"> 234 <param name="rooting_order_file" type="select" label="Select history item containing strings matching sequence identifiers of species for determining the most basal taxa in the orthogroups for rooting trees?">
233 <option value="no" selected="true">No</option> 235 <option value="no" selected="true">No</option>
234 <option value="yes">Yes</option> 236 <option value="yes">Yes</option>
235 </param> 237 </param>
236 <when value="no"/> 238 <when value="no" />
237 <when value="yes"> 239 <when value="yes">
238 <param name="rooting_order" format="txt" type="data" label="History item containing strings matching sequence identifiers of species for determining the most basal taxa in the orthogroups for rooting trees"/> 240 <param name="rooting_order" format="txt" type="data" label="History item containing strings matching sequence identifiers of species for determining the most basal taxa in the orthogroups for rooting trees" />
239 </when> 241 </when>
240 </conditional> 242 </conditional>
241 <param name="bootstrap_replicates" type="integer" value="100" min="0" label="Number of replicates for rapid bootstrap analysis and search for the best-scoring ML tree"/> 243 <param name="bootstrap_replicates" type="integer" value="100" min="0" label="Number of replicates for rapid bootstrap analysis and search for the best-scoring ML tree" />
242 </when> 244 </when>
243 <when value="fasttree"/> 245 <when value="fasttree" />
244 </conditional> 246 </conditional>
245 <param name="max_orthogroup_size" type="integer" value="100" min="0" label="Maximum number of sequences in orthogroup alignments"/> 247 <param name="max_orthogroup_size" type="integer" value="100" min="0" label="Maximum number of sequences in orthogroup alignments" />
246 <param name="min_orthogroup_size" type="integer" value="4" min="0" label="Minimum number of sequences in orthogroup alignments"/> 248 <param name="min_orthogroup_size" type="integer" value="4" min="0" label="Minimum number of sequences in orthogroup alignments" />
247 </when> 249 </when>
248 </conditional> 250 </conditional>
249 <conditional name="msa_quality_control_options_cond"> 251 <conditional name="msa_quality_control_options_cond">
250 <param name="msa_quality_control_options" type="select" label="Set MSA quality control options?"> 252 <param name="msa_quality_control_options" type="select" label="Set MSA quality control options?">
251 <option value="no" selected="true">No</option> 253 <option value="no" selected="true">No</option>
256 <conditional name="remove_gappy_sequences_cond"> 258 <conditional name="remove_gappy_sequences_cond">
257 <param name="remove_gappy_sequences" type="select" label="Remove gappy sequences in alignments?"> 259 <param name="remove_gappy_sequences" type="select" label="Remove gappy sequences in alignments?">
258 <option value="no" selected="true">No</option> 260 <option value="no" selected="true">No</option>
259 <option value="yes">Yes</option> 261 <option value="yes">Yes</option>
260 </param> 262 </param>
261 <when value="no"/> 263 <when value="no" />
262 <when value="yes"> 264 <when value="yes">
263 <param name="remove_sequences" type="float" value="0.5" min="0" max="1" label="Remove sequences with gaps of" help="0.5 removes sequences with 50% gaps"/> 265 <param name="remove_sequences" type="float" value="0.5" min="0" max="1" label="Remove sequences with gaps of" help="0.5 removes sequences with 50% gaps" />
264 <conditional name="trim_type_cond"> 266 <conditional name="trim_type_cond">
265 <param name="trim_type" type="select" label="Select process used for gap trimming"> 267 <param name="trim_type" type="select" label="Select process used for gap trimming">
266 <option value="gap_trimming" selected="true">Nucleotide based</option> 268 <option value="gap_trimming" selected="true">Nucleotide based </option>
267 <option value="automated_trimming">Trim alignments using trimAl's ML heuristic trimming approach</option> 269 <option value="automated_trimming">Trim alignments using trimAl's ML heuristic trimming approach</option>
268 </param> 270 </param>
269 <when value="automated_trimming"/> 271 <when value="automated_trimming" />
270 <when value="gap_trimming"> 272 <when value="gap_trimming">
271 <param name="gap_trimming" type="float" value="0.1" min="0" max="1.0" label="Remove sites in alignments with gaps of" help="0.1 removes sites with 90% gaps"/> 273 <param name="gap_trimming" type="float" value="0.1" min="0" max="1.0" label="Remove sites in alignments with gaps of" help="0.1 removes sites with 90% gaps" />
272 </when> 274 </when>
273 </conditional> 275 </conditional>
274 </when> 276 </when>
275 </conditional> 277 </conditional>
276 </when> 278 </when>
277 </conditional> 279 </conditional>
278 </when> 280 </when>
279 </conditional> 281 </conditional>
280 </inputs> 282 </inputs>
281 <outputs> 283 <outputs>
282 <data name="output_fasta_ptcgf" format="ptcgf"> 284 <data name="output_fasta_ptortho" format="ptortho">
283 <filter>input_format_cond['input_format'] == 'ptcgf'</filter> 285 <filter>input_format_cond['input_format'] == 'ptortho'</filter>
284 </data> 286 </data>
285 <data name="output_fasta_ptcgfcs" format="ptcgfcs"> 287 <data name="output_fasta_ptorthocs" format="ptorthocs">
286 <filter>input_format_cond['input_format'] == 'ptcgfcs'</filter> 288 <filter>input_format_cond['input_format'] == 'ptorthocs'</filter>
287 </data> 289 </data>
288 <data name="output_aln" format="txt" label="Multiple alignments on ${on_string}"> 290 <data name="output_aln" format="txt" label="Multiple alignments using method ${options_type['multiple_sequence_alignments_cond']['multiple_sequence_alignments_option_cond']['multiple_sequence_alignments_option']} on ${on_string}">
289 <filter>options_type['options_type_selector'] == 'advanced' and options_type['multiple_sequence_alignments_cond']['multiple_sequence_alignments'] == 'yes'</filter> 291 <filter>options_type['options_type_selector'] == 'advanced' and options_type['multiple_sequence_alignments_cond']['multiple_sequence_alignments'] == 'yes'</filter>
290 </data> 292 </data>
291 <data name="output_tree" format="ptpt" label="Phylogenetic trees on ${on_string}"> 293 <data name="output_tree" format="ptpt" label="Phylogenetic trees on ${on_string}">
292 <filter>options_type['options_type_selector'] == 'advanced' and options_type['phylogenetic_trees_cond']['phylogenetic_trees'] == 'yes'</filter> 294 <filter>options_type['options_type_selector'] == 'advanced' and options_type['phylogenetic_trees_cond']['phylogenetic_trees'] == 'yes'</filter>
293 </data> 295 </data>
295 <tests> 297 <tests>
296 <test> 298 <test>
297 </test> 299 </test>
298 </tests> 300 </tests>
299 <help> 301 <help>
300 This tool is one of the PlantTribes' collection of automated modular analysis pipelines that utilize objective classifications of 302 This tool is one of the PlantTribes' collection of automated modular analysis pipelines that utilize objective classifications of
301 complete protein sequences from sequenced plant genomes to perform comparative evolutionary studies. It performs phylogenomic 303 complete protein sequences from sequenced plant genomes to perform comparative evolutionary studies. It performs phylogenomic
302 analyses by creating multiple sequence alignments and inferred maximum likelihood phylogenies for orthogroups produced by the 304 analyses by creating multiple sequence alignments and inferred maximum likelihood phylogenies for orthogroups produced by the
303 **Classify gene sequences into precomputed orthologous gene family clusters** tool. 305 **Classify gene sequences into precomputed orthologous gene family clusters** tool.
304 306
305 ----- 307 -----
306 308
307 **Options** 309 **Options**
308 310
309 * **Required options** 311 * **Required options**
310 312
311 - **Select gene family clusters** - Sequences classified into gene family clusters, optionally including corresponding coding sequences. 313 - **Select gene family clusters** - Sequences classified into gene family clusters, optionally including corresponding coding sequences.
312 - **Orthogroups or gene families proteins scaffold** - PlantTribes scaffolds data. 314 - **Orthogroups or gene families proteins scaffold** - PlantTribes scaffolds data.
313 - **Protein clustering method** - One of GFam (domain architecture based clustering), OrthoFinder (broadly defined clusters) or OrthoMCL (narrowly defined clusters). 315 - **Protein clustering method** - One of GFam (domain architecture based clustering), OrthoFinder (broadly defined clusters) or OrthoMCL (narrowly defined clusters).
314 316 * **Multiple sequence alignments options**
315 * **Multiple sequence alignments options** 317
316 318 - **Select method for multiple sequence alignments** - Method used for setting multiple sequence alignments.
317 - **Select method for multiple sequence alignments** - Method used for setting multiple sequence alignments. 319 - **Input sequences include corresponding coding sequences?** - Selecting 'Yes' for this option requires that the selected input data format is 'ptorthocs'.
318 - **Input sequences include corresponding coding sequences?** - Selecting 'Yes' for this option requires that the selected input data format is 'ptcgfcs'. 320 - **Construct orthogroup multiple codon alignments?** - Construct orthogroup multiple codon alignments.
319 - **Construct orthogroup multiple codon alignments?** - Construct orthogroup multiple codon alignments. 321 - **Sequence type used in the phylogenetic inference** - Sequence type (dna or amino acid) used in the phylogenetic inference.
320 - **Sequence type used in the phylogenetic inference** - Sequence type (dna or amino acid) used in the phylogenetic inference. 322 - **Use corresponding coding sequences?** - Selecting 'Yes' for this option requires that the selected input data format is 'ptorthocs' or this tool will produce an error.
321 - **Use corresponding coding sequences?** - Selecting 'Yes' for this option requires that the selected input data format is 'ptcgfcs' or this tool will produce an error. 323
322 324 * **Phylogenetic trees options**
323 * **Phylogenetic trees options** 325
324 326 - **Phylogenetic trees inference method** - Phylogenetic trees inference method.
325 - **Phylogenetic trees inference method** - Phylogenetic trees inference method. 327 - **Select history item containing strings matching sequence identifiers of species for determining the most basal taxa in the orthogroups for rooting trees?** - If 'No' is selected, trees will be rooted using the most distant taxon present in the orthogroup.
326 - **Select history item containing strings matching sequence identifiers of species for determining the most basal taxa in the orthogroups for rooting trees?** - If 'No' is selected, trees will be rooted using the most distant taxon present in the orthogroup. 328 - **History item containing strings matching sequence identifiers of species for determining the most basal taxa in the orthogroups for rooting trees** - History item containing a set of string fragments matching sequences identifiers of species in the classification (including scaffold taxa) to be used for determining the most basal taxa in the orthogroups for rooting trees. The set of string fragments must be listed in decreasing order from older to younger lineages.
327 - **History item containing strings matching sequence identifiers of species for determining the most basal taxa in the orthogroups for rooting trees** - History item containing a set of string fragments matching sequences identifiers of species in the classification (including scaffold taxa) to be used for determining the most basal taxa in the orthogroups for rooting trees. The set of string fragments must be listed in decreasing order from older to younger lineages. 329 - **Number of replicates for rapid bootstrap analysis and search for the best-scoring ML tree** - Number of replicates for rapid bootstrap analysis and search for the best-scoring ML tree.
328 - **Number of replicates for rapid bootstrap analysis and search for the best-scoring ML tree** - Number of replicates for rapid bootstrap analysis and search for the best-scoring ML tree. 330 - **Maximum number of sequences in orthogroup alignments** - Maximum number of sequences in orthogroup alignments.
329 - **Maximum number of sequences in orthogroup alignments** - Maximum number of sequences in orthogroup alignments. 331 - **Minimum number of sequences in orthogroup alignments** - Minimum number of sequences in orthogroup alignments.
330 - **Minimum number of sequences in orthogroup alignments** - Minimum number of sequences in orthogroup alignments. 332
331 333 * **MSA quality control options**
332 * **MSA quality control options** 334
333 335 - **Remove sequences with gaps of** - Removes gappy sequences in alignments (i.e., 0.5 removes sequences with 50% gaps).
334 - **Remove sequences with gaps of** - Removes gappy sequences in alignments (i.e., 0.5 removes sequences with 50% gaps). 336 - **Select process used for gap trimming** - Either nucleotide based trimming or alignments are trimed using using trimAl's ML heuristic trimming approach.
335 - **Select process used for gap trimming** - Either nucleotide based trimming or alignments are trimed using using trimAl's ML heuristic trimming approach. 337 - **Remove sites in alignments with gaps of** - If the process used for gap trimming is nucleotide based, this is the gap value used when removing gappy sites in alignments (i.e., 0.1 removes sites with 90% gaps).
336 - **Remove sites in alignments with gaps of** - If the process used for gap trimming is nucleotide based, this is the gap value used when removing gappy sites in alignments (i.e., 0.1 removes sites with 90% gaps).
337 338
338 </help> 339 </help>
339 <citations> 340 <citations>
340 <citation type="bibtex"> 341 <citation type="bibtex">
341 @unpublished{None, 342 @unpublished{None,
342 author = {Eric Wafula}, 343 author = {Eric Wafula},
343 title = {None}, 344 title = {None},
344 year = {None}, 345 year = {None},
345 url = {https://github.com/dePamphilis/PlantTribes} 346 url = {https://github.com/dePamphilis/PlantTribes}
346 }</citation> 347 }
347 <citation type="doi">10.1093/bioinformatics/btw412</citation> 348 </citation>
348 <citation type="bibtex"> 349 <citation type="doi">10.1093/bioinformatics/btw412</citation>
349 @published{Research in Computational Molecular Biology (RECOMB) (pp. 177–191), 350 <citation type="bibtex">
350 author = {Mirarab, S., Nguyen, N., Warnow, T.}, 351 @published{Research in Computational Molecular Biology (RECOMB) (pp. 177–191),
351 title = {PASTA: Ultra-Large Multiple Sequence Alignment. In R. Sharan (Ed.)}, 352 author = {Mirarab, S., Nguyen, N., Warnow, T.},
352 year = {2014}, 353 title = {PASTA: Ultra-Large Multiple Sequence Alignment. In R. Sharan
353 url = {https://github.com/smirarab/pasta} 354 (Ed.)},
354 }</citation> 355 year = {2014},
355 <citation type="bibtex"> 356 url = {https://github.com/smirarab/pasta}
356 @published{Bioinformatics, 357 }
357 author = {Salvador Capella-Gutierrez, Jose M. Silla-Martinez, Toni Gabaldon}, 358 </citation>
358 title = {trimAl: a tool for automated alignment trimming in large-scale phylogenetic analyses}, 359 <citation type="bibtex">
359 year = {2009}, 360 @published{Bioinformatics,
360 url = {http://trimal.cgenomics.org} 361 author = {Salvador Capella-Gutierrez, Jose M. Silla-Martinez, Toni
361 }</citation> 362 Gabaldon},
362 <citation type="bibtex"> 363 title = {trimAl: a tool for automated alignment trimming in large-scale
363 @published{Bioinformatics, 364 phylogenetic analyses},
364 author = {A. Stamatakis}, 365 year = {2009},
365 title = {RAxML Version 8: A tool for Phylogenetic Analysis and Post-Analysis of Large Phylogenies}, 366 url = {http://trimal.cgenomics.org}
366 year = {2014}, 367 }
367 url = {http://sco.h-its.org/exelixis/web/software/raxml/index.html} 368 </citation>
368 }</citation> 369 <citation type="bibtex">
369 <citation type="doi">10.1371/journal.pone.0009490</citation> 370 @published{Bioinformatics,
371 author = {A. Stamatakis},
372 title = {RAxML Version 8: A tool for Phylogenetic Analysis and
373 Post-Analysis of Large Phylogenies},
374 year = {2014},
375 url = {http://sco.h-its.org/exelixis/web/software/raxml/index.html}
376 }
377 </citation>
378 <citation type="doi">10.1371/journal.pone.0009490</citation>
370 </citations> 379 </citations>
371 </tool> 380 </tool>