|
0
|
1 <tool id="mafft1" name="MAFFT">
|
|
|
2 <description>, a progressive multiple alignment builder</description>
|
|
|
3 <command interpreter="bash">./mafft --quiet
|
|
|
4 #if $datatype_condition.type == "nt":
|
|
|
5 --nuc
|
|
|
6 #end if
|
|
|
7 #if $datatype_condition.type == "aa":
|
|
|
8 --amino
|
|
|
9 #end if
|
|
|
10 #if $datatype_condition.type != "nt":
|
|
|
11 #if $datatype_condition.PAM_value_condition.matrix == "bl30":
|
|
|
12 --bl 30
|
|
|
13 #end if
|
|
|
14 #if $datatype_condition.PAM_value_condition.matrix == "bl45":
|
|
|
15 --bl 45
|
|
|
16 #end if
|
|
|
17 #if $datatype_condition.PAM_value_condition.matrix == "bl62":
|
|
|
18 --bl 62
|
|
|
19 #end if
|
|
|
20 #if $datatype_condition.PAM_value_condition.matrix == "bl80":
|
|
|
21 --bl 80
|
|
|
22 #end if
|
|
|
23 #if $datatype_condition.PAM_value_condition.matrix == "PAM":
|
|
|
24 --jtt $datatype_condition.PAM_value_condition.PAM_value
|
|
|
25 #end if
|
|
|
26 #end if
|
|
|
27 --maxiterate $iterations --$distance_method --op $op --ep $ep $input > $output</command>
|
|
|
28 <inputs>
|
|
|
29 <param format="txt" name="input" type="data" label="Source file"/>
|
|
|
30 <conditional name="datatype_condition">
|
|
|
31 <param type="select" name="type" label="Data type">
|
|
|
32 <option value="auto">Automatic detection</option>
|
|
|
33 <option value="nt">Nucleic acids</option>
|
|
|
34 <option value="aa">Amino acids</option>
|
|
|
35 </param>
|
|
|
36 <when value="aa">
|
|
|
37 <conditional name="PAM_value_condition">
|
|
|
38 <param type="select" name="matrix" label="Matrix" help="Usefull only for amino acids">
|
|
|
39 <option value="bl62">BLOSUM 62</option>
|
|
|
40 <option value="bl30">BLOSUM 30</option>
|
|
|
41 <option value="bl45">BLOSUM 45</option>
|
|
|
42 <option value="bl80">BLOSUM 80</option>
|
|
|
43 <option value="PAM">PAM</option>
|
|
|
44 </param>
|
|
|
45 <when value="bl30"></when>
|
|
|
46 <when value="bl45"></when>
|
|
|
47 <when value="bl62"></when>
|
|
|
48 <when value="bl80"></when>
|
|
|
49 <when value="PAM">
|
|
|
50 <param type="text" name="PAM_value" help="Must be greater than 0" value="80" label="Coefficient of the PAM matrix" />
|
|
|
51 </when>
|
|
|
52 </conditional>
|
|
|
53 </when>
|
|
|
54 <when value="auto">
|
|
|
55 <conditional name="PAM_value_condition">
|
|
|
56 <param type="select" name="matrix" label="Matrix" help="Usefull only for amino acids">
|
|
|
57 <option value="bl62">BLOSUM 62</option>
|
|
|
58 <option value="bl30">BLOSUM 30</option>
|
|
|
59 <option value="bl45">BLOSUM 45</option>
|
|
|
60 <option value="bl80">BLOSUM 80</option>
|
|
|
61 <option value="PAM">PAM</option>
|
|
|
62 </param>
|
|
|
63 <when value="bl30"></when>
|
|
|
64 <when value="bl45"></when>
|
|
|
65 <when value="bl62"></when>
|
|
|
66 <when value="bl80"></when>
|
|
|
67 <when value="PAM">
|
|
|
68 <param type="text" name="PAM_value" help="Must be greater than 0" value="80" label="Coefficient of the PAM matrix" />
|
|
|
69 </when>
|
|
|
70 </conditional>
|
|
|
71 </when>
|
|
|
72 <when value="nt">
|
|
|
73 </when>
|
|
|
74 </conditional>
|
|
|
75 <param type="text" name="iterations" help="1000 for maximum quality" value="1000" label="Maximum number of iterations" />
|
|
|
76 <param type="text" name="op" help="1.53 default value" value="1.53" label="Gap opening penalty" />
|
|
|
77 <param type="text" name="ep" help="0.0 default value" value="0.0" label="Gap extension penalty" />
|
|
|
78 <param type="select" name="distance_method" label="Distance method" help="Distance method must be chosen regarding your data">
|
|
|
79 <option value="6merpair">Shared 6mers distance (fastest)</option>
|
|
|
80 <option value="globalpair">Global alignment (NW)</option>
|
|
|
81 <option value="localpair">Local alignment (SW)</option>
|
|
|
82 <option value="genafpair">Local, affine gap cost</option>
|
|
|
83 <option value="fastapair">FASTA distance</option>
|
|
|
84 </param>
|
|
|
85 </inputs>
|
|
|
86 <outputs>
|
|
|
87 <data format="fasta" name="output" />
|
|
|
88 </outputs>
|
|
|
89 <help>
|
|
|
90
|
|
|
91 .. class:: infomark
|
|
|
92
|
|
|
93 **Program encapsulated in Galaxy by Southgreen**
|
|
|
94
|
|
|
95
|
|
|
96 .. class:: infomark
|
|
|
97
|
|
|
98 **MAFFT version 6.717b, 2009**
|
|
|
99
|
|
|
100 -----
|
|
|
101
|
|
|
102 ==============
|
|
|
103 Please cite:
|
|
|
104 ==============
|
|
|
105
|
|
|
106 "Parallelization of the MAFFT multiple sequence alignment program.", **Katoh, Toh**, Bioinformatics 26:1899-1900, 2010. (describes the multithread version; Linux only)
|
|
|
107
|
|
|
108 "Multiple Alignment of DNA Sequences with MAFFT.", **Katoh, Asimenos, Toh**, Methods in Molecular Biology 537:39-64, 2009. (outlines DNA alignment methods and several tips including group-to-group alignment and rough clustering of a large number of sequences)
|
|
|
109
|
|
|
110 "Improved accuracy of multiple ncRNA alignment by incorporating structural information into a MAFFT-based framework.", **Katoh, Toh**, BMC Bioinformatics 9:212, 2008. (describes RNA structural alignment methods)
|
|
|
111
|
|
|
112 "Recent developments in the MAFFT multiple sequence alignment program.", **Katoh, Toh**, Briefings in Bioinformatics 9:286-298, 2008. (outlines version 6; Fast Breaking Paper in Thomson Reuters' ScienceWatch)
|
|
|
113
|
|
|
114 "PartTree: an algorithm to build an approximate tree from a large number of unaligned sequences." **Katoh, Toh**, Bioinformatics 23:372-374, Errata, 2007. (describes the PartTree algorithm)
|
|
|
115
|
|
|
116 "MAFFT version 5: improvement in accuracy of multiple sequence alignment.", **Katoh, Kuma, Toh, Miyata**, Nucleic Acids Res. 33:511-518, 2005. (describes [ancestral versions of] the G-INS-i, L-INS-i and E-INS-i strategies)
|
|
|
117
|
|
|
118 "MAFFT: a novel method for rapid multiple sequence alignment based on fast Fourier transform.", **Katoh, Misawa, Kuma, Miyata**, Nucleic Acids Res. 30:3059-3066, 2002.
|
|
|
119
|
|
|
120
|
|
|
121 -----
|
|
|
122
|
|
|
123 ==========
|
|
|
124 Overview
|
|
|
125 ==========
|
|
|
126
|
|
|
127 MAFFT is a multiple sequence alignment program for unix-like operating systems. It offers a range of multiple alignment methods, L-INS-i wich is accurate for alignment with less than 200 sequences, FFT-NS-2 which is fast for alignment with less than 10000 sequences.
|
|
|
128
|
|
|
129 -----
|
|
|
130
|
|
|
131 For further informations, please visite the MAFFT_ website.
|
|
|
132
|
|
|
133 .. _MAFFT: http://mafft.cbrc.jp/alignment/software/
|
|
|
134
|
|
|
135 </help>
|
|
|
136
|
|
|
137 </tool> |