Mercurial > repos > devteam > fasta_to_tabular
annotate fasta_to_tabular.xml @ 3:5b998d13de71 draft default tip
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit 34a6c9f94a5722bb7d2f887618aafa410a770e91"
author | devteam |
---|---|
date | Mon, 02 Mar 2020 11:46:30 +0000 |
parents | ff4751ce764d |
children |
rev | line source |
---|---|
2
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
1 <tool id="fasta2tab" name="FASTA-to-Tabular" version="1.1.1" profile="16.04"> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
2 <description>converter</description> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
3 <requirements> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
4 <requirement type="package" version="3.7">python</requirement> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
5 </requirements> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
6 <command> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
7 python '$__tool_directory__/fasta_to_tabular.py' '$input' '$output' $keep_first $descr_columns |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
8 </command> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
9 <inputs> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
10 <param name="input" type="data" format="fasta" label="Convert these sequences"/> |
3
5b998d13de71
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit 34a6c9f94a5722bb7d2f887618aafa410a770e91"
devteam
parents:
2
diff
changeset
|
11 <param name="descr_columns" type="integer" value="1" min="1" label="How many columns to divide title string into?" help="Typically 2 to take the ID (first word) and description (rest) as two columns, or 1 to give a single column"/> |
5b998d13de71
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit 34a6c9f94a5722bb7d2f887618aafa410a770e91"
devteam
parents:
2
diff
changeset
|
12 <param name="keep_first" type="integer" value="0" min="0" label="How many title characters to keep?" help="Applies only to the first column taken from the title string ('0' = keep the whole thing), useful when your sequence identifiers are all the same length."/> |
2
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
13 </inputs> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
14 <outputs> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
15 <data name="output" format="tabular"/> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
16 </outputs> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
17 <tests> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
18 <test> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
19 <param name="input" value="454.fasta" /> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
20 <param name="descr_columns" value="1"/> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
21 <param name="keep_first" value="0"/> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
22 <output name="output" file="fasta_to_tabular_out1.tabular" /> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
23 </test> |
0 | 24 |
2
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
25 <test> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
26 <param name="input" value="4.fasta" /> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
27 <param name="descr_columns" value="1"/> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
28 <param name="keep_first" value="0"/> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
29 <output name="output" file="fasta_to_tabular_out2.tabular" /> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
30 </test> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
31 |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
32 <test> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
33 <param name="input" value="454.fasta" /> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
34 <param name="descr_columns" value="1"/> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
35 <param name="keep_first" value="14"/> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
36 <output name="output" file="fasta_to_tabular_out3.tabular" /> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
37 </test> |
0 | 38 |
2
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
39 <test> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
40 <param name="input" value="454.fasta" /> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
41 <param name="descr_columns" value="2"/> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
42 <param name="keep_first" value="0"/> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
43 <output name="output" file="fasta_to_tabular_out4.tabular" /> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
44 </test> |
0 | 45 |
2
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
46 <test> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
47 <param name="input" value="454.fasta" /> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
48 <param name="descr_columns" value="5"/> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
49 <param name="keep_first" value="0"/> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
50 <output name="output" file="fasta_to_tabular_out5.tabular" /> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
51 </test> |
0 | 52 |
2
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
53 <test> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
54 <param name="input" value="454.fasta" /> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
55 <param name="descr_columns" value="5"/> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
56 <param name="keep_first" value="10"/> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
57 <output name="output" file="fasta_to_tabular_out6.tabular" /> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
58 </test> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
59 |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
60 </tests> |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
61 <help><![CDATA[ |
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
62 |
0 | 63 **What it does** |
64 | |
65 This tool converts FASTA formatted sequences to TAB-delimited format. | |
66 | |
67 Many tools consider the first word of the FASTA ">" title line to be an identifier, and any remaining text to be a free form description. | |
68 It is therefore useful to split this text into two columns in Galaxy (identifier and any description) by setting **How many columns to divide title string into?** to **2**. | |
69 In some cases the description can be usefully broken up into more columns -- see the examples below. | |
70 | |
71 The option **How many title characters to keep?** lets you keep only a specified number of characters from the beginning of each FASTA title line. | |
72 With the introduction of the **How many columns to divide title string into?** option this setting is of limited use, but does still allow you to truncate the identifier. | |
73 | |
2
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
74 ----- |
0 | 75 |
76 **Example** | |
77 | |
78 Suppose you have the following FASTA formatted sequences from a Roche (454) FLX sequencing run:: | |
79 | |
2
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
80 >EYKX4VC02EQLO5 length=108 xy=1826_0455 region=2 run=R_2007_11_07_16_15_57_ |
0 | 81 TCCGCGCCGAGCATGCCCATCTTGGATTCCGGCGCGATGACCATCGCCCGCTCCACCACG |
82 TTCGGCCGGCCCTTCTCGTCGAGGAATGACACCAGCGCTTCGCCCACG | |
2
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
83 >EYKX4VC02D4GS2 length=60 xy=1573_3972 region=2 run=R_2007_11_07_16_15_57_ |
0 | 84 AATAAAACTAAATCAGCAAAGACTGGCAAATACTCACAGGCTTATACAATACAAATGTAA |
85 | |
86 Running this tool with the default settings will produce this (2 column output): | |
87 | |
88 ========================================================================== ======================================= | |
89 EYKX4VC02EQLO5 length=108 xy=1826_0455 region=2 run=R_2007_11_07_16_15_57_ TCCGCGCCGAGCATGCCCATCTTGGATTCCGGC...ACG | |
90 EYKX4VC02D4GS2 length=60 xy=1573_3972 region=2 run=R_2007_11_07_16_15_57_ AATAAAACTAAATCAGCAAAGACTGGCAAATAC...TAA | |
91 ========================================================================== ======================================= | |
92 | |
93 Having the full title line (the FASTA ">" line text) as a column is not always ideal. | |
94 | |
95 The **How many title characters to keep?** option is useful if your identifiers are all the same length. | |
96 In this example the identifier is 14 characters, so setting **How many title characters to keep?** to **14** (and leaving **How many columns to divide title string into?** as the default, **1**) will produce this (2 column output): | |
97 | |
98 ============== ======================================= | |
99 EYKX4VC02EQLO5 TCCGCGCCGAGCATGCCCATCTTGGATTCCGGC...ACG | |
100 EYKX4VC02D4GS2 AATAAAACTAAATCAGCAAAGACTGGCAAATAC...TAA | |
101 ============== ======================================= | |
102 | |
103 If however your FASTA file has identifiers of variable length, it is better to split the text into at least two columns. | |
104 Running this tool with **How many columns to divide title string into?** set to **2** will produce this (3 column output): | |
105 | |
106 ============== =========================================================== ======================================= | |
107 EYKX4VC02EQLO5 length=108 xy=1826_0455 region=2 run=R_2007_11_07_16_15_57_ TCCGCGCCGAGCATGCCCATCTTGGATTCCGGC...ACG | |
108 EYKX4VC02D4GS2 length=60 xy=1573_3972 region=2 run=R_2007_11_07_16_15_57_ AATAAAACTAAATCAGCAAAGACTGGCAAATAC...TAA | |
109 ============== =========================================================== ======================================= | |
110 | |
111 Running this tool with **How many columns to divide title string into?** set to **5** will produce this (6 column output): | |
112 | |
113 ============== ========== ============ ======== ========================== ======================================= | |
114 EYKX4VC02EQLO5 length=108 xy=1826_0455 region=2 run=R_2007_11_07_16_15_57_ TCCGCGCCGAGCATGCCCATCTTGGATTCCGGC...ACG | |
115 EYKX4VC02D4GS2 length=60 xy=1573_3972 region=2 run=R_2007_11_07_16_15_57_ AATAAAACTAAATCAGCAAAGACTGGCAAATAC...TAA | |
116 ============== ========== ============ ======== ========================== ======================================= | |
117 | |
118 Running this tool with **How many columns to divide title string into?** set to **5** and **How many title characters to keep?** set to **10** will produce this (6 column output). | |
119 Notice that only the first column is truncated to 10 characters -- and be careful not to trim your sequence names too much (generally they should be unique): | |
120 | |
121 ========== ========== ============ ======== ========================== ======================================= | |
122 EYKX4VC02E length=108 xy=1826_0455 region=2 run=R_2007_11_07_16_15_57_ TCCGCGCCGAGCATGCCCATCTTGGATTCCGGC...ACG | |
123 EYKX4VC02D length=60 xy=1573_3972 region=2 run=R_2007_11_07_16_15_57_ AATAAAACTAAATCAGCAAAGACTGGCAAATAC...TAA | |
124 ========== ========== ============ ======== ========================== ======================================= | |
125 | |
126 Note the sequences have been truncated for display purposes in the above tables. | |
127 | |
2
ff4751ce764d
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fasta_to_tabular commit cd1ed08574b749eee2a3f6e6151dbb0c8ca15bbf"
devteam
parents:
1
diff
changeset
|
128 ]]></help> |
0 | 129 </tool> |