Mercurial > repos > devteam > fastq_to_tabular
comparison fastq_to_tabular.xml @ 3:a63d1aa8e829 draft
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tool_collections/galaxy_sequence_utils/fastq_to_tabular commit f2582539542b33240234e8ea6093e25d0aee9b6a
author | devteam |
---|---|
date | Sat, 30 Sep 2017 13:53:46 -0400 |
parents | 81c9b58760ff |
children | 672ad99bbfe4 |
comparison
equal
deleted
inserted
replaced
2:9616277d3d39 | 3:a63d1aa8e829 |
---|---|
1 <tool id="fastq_to_tabular" name="FASTQ to Tabular" version="1.1.0"> | 1 <tool id="fastq_to_tabular" name="FASTQ to Tabular" version="1.1.1"> |
2 <description>converter</description> | 2 <description>converter</description> |
3 <requirements> | 3 <requirements> |
4 <requirement type="package" version="1.0.0">galaxy_sequence_utils</requirement> | 4 <requirement type="package" version="1.1.1">galaxy_sequence_utils</requirement> |
5 </requirements> | 5 </requirements> |
6 <command interpreter="python">fastq_to_tabular.py '$input_file' '$output_file' $descr_columns '${input_file.extension[len( 'fastq' ):]}'</command> | 6 <command><![CDATA[ |
7 <inputs> | 7 gx-fastq-to-tabular '$input_file' '$output_file' $descr_columns '${input_file.extension[len('fastq'):]}' |
8 <param name="input_file" type="data" format="fastqsanger,fastqcssanger,fastqillumina,fastqsolexa" label="FASTQ file to convert" /> | 8 ]]></command> |
9 <param name="descr_columns" type="integer" value="1" label="How many columns to divide title string into?" help="Typically 2 to take the ID (first word) and decription (rest) as two columns, or 1 to give a single column"> | 9 <inputs> |
10 <validator type="in_range" min="1" /> | 10 <param name="input_file" type="data" format="fastqsanger,fastqcssanger,fastqillumina,fastqsolexa,fastqsanger.gz,fastqcssanger.gz,fastqillumina.gz,fastqsolexa.gz,fastqsanger.bz2,fastqcssanger.bz2,fastqillumina.bz2,fastqsolexa.bz2" label="FASTQ file to convert" /> |
11 </param> | 11 <param name="descr_columns" type="integer" min="1" value="1" label="How many columns to divide title string into?" help="Typically 2 to take the ID (first word) and decription (rest) as two columns, or 1 to give a single column" /> |
12 </inputs> | 12 </inputs> |
13 <outputs> | 13 <outputs> |
14 <data name="output_file" format="tabular" /> | 14 <data name="output_file" format="tabular" /> |
15 </outputs> | 15 </outputs> |
16 <tests> | 16 <tests> |
17 <!-- basic test --> | 17 <!-- basic test --> |
18 <test> | 18 <test> |
19 <param name="input_file" value="sanger_full_range_original_sanger.fastqsanger" ftype="fastqsanger" /> | 19 <param name="input_file" value="sanger_full_range_original_sanger.fastqsanger" ftype="fastqsanger" /> |
20 <param name="descr_columns" value="1"/> | 20 <param name="descr_columns" value="1"/> |
21 <output name="output_file" file="fastq_to_tabular_out_1.tabular" /> | 21 <output name="output_file" file="fastq_to_tabular_out_1.tabular" /> |
22 </test> | 22 </test> |
23 <!-- color space test --> | 23 <!-- compression test --> |
24 <test> | 24 <test> |
25 <param name="input_file" value="sanger_full_range_as_cssanger.fastqcssanger" ftype="fastqcssanger" /> | 25 <param name="input_file" value="sanger_full_range_original_sanger.fastqsanger.gz" ftype="fastqsanger.gz" /> |
26 <param name="descr_columns" value="1"/> | 26 <param name="descr_columns" value="1"/> |
27 <output name="output_file" file="fastq_to_tabular_out_2.tabular" /> | 27 <output name="output_file" file="fastq_to_tabular_out_1.tabular" /> |
28 </test> | 28 </test> |
29 <!-- split title into columns --> | 29 <!-- color space test --> |
30 <test> | 30 <test> |
31 <param name="input_file" value="sanger_full_range_original_sanger.fastqsanger" ftype="fastqsanger" /> | 31 <param name="input_file" value="sanger_full_range_as_cssanger.fastqcssanger" ftype="fastqcssanger" /> |
32 <param name="descr_columns" value="2"/> | 32 <param name="descr_columns" value="1"/> |
33 <output name="output_file" file="fastq_to_tabular_out_3.tabular" /> | 33 <output name="output_file" file="fastq_to_tabular_out_2.tabular" /> |
34 </test> | 34 </test> |
35 </tests> | 35 <!-- split title into columns --> |
36 <help> | 36 <test> |
37 | 37 <param name="input_file" value="sanger_full_range_original_sanger.fastqsanger" ftype="fastqsanger" /> |
38 <param name="descr_columns" value="2"/> | |
39 <output name="output_file" file="fastq_to_tabular_out_3.tabular" /> | |
40 </test> | |
41 </tests> | |
42 <help><![CDATA[ | |
38 **What it does** | 43 **What it does** |
39 | 44 |
40 This tool converts FASTQ sequencing reads to a Tabular file. | 45 This tool converts FASTQ sequencing reads to a Tabular file. |
41 | 46 |
42 It is conventional to take the first word of the FASTQ "@" title line as the identifier, and any remaining text to be a free form description. | 47 It is conventional to take the first word of the FASTQ "@" title line as the identifier, and any remaining text to be a free form description. |
43 It is therefore often useful to split this text into two columns in Galaxy (identifier and any description) by setting **How many columns to divide title string into?** to **2**. | 48 It is therefore often useful to split this text into two columns in Galaxy (identifier and any description) by setting **How many columns to divide title string into?** to **2**. |
44 In some cases the description can be usefully broken up into more columns -- see the examples . | 49 In some cases the description can be usefully broken up into more columns -- see the examples . |
45 | 50 |
46 Tab characters, if present in the source FASTQ title, will be converted to spaces. | 51 Tab characters, if present in the source FASTQ title, will be converted to spaces. |
47 | 52 |
48 ----- | 53 ----- |
49 | 54 |
50 **Example** | 55 **Example** |
51 | 56 |
52 Consider the following two 454 reads in Sanger FASTQ format (using line wrapping for display, but do note not all tools will accept line wrapped FASTQ files):: | 57 Consider the following two 454 reads in Sanger FASTQ format (using line wrapping for display, but do note not all tools will accept line wrapped FASTQ files):: |
53 | 58 |
57 ttatttattccacaagcaggtttaaattttaaatttaaattattgcagaagactttaaattaacctcgttgtcggagtca | 62 ttatttattccacaagcaggtttaaattttaaatttaaattattgcagaagactttaaattaacctcgttgtcggagtca |
58 tttgttcggttattggtcgaaagtaaccncgggaagtgccgaaaactaacaaacaaaagaagatagtgaaattttaatta | 63 tttgttcggttattggtcgaaagtaaccncgggaagtgccgaaaactaacaaacaaaagaagatagtgaaattttaatta |
59 aaanaaatagccaaacgtaactaactaaaacggacccgtcgaggaactgccaacggacgacacagggagtagnnn | 64 aaanaaatagccaaacgtaactaactaaaacggacccgtcgaggaactgccaacggacgacacagggagtagnnn |
60 +FSRRS4401BE7HA [length=395] [gc=36.46] [flows=800] [phred_min=0] [phred_max=40] [trimmed_length=95] | 65 +FSRRS4401BE7HA [length=395] [gc=36.46] [flows=800] [phred_min=0] [phred_max=40] [trimmed_length=95] |
61 FFFDDDDDDDA666?688FFHGGIIIIIIIIIIIIIIIIIIHHHIIIIIIIIIGHGFFFFF====DFFFFFFFFFFFFFF | 66 FFFDDDDDDDA666?688FFHGGIIIIIIIIIIIIIIIIIIHHHIIIIIIIIIGHGFFFFF====DFFFFFFFFFFFFFF |
62 D???:3104/76=:5...4.3,,,366////4<ABBAAA=CCFDDDDDDDD:666CDFFFF=<ABA=;:333111<===9 | 67 D???:3104/76=:5...4.3,,,366////4<ABBAAA=CCFDDDDDDDD:666CDFFFF=<ABA=;:333111<===9 |
63 9;B889FFFFFFDDBDBDDD=8844231..,,,-,,,,,,,,1133..---17111,,,,,22555131121.--.,333 | 68 9;B889FFFFFFDDBDBDDD=8844231..,,,-,,,,,,,,1133..---17111,,,,,22555131121.--.,333 |
64 11,.,,3--,,.,,--,3511123..--!,,,,--,----9,,,,8=,,-,,,-,,,,---26:9:5-..1,,,,11//, | 69 11,.,,3--,,.,,--,3511123..--!,,,,--,----9,,,,8=,,-,,,-,,,,---26:9:5-..1,,,,11//, |
65 ,,,!,,1917--,,,,-3.,--,,17,,,,---+11113.030000,,,044400036;96662.//;7><;!!! | 70 ,,,!,,1917--,,,,-3.,--,,17,,,,---+11113.030000,,,044400036;96662.//;7><;!!! |
66 @FSRRS4401BRRTC [length=145] [gc=38.62] [flows=800] [phred_min=0] [phred_max=38] [trimmed_length=74] | 71 @FSRRS4401BRRTC [length=145] [gc=38.62] [flows=800] [phred_min=0] [phred_max=38] [trimmed_length=74] |
67 tcagCCAGCAATTCCGACTTAATTGTTCTTCTTCCATCATTCATCTCGACTAACAGTTCTACGATTAATGAGTTTGGCtt | 72 tcagCCAGCAATTCCGACTTAATTGTTCTTCTTCCATCATTCATCTCGACTAACAGTTCTACGATTAATGAGTTTGGCtt |
68 taatttgttgttcattattgtcacaattacactactgagactgccaaggcacncagggataggnn | 73 taatttgttgttcattattgtcacaattacactactgagactgccaaggcacncagggataggnn |
69 +FSRRS4401BRRTC [length=145] [gc=38.62] [flows=800] [phred_min=0] [phred_max=38] [trimmed_length=74] | 74 +FSRRS4401BRRTC [length=145] [gc=38.62] [flows=800] [phred_min=0] [phred_max=38] [trimmed_length=74] |
70 FFFFFFFFFDDDDFFFFGFDDDDBAAAAA=<4444@@B=555:BBBBB@@?8:8<?<89898<84442;==3,,,514,, | 75 FFFFFFFFFDDDDFFFFGFDDDDBAAAAA=<4444@@B=555:BBBBB@@?8:8<?<89898<84442;==3,,,514,, |
71 ,11,,,.,,21777555513,..--1115758.//34488><<;;;;9944/!/4,,,57855!! | 76 ,11,,,.,,21777555513,..--1115758.//34488><<;;;;9944/!/4,,,57855!! |
72 | 77 |
73 By default this is converted into a 3 column tabular file, with the full FASTQ title used as column 1: | 78 By default this is converted into a 3 column tabular file, with the full FASTQ title used as column 1: |
74 | 79 |
75 =================================================================================================== ============== ============== | 80 =================================================================================================== ============== ============== |
76 FSRRS4401BE7HA [length=395] [gc=36.46] [flows=800] [phred_min=0] [phred_max=40] [trimmed_length=95] tcagTTAA...nnn FFFDDDDD...!!! | 81 FSRRS4401BE7HA [length=395] [gc=36.46] [flows=800] [phred_min=0] [phred_max=40] [trimmed_length=95] tcagTTAA...nnn FFFDDDDD...!!! |
90 FSRRS4401BE7HA [length=395] [gc=36.46] [flows=800] [phred_min=0] [phred_max=40] [trimmed_length=95] tcagTTAA...nnn FFFDDDDD...!!! | 95 FSRRS4401BE7HA [length=395] [gc=36.46] [flows=800] [phred_min=0] [phred_max=40] [trimmed_length=95] tcagTTAA...nnn FFFDDDDD...!!! |
91 FSRRS4401BRRTC [length=145] [gc=38.62] [flows=800] [phred_min=0] [phred_max=38] [trimmed_length=74] tcagCCAG...gnn FFFFFFFF...5!! | 96 FSRRS4401BRRTC [length=145] [gc=38.62] [flows=800] [phred_min=0] [phred_max=38] [trimmed_length=74] tcagCCAG...gnn FFFFFFFF...5!! |
92 ============== ============ ========== =========== ============= ============== =================== ============== ============== | 97 ============== ============ ========== =========== ============= ============== =================== ============== ============== |
93 | 98 |
94 Note the sequences and quality strings have been truncated for display purposes in the above tables. | 99 Note the sequences and quality strings have been truncated for display purposes in the above tables. |
95 | 100 ]]></help> |
96 ------ | 101 <citations> |
97 | 102 <citation type="doi">10.1093/bioinformatics/btq281</citation> |
98 </help> | 103 </citations> |
99 | |
100 <citations> | |
101 <citation type="doi">10.1093/bioinformatics/btq281</citation> | |
102 </citations> | |
103 | |
104 </tool> | 104 </tool> |