<tool id="usearch_fastq_mergepairs" name="usearch fastq_mergepairs" version="0.0.2">
    <description>merging of paired reads</description>
    <version_command>usearch -version</version_command>
    <!--
        Command template (Cheetah).
        * Integer thresholds left at their default of 0 are omitted from the
          command line entirely (see the "#if ... != 0" guards).
        * $allowmergestagger expands to its truevalue flag or to an empty string.
        * The selected output format decides whether the result is written
          through -fastqout or -fastaout; both write to the same $output dataset.
    -->
    <command interpreter='bash'>usearch_wrapper.sh
        usearch
        -quiet

        -fastq_mergepairs '$input_forward'
        -reverse '$input_reverse'

        #if $minovlen.value != 0
            -fastq_minovlen $minovlen
        #end if

        #if $minmergelen.value != 0
            -fastq_minmergelen $minmergelen
        #end if

        #if $maxmergelen.value != 0
            -fastq_maxmergelen $maxmergelen
        #end if

        #if $maxdiffs.value != 0
            -fastq_maxdiffs $maxdiffs
        #end if

        #if $truncqual.value != 0
            -fastq_truncqual $truncqual
        #end if

        #if $minlen.value != 0
            -fastq_minlen $minlen
        #end if

        $allowmergestagger

        -fastq_ascii $ascii
        -fastq_qmin $qmin
        -fastq_qmax $qmax
        -fastq_qmaxout $qmaxout

        #if $output_format.format == "fastq"
            -fastqout $output
        #else
            -fastaout $output
        #end if
    </command>
    <inputs>
        <!-- INPUT OPTIONS -->
        <param name="input_forward" type="data" format="fastq,fastqsanger,fastqcssanger" label="1. File with forward reads" />
        <param name="input_reverse" type="data" format="fastq,fastqsanger,fastqcssanger" label="2. File with reverse reads" />
        <param name="minovlen" type="integer" value="0" label="3. Minimum length of the overlap" help="'0' means no minimum." />
        <param name="minmergelen" type="integer" value="0" label="4. Minimum length of the merged read" help="'0' means no minimum." />
        <param name="maxmergelen" type="integer" value="0" label="5. Maximum length of the merged read" help="'0' means no maximum." />
        <param name="maxdiffs" type="integer" value="0" label="6. Maximum number of mismatches allowed in the overlap region" help="'0' means any number of mismatches allowed." />
        <param name="truncqual" type="integer" value="0" label="7. Truncate the forward and reverse reads at the first Q that is equal or less than this value, if present"
               help="'0' means no quality truncation. This truncation is performed before aligning the pair. With Illumina paired reads, it is recommended to set this to 2 or higher, as low-quality tails will otherwise often cause alignment of the pair to fail." />
        <param name="minlen" type="integer" value="0" label="8. Minimum length of the forward and reverse read, after truncating per option 7 if applicable" help="'0' means no minimum." />
        <param name="allowmergestagger" type="boolean" truevalue="-fastq_allowmergestagger" falsevalue="" checked="false" label="9. Allow merge of a pair where the alignment is staggered" help="By default, pairs with staggered alignments are discarded." />
        <param name="ascii" type="integer" value="33" label="10. ASCII_BASE constant" help="See http://drive5.com/usearch/manual/fastq_params.html" />
        <param name="qmin" type="integer" value="0" label="11. Minimum Q score" />
        <param name="qmax" type="integer" value="41" label="12. Maximum Q score for input files" />
        <param name="qmaxout" type="integer" value="41" label="13. Maximum Q score for output files" />

        <!-- OUTPUT OPTIONS -->
        <!-- The conditional has no per-case parameters; it only carries the format choice. -->
        <conditional name="output_format">
            <param name="format" type="select" label="Output format">
                <option value="fastq" selected="true">FASTQ</option>
                <option value="fasta">FASTA</option>
            </param>
            <when value="fastq"></when>
            <when value="fasta"></when>
        </conditional>
    </inputs>
    <outputs>
        <data format="fastq" name="output" label="Merge output">
            <change_format>
                <!--
                    The select lives inside the "output_format" conditional, so it
                    must be addressed by its qualified name; a bare "format" does
                    not resolve and would leave FASTA output labelled as fastq.
                -->
                <when input="output_format.format" value="fasta" format="fasta" />
            </change_format>
        </data>
    </outputs>
    <tests>
        <!-- Merges the two bundled sanger FASTQ files with the input Q-score ceiling raised to 65. -->
        <test>
            <param name="input_forward" value="fastq_mergepairs_input1.fq" ftype="fastqsanger" />
            <param name="input_reverse" value="fastq_mergepairs_input2.fq" ftype="fastqsanger" />
            <param name="qmax" value="65" />
            <output name="output" file="fastq_mergepairs_output.fq" />
        </test>
    </tests>
    <help>
**What it Does**

Performs merging of paired reads.

The FASTQ filename for the forward reads is specified by the -fastq_mergepairs option, and the reverse read filename is specified by the -reverse option. Output files are specified by -fastqout (for FASTQ) and / or -fastaout (for FASTA).

Forward and reverse must be in 1:1 correspondence and must appear in the same order in both files. The labels for the forward and reverse read in a given pair must be identical except for a single position where a '1' appears in the forward read label and a '2' appears in the reverse read label.

-----

**Input formats**

Forward read::

    @IRIS:7:1:29:952#0/1
    TGAGAAGCAAGAAGAAGGTTGGTTAGTGTTTTGGAG
    +IRIS:7:1:29:952#0/1
    aaabaaaaaaaaaaa`aaY`aa^aaa^a_a_`aa``

Reverse read::

    @IRIS:7:1:29:952#0/2
    GACTCCAAAACACTAACCAACCTTCTTCTTGCTTCT
    +IRIS:7:1:29:952#0/2
    aaaabaaaabaaaabbaaaa````__`__^__``__

-----

**Output**

A multiple-fastq file, for example::

    @IRIS:7:1:29:952#0/1
    TGAGAAGCAAGAAGAAGGTTGGTTAGTGTTTTGGAGTC
    +
    aaJJJJJJJJJJJJJJJJJJJJJJJJJJJJJJJJJJaa

------

**Manual**

* USEARCH fastq_mergepairs command options: http://drive5.com/usearch/manual/fastq_mergepairs.html
* FASTQ format options: http://drive5.com/usearch/manual/fastq_params.html

**Citation**

Please cite one of these papers if you use USEARCH in published work.

Edgar,RC (2010) Search and clustering orders of magnitude faster than BLAST, Bioinformatics 26(19), 2460-2461.
doi: 10.1093/bioinformatics/btq461
    </help>
</tool>