diff dada2_derepFastq.xml @ 2:68a4233fd445 draft

planemo upload for repository https://github.com/bernt-matthias/mb-galaxy-tools/tree/topic/dada2/tools/dada2 commit 5b1603bbcd3f139cad5c876be83fcb39697b5613-dirty
author matthias
date Tue, 09 Apr 2019 07:02:20 -0400
parents 3f0bbe41052f
children d79b4d99b6de
line wrap: on
line diff
--- a/dada2_derepFastq.xml	Fri Mar 08 08:33:05 2019 -0500
+++ b/dada2_derepFastq.xml	Tue Apr 09 07:02:20 2019 -0400
@@ -1,4 +1,4 @@
-<tool id="dada2_derepFastq" name="dada2: derepFastq" version="@DADA2_VERSION@">
+<tool id="dada2_derepFastq" name="dada2: derepFastq" version="@DADA2_VERSION@+galaxy@WRAPPER_VERSION@">
     <description>dereplicate amplicon sequences</description>
     <macros>
         <import>macros.xml</import>
@@ -27,11 +27,31 @@
     <tests>
         <test>
             <param name="reads" value="filterAndTrim_single_F3D0_R1.fq.gz" ftype="fastqsanger.gz" />
-            <output name="output" value="derepFastq_single_F3D0_R1.table" ftype="dada2_derep" />
+            <output name="output" value="derepFastq_single_F3D0_R1.table" ftype="dada2_derep" >
+				<extra_files type="file" name="Rdata" value="derepFastq_single_F3D0_R1.Rdata" />
+            </output>
         </test>
     </tests>
     <help><![CDATA[
-        TODO: Fill in help.
+Description
+...........
+
+Dereplication combines all identical sequencing reads into into “unique sequences” with a corresponding “abundance” equal to the number of reads with that unique sequence. Dereplication substantially reduces computation time by eliminating redundant comparisons.
+
+Usage
+.....
+
+**Input** is a FASTQ dataset containing the filtered and trimmed reads of a sample. 
+
+**Output** a dataset with type *dada2_derep* which is a table that shows the 
+dereplicated sequences and their abundances.
+
+The output can be used as input for the *dada2: dada* tool which infers the sample composition from the dereplicated sequences given an error model. 
+
+Details
+.......
+
+Dereplication in the DADA2 pipeline has one crucial addition from other pipelines: DADA2 retains a summary of the quality information associated with each unique sequence. The consensus quality profile of a unique sequence is the average of the positional qualities from the dereplicated reads. These quality profiles inform the error model of the subsequent sample inference step, significantly increasing DADA2’s accuracy.
     ]]></help>
     <expand macro="citations"/>
 </tool>