view deseq2.xml @ 15:ff74cd9b0414 draft

Uploaded
author bgruening
date Thu, 05 Sep 2013 04:09:22 -0400
parents bb5c80d15e0a
children 1d2a02bc2208
line wrap: on
line source

<tool id="deseq2" name="DESeq2" version="2.0.1">
  <description>Determines differentially expressed transcripts from read alignments</description>
    <requirements>
        <requirement type="binary">Rscript</requirement>
        <requirement type="R-module">DESeq2</requirement>
        <requirement type="package" version="3.0.1">R_3_0_1</requirement>
        <requirement type="set_environment">DESEQ2_SCRIPT_PATH</requirement>
    </requirements>
    <command interpreter="Rscript">
        deseq2.R
            -o "$deseq_out"

            #if $pdf:
                -p "$plots"
            #end if

            -i "$input_matrix"

        #if $filter_sel.filter_sel_opts == 'all_vs_all':
            -s 'all_vs_all'
        #else:
            -s ## build a string like '1,2 5,6'
            "${filter_sel.control_cols} ${filter_sel.experiement_cols}"

            #set $temp_factor_list = list()
            #set $is_multi_factor_analysis = False
            #for $factor in $filter_sel.factor:
                #set $is_multi_factor_analysis = True
                $temp_factor_list.append( '%s:%s' % ($factor.factor_name.replace(' ','_'), $factor.factor_index) )
            #end for

            #if $is_multi_factor_analysis:
                -f "#echo ' '.join( $temp_factor_list )#"
            #end if
        #end if

    </command>
    <stdio>
        <regex match="Execution halted" 
           source="both" 
           level="fatal" 
           description="Execution halted." />
        <regex match="Input-Error 01" 
           source="both" 
           level="fatal" 
           description="Error in your input parameters: Make sure you only apply factors to selected samples." />
        <regex match="Error in" 
           source="both" 
           level="fatal" 
           description="An undefined error occured, please check your intput carefully and contact your administrator." />
    </stdio>
    <inputs>
        <param format="tabular" name="input_matrix" type="data" label="Countmatrix" help="You can create a count matrix with the tool ..."/>

         <conditional name="filter_sel">
            <param name="filter_sel_opts" type="select" label="Select properties to filter">
              <option value="all_vs_all">All against all</option>
              <option value="specific">specific</option>
            </param>
            <when value="specific">

                <param name="control_cols" label="Select columns containing treatment." type="data_column" data_ref="input_matrix"
                    numerical="True" multiple="true" use_header_names="true" size="120" display="checkboxes">
                    <validator type="no_options" message="Please select at least one column."/>
                </param>

                <param name="experiement_cols" label="Select columns containing treatment." type="data_column" data_ref="input_matrix"
                    numerical="True" multiple="true" use_header_names="true" size="120" display="checkboxes">
                    <validator type="no_options" message="Please select at least one column."/>
                </param>

                <repeat name="factor" title="Include multi-factor analysis">
                    <param name="factor_name" type="text" value="Factor Name" label="Specify a factor name" help=""/>

                    <param name="factor_index" label="Select columns that are associated with a factor." type="data_column" data_ref="input_matrix"
                        numerical="True" multiple="true" use_header_names="true" size="120" display="checkboxes">
                        <validator type="no_options" message="Please select at least one column."/>
                    </param>
                </repeat>

            </when>
            <when value="all_v_all" />
        </conditional>

        <param name="pdf" type="boolean" truevalue="" falsevalue="" checked="true" label="Visualising the analysis results"
            help="output an additional PDF file" />

    </inputs>

  <outputs>
    <data format="tabular" name="deseq_out" label="DESeq2 result file on ${on_string}"/>
    <data format="pdf" name="plots" label="DESeq2 plots on ${on_string}">
        <filter>pdf == True</filter>
    </data>
  </outputs>

  <help>

.. class:: infomark

**What it does** 

Estimate variance-mean dependence in count data from high-throughput sequencing assays and test for differential expression based on a model using the negative binomial distribution


**Inputs**

DESeq2_ requires one count matrix as input file. You can use the tool



**Output**

DESeq2_ generates a tabular file containing the different columns and optional visualized results as PDF.

====== ==========================================================
Column Description
------ ----------------------------------------------------------
     1 Sample ID (corresponds to the header in your count matrix)
     2 Gene Identifiers
     3 mean normalised counts, averaged over all samples from both conditions
     4 the logarithm (to basis 2) of the fold change
     5 standard error estimate for the log2 fold change estimate
     6 p value for the statistical significance of this change
     7 p value adjusted for multiple testing with the Benjamini-Hochberg procedure
       which controls false discovery rate (FDR)
====== ==========================================================


------

**References** 

DESeq2_ Authors: Michael Love (MPIMG Berlin), Simon Anders, Wolfgang Huber (EMBL Heidelberg)

If _DESeq2_ is used to obtain results for scientific publications it
should be cited as [1]_. A paper describing DESeq2_ is in preparation.



.. [1] Anders, S and Huber, W (2010): `Differential expression analysis for sequence count data`_. 

.. _Differential expression analysis for sequence count data: http://dx.doi.org/10.1186/gb-2010-11-10-r106
.. _DESeq2: http://master.bioconductor.org/packages/release/bioc/html/DESeq2.html


  </help>
</tool>