view plotCorrelation.xml @ 2:c5634baf9bf9 draft

planemo upload for repository https://github.com/fidelram/deepTools/tree/master/galaxy/wrapper/ commit 4e5124484b42d4ffef76af4bd82a6feb67a5b829
author bgruening
date Fri, 18 Dec 2015 12:27:26 -0500
parents b0050909cf03
children e556e34fc12a
line wrap: on
line source

<tool id="deeptools_plot_correlation" name="plotCorrelation" version="@WRAPPER_VERSION@.0">
    <description>creates a heatmap of correlation scores between different samples </description>
    <macros>
        <token name="@BINARY@">plotCorrelation</token>
        <import>deepTools_macros.xml</import>
    </macros>
    <expand macro="requirements"/>
    <command>
<![CDATA[
        @BINARY@
            --corData "$corData"
            --plotFile "$outFileName"
            --corMethod "$corMethod"
            --whatToPlot "$whatToPlot"
            $skipZeros
            --plotFileFormat "$outFileFormat"
            $removeOutliers
            --outFileCorMatrix "$matrix"
            @HEATMAP_OPTIONS@

]]>
    </command>
    <inputs>
        <param name="corData" format="deeptools_coverage_matrix" type="data" label="Matrix file from the bamCorrelate tool"/>
        <expand macro="corMethod" />

        <param argument="--whatToPlot" type="select" label="Plotting type">
            <option value="heatmap" selected="True">Heatmap</option>
            <option value="scatterplot">Scatterplot</option>
        </param>

        <expand macro="skipZeros" />

        <expand macro="image_file_format" />

        <param argument="--removeOutliers" type="boolean"
            truevalue="--removeOutliers" falsevalue="" label="Remove regions with very large counts"
            help="If set, bins with very large counts are removed. Bins
                with abnormally high reads counts artificially
                increase pearson correlation; that's why, by default,
                bamCorrelate tries to remove outliers using the median
                absolute deviation (MAD) method applying a threshold
                of 200 to only consider extremely large deviations
                from the median. ENCODE blacklist page (https://sites.
                google.com/site/anshulkundaje/projects/blacklists)
                contains useful information about regions with
                unusually high counts."/>

        <param name="outFileCorMatrix" type="boolean" label="Save the matrix of values underlying the heatmap"/>
        <expand macro="heatmap_options" />

    </inputs>
    <outputs>
        <expand macro="output_image_file_format" />
        <data format="tabular" name="matrix" label="${tool.name} on ${on_string}: Correlation matrix">
            <filter>outFileCorMatrix is True</filter>
        </data>
    </outputs>
    <tests>
        <test>
            <param name="corData" value="bamCorrelate_result1.npz" ftype="deeptools_coverage_matrix" />
            <param name="outFileFormat" value="png" />
            <param name="outFileCorMatrix" value="True" />
            <output name="matrix" file="plotCorrelation_result1.tabular" ftype="tabular" />
            <output name="outFileName" file="plotCorrelation_result1.png" ftype="png" compare="sim_size" delta="100" />
        </test>
        <test>
            <param name="corData" value="bamCorrelate_result1.npz" ftype="deeptools_coverage_matrix" />
            <param name="outFileFormat" value="png" />
            <param name="whatToPlot" value="scatterplot" />
            <param name="removeOutliers" value="True" />
            <param name="plotTitle" value="Test Plot" />
            <output name="outFileName" file="plotCorrelation_result2.png" compare="sim_size" delta="100" />
        </test>
    </tests>
    <help>
<![CDATA[
**What it does**

This tools takes a compressed matrix of scores (such as read coverages) for a number of genomic regions
and different samples. It can visualize the correlation among samples as scatterplots or as 
heatmap of correlation coefficients. Further output files are optional.
The compressed input matrices are easily generated using the "bamCorrelate" and "bigwigCorrelate" modules of deeptools.


.. image:: $PATH_TO_IMAGES/QC_bamCorrelate_humanSamples.png
   :alt: Heatmap of RNA Polymerase II ChIP-seq


You can find more details on plotCorrelation here http://deeptools.readthedocs.org/en/release-1.6/content/tools/plotCorrelation.html


**Output files**:

- **correlation structure**: a scatterplot of all mutual correlations between all samples in matrix
- **diagnostic plot**: clustered heatmap displaying the values for each pair-wise correlation, see below for an example
- data matrix (optional): if you want to analyze or plot the correlation values using a different program, e.g. R, this matrix can be used

-----

@REFERENCES@
]]>
    </help>
    <expand macro="citations" />
</tool>