view macs2_filterdup.xml @ 0:9c157b556c33 draft

Uploaded
author iuc
date Thu, 16 Jan 2014 13:31:17 -0500
parents
children d202e3d663bb
line wrap: on
line source

<tool id="macs2_filterdup" name="Remove duplicate reads" version="2.0.10.0">
    <description>at the same position</description>
    <requirements>
        <requirement type="python-module">macs2</requirement>
        <requirement type="python-module">numpy</requirement>
        <requirement type="package" version="2.0.10.2">macs2</requirement>
        <requirement type="package" version="1.7.1">numpy</requirement>
    </requirements>
    <command>
        macs2 filterdup
            -t $infile
            -o $outfile

        --format '$ifile.extension.upper()'
        --gsize $gsize
        --tsize $tsize
        --pvalue $pvalue
        #if str( $keep_dup_options.keep_dup_options_selector ) == "user":
            --keep-dup $keep_dup_options.user_keepdup
        #else
            --keep-dup str( $keep_dup_options.keep_dup_options_selector )
        #end if
    </command>
    <inputs>

        <!--may need to add a few more formats at later time-->
        <param name="infile" type="data" format="sam,bam,bed" label="Sequencing alignment file" />
        <param name="gsize" type="float" label="Effective genome size" value="2.7e+9" help="Human: 3.3e+9, Mouse: 3.0e+9, Fly: 1.9e+8, Worm: 1.3e+8 (--gsize)" />
        <param name="tsize" type="float" label="Tag size" value="-1.0" help="This will overide the auto detected tag size. DEFAULT: Not set (-1.0)  (--tsize)" />
        <param name="pvalue" type="float" label="Pvalue cutoff for binomial distribution test" value="1e-5" help="default: 1e-5 (--pvalue)" />

        <conditional name="keep_dup_options">
            <param name="keep_dup_options_selector" type="select" label="controlling behavior of duplicate tags at the exact same location"
                help="It controls the 'macs2 filterdup' behavior towards duplicate tags at the exact same location (the same coordination and the same strand. The default 'auto') option makes 'macs2 filterdup' calculate the maximum tags at the exact same location based on binomal distribution using given -p as pvalue cutoff; and the 'all' option keeps every tags (useful if you only want to convert formats). If an integer is given, at most this number of tags will be kept at the same location. Default: auto">
                <option value="auto">auto</option>
                <option value="all">all</option>
                <option value="user">user defined</option>
            </param>
            <when value="user">
                <param name="user_keepdup" type="integer" label="Keep at most this number of tags" value="10"/>
            </when>
        </conditional>

    </inputs>
    <outputs>
        <data name="outfile" format="bed" label="${tool.name} on ${on_string}" />
  </outputs>
  <tests>
    <!--none yet for macs2-->
  </tests>
  <help>
**What it does**

Remove duplicate reads at the same position, then convert acceptable format to BED format.
filterdup tool from macs2
------

**Citation**

For the underlying tool, please cite Zhang Y, Liu T, Meyer CA, Eeckhoute J, Johnson DS, Bernstein BE, Nusbaum C, Myers RM, Brown M, Li W, Liu XS. Model-based analysis of ChIP-Seq (MACS). Genome Biol. 2008;9(9):R137.

Integration of MACS2 with Galaxy performed by Ziru Zhou ( ziruzhou@gmail.com ). Please send your comments/questions to modENCODE DCC at help@modencode.org.
  </help>
</tool>