view bedtools-galaxy/intersectBed.xml @ 0:fa875e3c66c3 draft

Uploaded
author bgruening
date Wed, 02 Jan 2013 18:27:11 -0500
parents
children 3b3e7774f51a
line wrap: on
line source

<tool id="bedtools_intersectbed" name="Intersect interval files" version="0.2.0">
    <description>
    </description>
    <requirements>
        <requirement type="package" version="2.17.0_5e4507c54355a4a38c6d3e7497a2836a123c6655">bedtools</requirement>
    </requirements>

    <command>
        intersectBed
        #if $inputA.ext == "bam":
            -abam $inputA
        #else:
            -a $inputA
        #end if

        -b $inputB
        $split
        $strand
        #if str($fraction):
          -f $fraction
        #end if
        $reciprocal
        $invert
        $once
        $header
        $overlap_mode
        &gt; $output
    </command>

    <inputs>
        <param format="bed,bam" name="inputA" type="data" label="BED or BAM file"/>
        <param format="bed" name="inputB" type="data" label="overlap intervals in this BED file?"/>
        
        <param name="strand" type="select" label="Calculate coverage based on">
            <option value="">Overlaps on either strand</option>
            <option value="-s">Only overlaps occurring on the **same** strand.</option>
            <option value="-S">Only overlaps occurring on the **opposite** strand.</option>
        </param>

        <param name="overlap_mode" type="select" label="Calculate coverage based on">
            <option value="">Overlaps on either strand</option>
            <option value="-wa">Write the original entry in A for each overlap.</option>
            <option value="-wb">Write the original entry in B for each overlap. Useful for knowing what A overlaps. Restricted by the fraction- and reciprocal option.</option>
            <option value="-wo">Write the original A and B entries plus the number of base pairs of overlap between the two features. Only A features with overlap are reported. Restricted by the fraction- and reciprocal option.</option>
            <option value="-wao">Write the original A and B entries plus the number of base pairs of overlap between the two features. However, A features w/o overlap are also reported with a NULL B feature and overlap = 0. Restricted by the fraction- and reciprocal option.</option>
            <option value="-loj">Perform a "left outer join". That is, for each feature in A report each overlap with B.  If no overlaps are found, report a NULL feature for B.</option>
        </param>

        <param name="split" type="boolean" checked="true" truevalue="-split" falsevalue="" label="Treat split/spliced BAM or BED12 entries as distinct BED intervals when computing coverage." help="If set, the coverage will be calculated based the spliced intervals only. For BAM files, this inspects the CIGAR N operation to infer the blocks for computing coverage. For BED12 files, this inspects the BlockCount, BlockStarts, and BlockEnds fields (i.e., columns 10,11,12). If this option is not set, coverage will be calculated based on the interval's START/END coordinates, and would include introns in the case of RNAseq data." />
        <!-- -f -->
        <param name="fraction" type="text" optional="true" label="Minimum overlap required as a fraction of the BAM alignment" help="Alignments are only retained if the overlap with the an interval in the BED file comprises at least this fraction of the BAM alignment's length.  For example, to require that the overlap affects 50% of the BAM alignment, use 0.50"/>
        <!-- -r -->
        <param name="reciprocal" type="boolean" checked="false" truevalue="-r" falsevalue="" label="Require reciprocal overlap." help="If set, the overlap between the BAM alignment and the BED interval must affect the above fraction of both the alignment and the BED interval." />
        <!-- -v -->
        <param name="invert" type="boolean" checked="false" truevalue="-v" falsevalue="" label="Report only those alignments that **do not** overlap the BED file."/>
        <!-- -u -->
        <param name="once" type="boolean" checked="false" truevalue="-u" falsevalue="" label="Write the original A entry _once_ if _any_ overlaps found in B." help="Just report the fact >=1 hit was found." />
        <!-- -c -->
        <param name="count" type="boolean" checked="false" truevalue="-c" falsevalue="" label="For each entry in A, report the number of overlaps with B." help="Reports 0 for A entries that have no overlap with B." />
        <!-- -sorted	Use the "chromsweep" algorithm for sorted (-k1,1 -k2,2n) input -->

        <!-- header -->
        <param name="header" type="boolean" checked="false" truevalue="-header" falsevalue="" label="Print the header from the A file prior to results." />


    </inputs>

    <outputs>
        <data format_source="inputA" name="output" metadata_source="inputA" label="Intersection of ${inputA.name} and ${inputB.name}"/>
    </outputs>

<help>

**What it does**

This tool creates a new BAM alignment file based on alignments that overlap (or optionally, those that do not overlap) intervals in another BED file.  Example usage would be to cull a BAM file from an exome capture experiment to include on the "on-target" alignments. 

.. class:: infomark

Note that each BAM alignment is treated individually.  Therefore, if one end of a paired-end alignment overlaps an interval in the BED file, yet the other end does not, the output file will only include the overlapping end.

.. class:: infomark

Note that a BAM alignment will be sent to the output file **once** even if it overlaps more than one interval in the BED file.

.. class:: warningmark

This tool requires that `bedtools`__ has been installed on your system.

------

This tool is part of the `bedtools package`__ from the `Quinlan laboratory`__. If you use this tool, please cite `Quinlan AR, and Hall I.M. BEDTools: A flexible framework for comparing genomic features. Bioinformatics, 2010, 26, 6.`__

    .. __: http://code.google.com/p/bedtools/
    .. __: http://code.google.com/p/bedtools/
    .. __: http://cphg.virginia.edu/quinlan/
    .. __: http://bioinformatics.oxfordjournals.org/content/26/6/841.short

</help>
</tool>