# HG changeset patch # User devteam # Date 1392613432 18000 # Node ID e5b4ed9e0dbda52020f5d083e3637128c016149f # Parent f53372fd8631f031d81edc6eba17343b8aa501c8 Uploaded diff -r f53372fd8631 -r e5b4ed9e0dbd picard_DownsampleSam.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/picard_DownsampleSam.xml Mon Feb 17 00:03:52 2014 -0500 @@ -0,0 +1,57 @@ + + + picard + + picard_wrapper.py + --input=$inputFile + --output=$outFile + --probability=$probability + --seed=$seed + -j "\$JAVA_JAR_PATH/DownsampleSam.jar" + + + + + + + + + + + + + + + + + + + + + +.. class:: infomark + +**Purpose** + +Randomly down-sample a SAM or BAM file to retain a random subset of the reads. Mate-pairs are either both kept or both discarded. Reads marked as not primary alignments are all discarded. Each read is given a probability P of being retained - results with the exact same input in the same order and with the same value for RANDOM_SEED will produce the same results. + +**Picard documentation** + +This is a Galaxy wrapper for DownsampleSam, a part of the external package Picard-tools_. + + .. _Picard-tools: http://www.google.com/search?q=picard+samtools + +------ + +.. class:: warningmark + +**Warning on SAM/BAM quality** + +Many SAM/BAM files produced externally and uploaded to Galaxy do not fully conform to SAM/BAM specifications. Galaxy deals with this by using the **LENIENT** +flag when it runs Picard, which allows reads to be discarded if they're empty or don't map. This appears +to be the only way to deal with SAM/BAM that cannot be parsed. + + + + \ No newline at end of file