# HG changeset patch # User devteam # Date 1393302627 18000 # Node ID 7ea806787cf683279ed7b5523ea61ea52fee614a # Parent 0cab05ac1cbdb7e4a2fc8d76815f4a47b3a3b94c Uploaded diff -r 0cab05ac1cbd -r 7ea806787cf6 picard_InsertSizeMetrics.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/picard_InsertSizeMetrics.xml Mon Feb 24 23:30:27 2014 -0500 @@ -0,0 +1,97 @@ + + for PAIRED data + picard + + picard_wrapper.py -i "${input_file}" -n "${out_prefix}" --tmpdir "${__new_file_path__}" --deviations "${deviations}" + --histwidth "${histWidth}" --minpct "${minPct}" --malevel "${malevel}" + -j "\$JAVA_JAR_PATH/CollectInsertSizeMetrics.jar" -d "${html_file.files_path}" -t "${html_file}" + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +.. class:: infomark + +**Purpose** + +Reads a SAM or BAM file and describes the distribution +of insert size (excluding duplicates) with metrics and a histogram plot. + +**Picard documentation** + +This is a Galaxy wrapper for CollectInsertSizeMetrics, a part of the external package Picard-tools_. + + .. _Picard-tools: http://www.google.com/search?q=picard+samtools + +.. class:: warningmark + +**Useful for paired data only** + +This tool works for paired data only and can be expected to fail for single end data. + +----- + +.. class:: infomark + +**Inputs, outputs, and parameters** + +Picard documentation says (reformatted for Galaxy): + +.. csv-table:: + :header-rows: 1 + + Option,Description + "INPUT=File","SAM or BAM file Required." + "OUTPUT=File","File to write insert size metrics to Required." + "HISTOGRAM_FILE=File","File to write insert size histogram chart to Required." + "TAIL_LIMIT=Integer","When calculating mean and stdev stop when the bins in the tail of the distribution contain fewer than mode/TAIL_LIMIT items. This also limits how much data goes into each data category of the histogram." + "HISTOGRAM_WIDTH=Integer","Explicitly sets the histogram width, overriding the TAIL_LIMIT option. Also, when calculating mean and stdev, only bins LE HISTOGRAM_WIDTH will be included. " + "MINIMUM_PCT=Float","When generating the histogram, discard any data categories (out of FR, TANDEM, RF) that have fewer than this percentage of overall reads. (Range: 0 to 1) Default value: 0.01." + "STOP_AFTER=Integer","Stop after processing N reads, mainly for debugging. Default value: 0." + "CREATE_MD5_FILE=Boolean","Whether to create an MD5 digest for any BAM files created. Default value: false." + +.. class:: warningmark + +**Warning on SAM/BAM quality** + +Many SAM/BAM files produced externally and uploaded to Galaxy do not fully conform to SAM/BAM specifications. Galaxy deals with this by using the **LENIENT** +flag when it runs Picard, which allows reads to be discarded if they're empty or don't map. This appears +to be the only way to deal with SAM/BAM that cannot be parsed. + + +