Mercurial > repos > morinlab > lumpy
changeset 0:ec43f38f18c2 draft
Uploaded
author | morinlab |
---|---|
date | Sun, 04 Dec 2016 14:29:45 -0500 |
parents | |
children | f2d9c9f18d3f |
files | lumpy.xml |
diffstat | 1 files changed, 146 insertions(+), 0 deletions(-) [+] |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/lumpy.xml Sun Dec 04 14:29:45 2016 -0500 @@ -0,0 +1,146 @@ +<tool id="lumpy" name="LUMPY" version="0.2.9"> + <description> + a probabilistic framework for structural variant discovery + </description> + <requirements> + <requirement type="package" version="0.1.19">samtools</requirement> + <requirement type="package" version="0.2.9">lumpy</requirement> + <requirement type="set_environment" version="0.2.9">LUMPY_SCRIPTS</requirement> + <requirement type="package" version="1.9">numpy</requirement> + </requirements> + <command> + + <!-- Create Symbolic links to bam and bam indexes --> + ln -s $normal normal.bam; + ln -s $normal.metadata.bam_index normal.bam.bai; + ln -s $tumour tumour.bam; + ln -s $tumour.metadata.bam_index tumour.bam.bai; + + <!-- EXTRACT DISCORDANT PAIRED END ALIGNMENTS --> + samtools view -F 1294 -b normal.bam | samtools sort - normal.pe; + samtools view -F 1294 -b tumour.bam | samtools sort - tumour.pe; + + <!-- EXTRACT SPLIT-READ ALIGNMENTS --> + samtools view -h normal.bam | + \$LUMPY_SCRIPTS/extractSplitReads_BwaMem -i stdin | + samtools view -Sb - | + samtools sort - normal.sr; + samtools view -h tumour.bam | + \$LUMPY_SCRIPTS/extractSplitReads_BwaMem -i stdin | + samtools view -Sb - | + samtools sort - tumour.sr; + + <!-- CREATE HISTO FILE --> + samtools view normal.bam | + tail -n+100000 | + \$LUMPY_SCRIPTS/pairend_distro.py -r 150 -X 4 -N 10000 -o normal.pe.histo > normal.stats; + samtools view tumour.bam | + tail -n+100000 | + \$LUMPY_SCRIPTS/pairend_distro.py -r 150 -X 4 -N 10000 -o tumour.pe.histo > tumour.stats; + + <!-- Store MEAN and STD in nice format --> + cat -t normal.stats | sed s/\\^\\I/,/g > normal.stats.txt; + cat -t tumour.stats | sed s/\\^\\I/,/g > tumour.stats.txt; + + <!-- RUN LUMPY --> + + lumpy + -e + -tt $advancedsettings.tt + -mw $advancedsettings.mw + #if $x + -x $x + #end if + + -pe + bam_file:normal.pe.sort.bam, + histo_file:normal.pe.histo, + \$(cat normal.stats.txt), + read_length:$advancedsettings.pe_read_length, + min_non_overlap:$advancedsettings.pe_min_non_overlap, + discordant_z:$advancedsettings.pe_discordant_z, + back_distance:$advancedsettings.pe_back_distance, + min_mapping_threshold:$advancedsettings.pe_min_mapping_threshold, + weight:$advancedsettings.pe_weight, + #if $sampleid_source.manual: + id:PE-$sampleid_source.idn + #else: + id:PE-\$(basename $normal) + #end if + + -sr + bam_file:normal.sr.sort.bam, + back_distance:$advancedsettings.sr_back_distance, + min_mapping_threshold:$advancedsettings.sr_min_mapping_threshold, + weight:$advancedsettings.sr_weight, + min_clip:$advancedsettings.sr_min_clip, + #if $sampleid_source.manual: + id:SE-$sampleid_source.idn + #else + id:SE-\$(basename $normal) + #end if + + -pe + bam_file:n=tumour.pe.sort.bam, + histo_file:tumour.pe.histo, + \$(cat tumour.stats.txt), + read_length:$advancedsettings.pe_read_length, + min_non_overlap:$advancedsettings.pe_min_non_overlap, + discordant_z:$advancedsettings.pe_discordant_z, + back_distance:$advancedsettings.pe_back_distance, + min_mapping_threshold:$advancedsettings.pe_min_mapping_threshold, + weight:$advancedsettings.pe_weight, + #if $sampleid_source.manual: + id:PE-$sampleid_source.idt + #else: + id:PE-\$(basename $tumour) + #end if + + -sr + bam_file:tumour.sr.sort.bam, + back_distance:$advancedsettings.sr_back_distance, + min_mapping_threshold:$advancedsettings.sr_min_mapping_threshold, + weight:$advancedsettings.sr_weight, + min_clip:$advancedsettings.sr_min_clip, + #if $sampleid_source.manual: + id:SE-$sampleid_source.idt + #else + id:SE-\$(basename $tumour) + #end if + + > $outfile; + + </command> + <inputs> + <conditional name="sampleid_source"> + <param label="Choose the source to fetch Sample Identifiers" name="sampleid_selector" type="select"> + <option value="bamfile">BAM File Name</option> + <option value="manual">Manual</option> + </param> + <when value="manual"> + <param name="idn" type="text" label="Tumour ID (Name)"/> + <param name="idt" type="text" label="Normal ID (Name)"/> + </when> + </conditional> + <param type="data" format="bam" name="normal" label="Normal Alignment File"/> + <param type="data" format="bam" name="tumour" label="Tumour Alignment File"/> + <param type="data" format="bed" name="x" label="Exluded Regions BED file" optional="true"/> + <section name="advancedsettings" title="Advanced Settings" expanded="false"> + <param type="integer" value="5" name="mw" label="Minimum Weight for Call"/> + <param type="integer" value="3" name="tt" label="Trim Threshold"/> + <param type="integer" name="pe_back_distance" value="20" label="Paired End Back Distance" help="Distance into the read to add the breakpoint interval"/> + <param type="integer" name="pe_min_mapping_threshold" value="1" label="Paired End Min Mapping Threshold" help="Minimum mapping quality that a read must have to be considered"/> + <param type="integer" name="pe_weight" value="1" label="Paired End Weight" help="Weight of each piece of evidence from this sample"/> + <param type="integer" name="pe_discordant_z" value="4" label="Paired End Discordant Value" help="Number of standard deviations away from the mean to be considered as a normal library size"/> + <param type="integer" name="pe_read_length" value="150" label="Paired End Read Length" help="Length of sequenced reads"/> + <param type="integer" name="pe_min_non_overlap" value="150" label="Paired End Min Non Overlap" help="Number of base pair positions that must be unique to each end of a read pair"/> + <param type="integer" name="sr_back_distance" value="20" label="Split Read Back Distance" help="Distance into the read to add the breakpoint interval"/> + <param type="integer" name="sr_min_mapping_threshold" value="1" label="Split Read Min Mapping Threshold" help="Minimum mapping quality that a read must have to be considered"/> + <param type="integer" name="sr_weight" value="1" label="Split Read Weight" help="Weight of each piece of evidence from this sample"/> + <param type="integer" name="sr_min_clip" value="1" label="Spliy Read Min Clip" help="Minimum number of clipped bases to consider in a split read"/> + </section> + </inputs> + <outputs> + <data type="vcf" name="outfile"/> + </outputs> +</tool> \ No newline at end of file