# HG changeset patch # User elixir-it # Date 1541771594 18000 # Node ID c8dda64568274de8aeb1fe170a71c583e6b3dd1c # Parent 91abc25944cf2d04ef2d669b1a9bc449ec9c0300 Uploaded diff -r 91abc25944cf -r c8dda6456827 covacs_VariantRecalibrator.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/covacs_VariantRecalibrator.xml Fri Nov 09 08:53:14 2018 -0500 @@ -0,0 +1,223 @@ + + GATK VariantRecalibrator wrapper Version = 3.8 + + bed_macros.xml + vcf_macros.xml + + + gatk + + + $log + ]]> + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +.. class:: warningmark + +**IMPORTANT** to get the wrapper ready to start the admin user have to download gatk GATK version 3.8 from the broadinstitute site https://software.broadinstitute.org/gatk/download/archive and then move it in the conda_prefix folder, the path of the conda_prefix is written in the galaxy.ini(or .yml) file + + **more informations** at https://software.broadinstitute.org/gatk/documentation/tooldocs/3.8-0/org_broadinstitute_gatk_tools_walkers_variantrecalibration_VariantRecalibrator.php + +----- + +**Implemented options** VariantRecalibrator: + +**-L** : One or more genomic intervals over which to operate(file.bed) + +**-ip** Amount of padding (in bp) to add to each interval + +**--resource:NAME,known=true/false,training=true/false,truth=true/false,prior=float $file** :A list of sites for which to apply a prior probability of being correct but which aren't used by the algorithm (training and truth sets are required to run) + +**-mode** : Recalibration mode to employ (SNP|INDEL) + +**-an** : annotations which should used for calculations + +**-tranche** The levels of truth sensitivity at which to slice the data. (in percent, that is 1.0 for 1 percent) + +**in case of indels mode** + +**--minNumBadVariants** : Minimum number of bad variants + +**--maxGaussians** : Max number of Gaussians for the positive model + +**-mNG** : Max number of Gaussians for the negative model + +**OUTPUTS** + +-recalFile + +-tranchesFile + +----- + +.. class:: infomark + +**Recommended CoVaCS command** + +**-ip** 100 + +**-R** genome.fa + +**-input** VCF + +**-resource**:hapmap,known=false,training=true,truth=true,prior=15.0 hapmap.vcf + +**-resource**:omni,known=false,training=true,truth=true,prior=12.0 omni.vcf + +**-resource**:1000G,known=false,training=false,truth=false,prior=8.0 1000G.vcf + +**-resource**:dbsnp,known=true,training=false,truth=false,prior=2.0 dbsnp.vcf + +**-mode** SNP + +**-an** DP **-an** QD **-an** MQ **-an** MQRankSum **-an** ReadPosRankSum **-an** FS + +**-tranche** 100.0 **-tranche** 99.5 **-tranche** 99.0 **-tranche** 98.5 **-tranche** 90.0 + + + + 10.1186/s12864-018-4508-1 + + + diff -r 91abc25944cf -r c8dda6456827 mv_untar_gatk.sh --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/mv_untar_gatk.sh Fri Nov 09 08:53:14 2018 -0500 @@ -0,0 +1,9 @@ +#!/bin/bash +#if the .jar file is not present in the conda_prefix the script search the tar.gz in the conda_prefix of the vm +#and untar the archive +if [[ ! -f $CONDA_PREFIX/../../GenomeAnalysisTK.jar ]] ; then + tar -zxvf $CONDA_PREFIX/../../GenomeAnalysis*.tar.gz -C $CONDA_PREFIX/../../ + +else + echo GATK is present +fi