# HG changeset patch # User elixir-it # Date 1530179925 14400 # Node ID 0cc081cd39922e1ccb9e6c412a77dd6c70d3e483 Uploaded diff -r 000000000000 -r 0cc081cd3992 mutect2.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/mutect2.xml Thu Jun 28 05:58:45 2018 -0400 @@ -0,0 +1,312 @@ + + somatic SNP and indel caller + + mutect2_macros_add_loc.xml + + + gatk + picard + samtools + + + $log + #end if + + ##TODO gatk-register take the GenomeAnalysisTK-3.8-0-ge9d806836.tar.bz2 unzip it + ##and move the .jar file to \$CONDA_DEFAULT_ENV/opt/gatk-3.8/ then the mutect2 command is runned + gatk3-register \$_CONDA_DIR/../GenomeAnalysisTK-3.8-0-ge9d806836.tar.bz2 2>$log ; + java -jar \$CONDA_DEFAULT_ENV/opt/gatk-3.8/GenomeAnalysisTK.jar -nct \${GALAXY_SLOTS:-4} -T MuTect2 -I:tumor tumor.bam -I:normal normal.bam -o $output + #if $reference_source == "history" + -R genome.fa + #else + -R $reference_source.ref_file.fields.path + #end if + ## TODO advanced inputs section if the optional inputs are present their options are added to the command + #if $dbSNP + --dbsnp dbSNP.vcf + #end if + #if $cosmic + --cosmic cosmic.vcf + #end if + #if $list + -L position.bed + #end if + #if $alleles + --alleles alleles.vcf + #end if + + ##TODO advanced options section if the options inputs are different from the default value the option is added to the command + + #if str($advanced.advanced_parameters) =="show": + #if $advanced.heterozygosity != "0.001" + --heterozygosity $advanced.heterozygosity + #end if + #if $advanced.heterozygosity_stdev != "0.01" + --heterozygosity_stdev $advanced.heterozygosity_stdev + #end if + #if $advanced.indel_heterozygosity != "1.25E-4" + --indel_heterozygosity $advanced.indel_heterozygosity + #end if + #if $advanced.initial_normal_lod != "0.5" + --initial_normal_lod $advanced.initial_normal_lod + #end if + #if $advanced.initial_tumor_lod != "4.0" + --initial_tumor_lod $advanced.initial_tumor_lod + #end if + #if $advanced.max_alt_allele_in_normal_fraction != "0.03" + --max_alt_allele_in_normal_fraction $advanced.max_alt_allele_in_normal_fraction + #end if + #if $advanced.max_alt_alleles_in_normal_count != "1" + --max_alt_alleles_in_normal_count $advanced.max_alt_alleles_in_normal_count + #end if + #if $advanced.max_alt_alleles_in_normal_qscore_sum != "20" + --max_alt_alleles_in_normal_qscore_sum $advanced.max_alt_alleles_in_normal_qscore_sum + #end if + #if $advanced.maxReadsInRegionPerSample != "1000" + --maxReadsInRegionPerSample $advanced.maxReadsInRegionPerSample + #end if + #if $advanced.min_base_quality_score != "10" + --min_base_quality_score $advanced.min_base_quality_score + #end if + #if $advanced.minReadsPerAlignmentStart != "5" + --minReadsPerAlignmentStart $advanced.minReadsPerAlignmentStart + #end if + #if $advanced.normal_lod != "2.2" + --normal_lod $advanced.normal_lod + #end if + #if $advanced.pir_mad_threshold != "3.0" + --pir_mad_threshold $advanced.pir_mad_threshold + #end if + #if $advanced.pir_median_threshold != "10.0" + --pir_median_threshold $advanced.pir_median_threshold + #end if + #if $advanced.power_constant_qscore != "30" + --power_constant_qscore $advanced.power_constant_qscore + #end if + #if $advanced.sample_ploidy != "2" + --sample_ploidy $advanced.sample_ploidy + #end if + #if $advanced.standard_min_confidence_threshold_for_calling != "10.0" + --standard_min_confidence_threshold_for_calling $advanced.standard_min_confidence_threshold_for_calling + #end if + #if $advanced.tumor_lod != "6.3" + --tumor_lod $advanced.tumor_lod + #end if + #if $advanced.contamination_fraction_to_filter != "0.0" + --contamination_fraction_to_filter $contamination_fraction_to_filter + #end if + #if $advanced.dbsnp_normal_lod != "5.5" + --dbsnp_normal_lod $dbsnp_normal_lod + #end if + #if $advanced.debug_read_name != "" + --debug_read_name $debug_read_name + #end if + #if $advanced.genotyping_mode != "DISCOVERY" + --genotyping_mode $genotyping_mode + #end if + #if $advanced.group + --group $advanced.group + #end if + #end if + + ##TODO output section --> if the option string == "yes" the optional output is added + #if str($optional_out1.outFile1) =="yes" + --activeRegionOut $activeRegionOut_output + #end if + #if str($optional_out2.outFile2) =="yes" + --activityProfileOut $activityProfileOut_output + #end if + #if str($optional_out3.outFile3) =="yes" + --graphOutput $graphOutput_output + #end if + #if str($optional_out4.outFile4) =="yes" + --bamOutput $bamOutput_output + #end if + ##TODO the standard error is redirected to the log file + 2> $log + ]]> + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + optional_out1['outFile1'] == 'yes' + + + optional_out2['outFile2'] == 'yes' + + + optional_out3['outFile3'] == 'yes' + + + optional_out4['outFile4'] == 'yes' + + + + + + + + + + + + + + **IMPORTANT** to get the wrapper ready to start the admin user have to download gatk GATK 3.8-0-ge9d806836 from the broadinstitute site https://software.broadinstitute.org/gatk/download/archive and then move it in the conda_prefix folder + the path of the conda_prefix is written in the galaxy.ini(or .yml) file + + MuTect2 is a somatic SNP and indel caller that combines the DREAM challenge-winning somatic genotyping engine of the original MuTect (Cibulskis et al., 2013) with the assembly-based machinery of HaplotypeCaller. + Galaxy wrapper for MuTect2 implements most but not all options available through the command line. Supported options are described below. + + **Optional Inputs** + + + --alleles none Set of alleles to use in genotyping + + --cosmic [] VCF file of COSMIC sites + + --dbsnp none dbSNP file + + --activityProfileOut NA Output the raw activity profile results in IGV format + + --graphOutput NA Write debug assembly graph information to this file + + **Optional Parameters** + + + --contamination_fraction_to_filter 0.0 Fraction of contamination to aggressively remove + + --dbsnp_normal_lod 5.5 LOD threshold for calling normal non-variant at dbsnp sites + + --debug_read_name NA trace this read name through the calling process + + --genotyping_mode DISCOVERY Specifies how to determine the alternate alleles to use for genotyping + + --group [] One or more classes/groups of annotations to apply to variant calls + + --heterozygosity 0.001 Heterozygosity value used to compute prior likelihoods for any locus + + --heterozygosity_stdev 0.01 Standard deviation of eterozygosity for SNP and indel calling + + --indel_heterozygosity 1.25E-4 Heterozygosity for indel calling + + --initial_normal_lod 0.5 Initial LOD threshold for calling normal variant + + --initial_tumor_lod 4.0 Initial LOD threshold for calling tumor variant + + --max_alt_allele_in_normal_fraction 0.03 Threshold for maximum alternate allele fraction in normal + + --max_alt_alleles_in_normal_count 1 Threshold for maximum alternate allele counts in normal + + --max_alt_alleles_in_normal_qscore_sum 20 Threshold for maximum alternate allele quality score sum in normal + + --maxReadsInRegionPerSample 1000 Maximum reads in an active region + + --min_base_quality_score 10 Minimum base quality required to consider a base for calling + + --minReadsPerAlignmentStart 5 Minimum number of reads sharing the same alignment start for each genomic location in an active region + + --normal_lod 2.2 LOD threshold for calling normal non-germline + + --pir_mad_threshold 3.0 threshold for clustered read position artifact MAD + + --pir_median_threshold 10.0 threshold for clustered read position artifact median + + --power_constant_qscore 30 Phred scale quality score constant to use in power calculations + + --sample_ploidy 2 Ploidy per sample. For pooled data, set to (Number of samples in each pool * Sample Ploidy). + + --standard_min_confidence_threshold_for_calling 10.0 The minimum phred-scaled confidence threshold at which variants should be called + + --tumor_lod 6.3 LOD threshold for calling tumor variant + + **Advanced Outputs** + + + --bamOutput + + --activeRegionOut + + --activityProfileOut + + --graphOutput + + more information at https://software.broadinstitute.org/gatk/documentation/tooldocs/3.8-0/org_broadinstitute_gatk_tools_walkers_cancer_m2_MuTect2.php + + + 10.1038/nbt.2514 + +