# HG changeset patch # User bgruening # Date 1385735242 18000 # Node ID 0ad9733e22a43a7889eda29528b0c4bf33333183 # Parent eb394dd65c98852429ff3aa4269b8611aeeb24a1 Uploaded diff -r eb394dd65c98 -r 0ad9733e22a4 lib/galaxy/datatypes/snpeff.pyc Binary file lib/galaxy/datatypes/snpeff.pyc has changed diff -r eb394dd65c98 -r 0ad9733e22a4 snpEff.xml --- a/snpEff.xml Thu Nov 28 08:16:11 2013 -0600 +++ b/snpEff.xml Fri Nov 29 09:27:22 2013 -0500 @@ -1,72 +1,73 @@ Variant effect and annotation - - snpEff - + + + snpEff_macros.xml + -java -Xmx6G -jar \$SNPEFF_JAR_PATH/snpEff.jar eff --c \$SNPEFF_JAR_PATH/snpEff.config --i $inputFormat -o $outputFormat -upDownStreamLen $udLength -#if $spliceSiteSize and $spliceSiteSize.__str__ != '': - -spliceSiteSize $spliceSiteSize -#end if -#if $filterIn and $filterIn.__str__ != 'no_filter': - $filterIn -#end if -#if $filterHomHet and $filterHomHet.__str__ != 'no_filter': - $filterHomHet -#end if -#if $annotations and $annotations.__str__ != '': - #echo " " - #echo ' '.join($annotations.__str__.split(',')) -#end if -#if $filterOut and $filterOut.__str__ != '': - #echo " " - #echo ' '.join($filterOut.__str__.split(',')) -#end if -#if str( $transcripts ) != 'None': - -onlyTr $transcripts -#end if -#if str( $intervals ) != 'None': ### fix this for multiple dataset input - -interval $intervals -#end if -#if $statsFile: - -stats $statsFile -#end if -#if $offset.__str__ != '': - ${offset} -#end if -#if $chr.__str__.strip() != '': - -chr "$chr" -#end if - $noLog -#if $snpDb.genomeSrc == 'cached': - -dataDir ${snpDb.genomeVersion.fields.path} - #if $snpDb.extra_annotations and $snpDb.extra_annotations.__str__ != '': - #echo " " - #echo ' '.join($snpDb.extra_annotations.__str__.split(',')) - #end if - #if $snpDb.regulation and $snpDb.regulation.__str__ != '': - -reg #echo ' -reg '.join($snpDb.regulation.__str__.split(','))# - #end if - $snpDb.genomeVersion -#elif $snpDb.genomeSrc == 'history': - -dataDir ${snpDb.snpeff_db.extra_files_path} - #if $snpDb.extra_annotations and $snpDb.extra_annotations.__str__ != '': - #set annotations = [' '] + $snpDb.extra_annotations.__str__.split(',') - #echo " " - #echo ' -'.join($annotations) - #end if - #if $snpDb.regulation and $snpDb.regulation.__str__ != '': - -reg #echo ' -reg '.join($snpDb.regulation.__str__.split(','))# - #end if - ${snpDb.snpeff_db.metadata.genome_version} -#else - -download - $snpDb.genome_version -#end if -$input > $snpeff_output - + java -Xmx6G -jar \$SNPEFF_JAR_PATH/snpEff.jar eff + -c \$SNPEFF_JAR_PATH/snpEff.config + -i $inputFormat -o $outputFormat -upDownStreamLen $udLength + #if $spliceSiteSize and $spliceSiteSize.__str__ != '': + -spliceSiteSize $spliceSiteSize + #end if + #if $filterIn and $filterIn.__str__ != 'no_filter': + $filterIn + #end if + #if $filterHomHet and $filterHomHet.__str__ != 'no_filter': + $filterHomHet + #end if + #if $annotations and $annotations.__str__ != '': + #echo " " + #echo ' '.join($annotations.__str__.split(',')) + #end if + #if $filterOut and $filterOut.__str__ != '': + #echo " " + #echo ' '.join($filterOut.__str__.split(',')) + #end if + #if str( $transcripts ) != 'None': + -onlyTr $transcripts + #end if + #if str( $intervals ) != 'None': ### fix this for multiple dataset input + -interval $intervals + #end if + #if $statsFile: + -stats $statsFile + #end if + #if $offset.__str__ != '': + ${offset} + #end if + #if $chr.__str__.strip() != '': + -chr "$chr" + #end if + $noLog + #if $snpDb.genomeSrc == 'cached': + -dataDir ${snpDb.genomeVersion.fields.path} + #if $snpDb.extra_annotations and $snpDb.extra_annotations.__str__ != '': + #echo " " + #echo ' '.join($snpDb.extra_annotations.__str__.split(',')) + #end if + #if $snpDb.regulation and $snpDb.regulation.__str__ != '': + -reg #echo ' -reg '.join($snpDb.regulation.__str__.split(','))# + #end if + $snpDb.genomeVersion + #elif $snpDb.genomeSrc == 'history': + -dataDir ${snpDb.snpeff_db.extra_files_path} + #if $snpDb.extra_annotations and $snpDb.extra_annotations.__str__ != '': + #set annotations = [' '] + $snpDb.extra_annotations.__str__.split(',') + #echo " " + #echo ' -'.join($annotations) + #end if + #if $snpDb.regulation and $snpDb.regulation.__str__ != '': + -reg #echo ' -reg '.join($snpDb.regulation.__str__.split(','))# + #end if + ${snpDb.snpeff_db.metadata.genome_version} + #else + -download + $snpDb.genome_version + #end if + $input > $snpeff_output + @@ -85,10 +86,10 @@ - - - - + + + + @@ -142,7 +143,7 @@ - + @@ -170,23 +171,23 @@ - - - - - - - - + + + + + + + + - + - - - - - + + + + + @@ -195,12 +196,11 @@ - - By default SnpEff simplifies all chromosome names. For instance 'chr1' is just '1'. - You can prepend any string you want to the chromosome name." - - ^\S*$ - + + By default SnpEff simplifies all chromosome names. For instance 'chr1' is just '1'. + You can prepend any string you want to the chromosome name. + + ^\S*$ @@ -214,15 +214,11 @@ - generate_stats == True - - - - + @@ -323,13 +319,9 @@ This tool calculate the effect of variants (SNPs/MNPs/Insertions) and deletions. -For details about this tool, please go to http://snpEff.sourceforge.net +@EXTERNAL_DOCUMENTATION@ -SnpEff citation: -"A program for annotating and predicting the effects of single nucleotide polymorphisms, SnpEff: SNPs in the genome of Drosophila melanogaster strain w1118; iso-2; iso-3.", Cingolani P, Platts A, Wang le L, Coon M, Nguyen T, Wang L, Land SJ, Lu X, Ruden DM. Fly (Austin). 2012 Apr-Jun;6(2):80-92. PMID: 22728672 [PubMed - in process] - -SnpSift citation: -"Using Drosophila melanogaster as a model for genotoxic chemical mutational studies with a new program, SnpSift", Cingolani, P., et. al., Frontiers in Genetics, 3, 2012. +@CITATION_SECTION@ diff -r eb394dd65c98 -r 0ad9733e22a4 snpEff_download.xml --- a/snpEff_download.xml Thu Nov 28 08:16:11 2013 -0600 +++ b/snpEff_download.xml Fri Nov 29 09:27:22 2013 -0500 @@ -1,14 +1,15 @@ Download a new database - - snpEff - + + + snpEff_macros.xml + echo $genomeVersion > $snpeff_db; java -jar \$SNPEFF_JAR_PATH/snpEff.jar download -c \$SNPEFF_JAR_PATH/snpEff.config -dataDir $snpeff_db.extra_files_path -v $genomeVersion > $logfile - + @@ -18,18 +19,12 @@ - - - - + -This tool downloads a SnpEff database into the users history for use by snpEff. +@EXTERNAL_DOCUMENTATION@ -For details about this tool, please go to http://snpEff.sourceforge.net - -Please cite: -"A program for annotating and predicting the effects of single nucleotide polymorphisms, SnpEff: SNPs in the genome of Drosophila melanogaster strain w1118; iso-2; iso-3.", Cingolani P, Platts A, Wang le L, Coon M, Nguyen T, Wang L, Land SJ, Lu X, Ruden DM. Fly (Austin). 2012 Apr-Jun;6(2):80-92. PMID: 22728672 [PubMed - in process] +@CITATION_SECTION@ diff -r eb394dd65c98 -r 0ad9733e22a4 snpEff_macros.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/snpEff_macros.xml Fri Nov 29 09:27:22 2013 -0500 @@ -0,0 +1,45 @@ + + + + snpEff + + + + + + + + + + + + + + + + + + + + + + + + +For details about this tool, please go to http://snpeff.sourceforge.net/SnpSift.html#intervals + + + ------ + +**Citation** + +For the underlying tool, please cite the following two publications: + +SnpEff citation: +"A program for annotating and predicting the effects of single nucleotide polymorphisms, SnpEff: SNPs in the genome of Drosophila melanogaster strain w1118; iso-2; iso-3.", Cingolani P, Platts A, Wang le L, Coon M, Nguyen T, Wang L, Land SJ, Lu X, Ruden DM. Fly (Austin). 2012 Apr-Jun;6(2):80-92. PMID: 22728672 [PubMed - in process] + +SnpSift citation: +"Using Drosophila melanogaster as a model for genotoxic chemical mutational studies with a new program, SnpSift", Cingolani, P., et. al., Frontiers in Genetics, 3, 2012. + + + diff -r eb394dd65c98 -r 0ad9733e22a4 snpSift_annotate.xml --- a/snpSift_annotate.xml Thu Nov 28 08:16:11 2013 -0600 +++ b/snpSift_annotate.xml Fri Nov 29 09:27:22 2013 -0500 @@ -1,13 +1,13 @@ - Annotate SNPs from dbSnp - - - snpEff - - + SNPs from dbSnp + + + + snpEff_macros.xml + + java -Xmx6G -jar \$SNPEFF_JAR_PATH/SnpSift.jar $annotate_cmd #if $annotate.id : -id @@ -15,55 +15,49 @@ -info "$annotate.info_ids" #end if -q $dbSnp $input > $output - - - - - - - - - - ^(([a-zA-Z][a-zA-Z0-9_-]*)(,[a-zA-Z][a-zA-Z0-9_-]*)*)?$ - - - - - - Allows unsorted VCF files, but it loads the entire 'database' VCF file into memory (which may not be practical for large 'database' VCF files). - Otherwise, both the database and the input VCF files should be sorted by position (Chromosome sort order can differ between files). - + + + + + + + + + + ^(([a-zA-Z][a-zA-Z0-9_-]*)(,[a-zA-Z][a-zA-Z0-9_-]*)*)?$ - - - - - - - - - - - - - - - - - - - - - - - + + + + + This option will load the entire 'database' VCF file into memory (which may not be practical for large 'database' VCF files). + Otherwise, both the database and the input VCF files should be sorted by position (Chromosome sort order can differ between files). + + + + + + + + + + + + + + + + + + + + + This is typically used to annotate IDs from dbSnp. -For details about this tool, please go to http://snpeff.sourceforge.net/SnpSift.html#annotate - Annotatating only the ID field from dbSnp137.vcf :: Input VCF: @@ -95,13 +89,11 @@ 22 16350245 rs2905295 C A 0.0 FAIL NS=192;RSPOS=16350245;GMAF=0.230804387568556;dbSNPBuildID=101;SSR=1;SAO=0;VP=050000000000000100000140;WGT=0;VC=SNV;GNO -SnpEff citation: -"A program for annotating and predicting the effects of single nucleotide polymorphisms, SnpEff: SNPs in the genome of Drosophila melanogaster strain w1118; iso-2; iso-3.", Cingolani P, Platts A, Wang le L, Coon M, Nguyen T, Wang L, Land SJ, Lu X, Ruden DM. Fly (Austin). 2012 Apr-Jun;6(2):80-92. PMID: 22728672 [PubMed - in process] +@EXTERNAL_DOCUMENTATION@ -SnpSift citation: -"Using Drosophila melanogaster as a model for genotoxic chemical mutational studies with a new program, SnpSift", Cingolani, P., et. al., Frontiers in Genetics, 3, 2012. +@CITATION_SECTION@ - + diff -r eb394dd65c98 -r 0ad9733e22a4 snpSift_caseControl.xml --- a/snpSift_caseControl.xml Thu Nov 28 08:16:11 2013 -0600 +++ b/snpSift_caseControl.xml Fri Nov 29 09:27:22 2013 -0500 @@ -1,13 +1,13 @@ - Count samples are in 'case' and 'control' groups. - - - snpEff - - + Count samples are in 'case' and 'control' groups. + + + + snpEff_macros.xml + + java -Xmx1G -jar \$SNPEFF_JAR_PATH/SnpSift.jar caseControl -q #if $name.__str__.strip() != '': -name $name @@ -18,79 +18,73 @@ -tfam "$ctrl.tfam" #end if $input > $output - - - - - - - - - - - - Case and control are defined by a string containing plus and minus symbols {'+', '-', '0'} where '+' is case, '-' is control and '0' is neutral - - [+-0]+ + + + + + + + - - - - - - - [_a-zA-Z0-9]+ - - - - - - - - - - + + + + Case and control are defined by a string containing plus and minus symbols {'+', '-', '0'} where '+' is case, '-' is control and '0' is neutral + + [+-0]+ + + + + + + + + [_a-zA-Z0-9]+ + + + + + + + + + + + + + + + + + + - - - - - - - - - - - + + + + + + + + + + + - - - - - - - - - - - - - - - - - - - - - - - - - - - - + + + + + + + + + + + + + + **SnpSift CaseControl** @@ -119,15 +113,9 @@ - Case / Control column designation = ""++++------" -For details about this tool, please go to http://snpeff.sourceforge.net/SnpSift.html#casecontrol - -SnpEff citation: -"A program for annotating and predicting the effects of single nucleotide polymorphisms, SnpEff: SNPs in the genome of Drosophila melanogaster strain w1118; iso-2; iso-3.", Cingolani P, Platts A, Wang le L, Coon M, Nguyen T, Wang L, Land SJ, Lu X, Ruden DM. Fly (Austin). 2012 Apr-Jun;6(2):80-92. PMID: 22728672 [PubMed - in process] +@EXTERNAL_DOCUMENTATION@ -SnpSift citation: -"Using Drosophila melanogaster as a model for genotoxic chemical mutational studies with a new program, SnpSift", Cingolani, P., et. al., Frontiers in Genetics, 3, 2012. - - +@CITATION_SECTION@ diff -r eb394dd65c98 -r 0ad9733e22a4 snpSift_filter.xml --- a/snpSift_filter.xml Thu Nov 28 08:16:11 2013 -0600 +++ b/snpSift_filter.xml Fri Nov 29 09:27:22 2013 -0500 @@ -1,9 +1,10 @@ Filter variants using arbitrary expressions - - snpEff - + + + snpEff_macros.xml + java -Xmx6G -jar \$SNPEFF_JAR_PATH/SnpSift.jar filter -f $input -e $exprFile $inverse #if $filtering.mode == 'field': @@ -23,11 +24,11 @@ > $output - - - + + + - + @@ -56,13 +57,8 @@ - - - - - + - @@ -114,9 +110,7 @@ - - **SnpSift filter** @@ -146,14 +140,9 @@ * **isHom( GEN[0] ) & isVariant( GEN[0] ) & isRef( GEN[1] )** -For complete details about this tool and epressions that can be used, please go to http://snpeff.sourceforge.net/SnpSift.html#filter +@EXTERNAL_DOCUMENTATION@ -SnpEff citation: -"A program for annotating and predicting the effects of single nucleotide polymorphisms, SnpEff: SNPs in the genome of Drosophila melanogaster strain w1118; iso-2; iso-3.", Cingolani P, Platts A, Wang le L, Coon M, Nguyen T, Wang L, Land SJ, Lu X, Ruden DM. Fly (Austin). 2012 Apr-Jun;6(2):80-92. PMID: 22728672 [PubMed - in process] - -SnpSift citation: -"Using Drosophila melanogaster as a model for genotoxic chemical mutational studies with a new program, SnpSift", Cingolani, P., et. al., Frontiers in Genetics, 3, 2012. - +@CITATION_SECTION@ diff -r eb394dd65c98 -r 0ad9733e22a4 snpSift_int.xml --- a/snpSift_int.xml Thu Nov 28 08:16:11 2013 -0600 +++ b/snpSift_int.xml Fri Nov 29 09:27:22 2013 -0500 @@ -1,67 +1,56 @@ - Filter variants using intervals - - - snpEff - - - java -Xmx2G -jar \$SNPEFF_JAR_PATH/SnpSift.jar intervals -i $input $exclude $bedFile > $output - - - - - - - - - - - - - - + Filter variants using intervals + + + + snpEff_macros.xml + + + java -Xmx2G -jar \$SNPEFF_JAR_PATH/SnpSift.jar intervals -i $input $exclude $bedFile > $output + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + - - - - - - - - - - - +You can filter using intervals (BED file). + +@EXTERNAL_DOCUMENTATION@ - - - - - - - - - - - - - +@CITATION_SECTION@ - - -You can filter using intervals (BED file) - -For details about this tool, please go to http://snpeff.sourceforge.net/SnpSift.html#intervals - -SnpEff citation: -"A program for annotating and predicting the effects of single nucleotide polymorphisms, SnpEff: SNPs in the genome of Drosophila melanogaster strain w1118; iso-2; iso-3.", Cingolani P, Platts A, Wang le L, Coon M, Nguyen T, Wang L, Land SJ, Lu X, Ruden DM. Fly (Austin). 2012 Apr-Jun;6(2):80-92. PMID: 22728672 [PubMed - in process] - -SnpSift citation: -"Using Drosophila melanogaster as a model for genotoxic chemical mutational studies with a new program, SnpSift", Cingolani, P., et. al., Frontiers in Genetics, 3, 2012. - - +