# HG changeset patch # User mahtabm # Date 1365664542 -36000 # Node ID a5976b2dce6fbef1907b6fdda888010e62b513ac # Parent 1f6dce3d34e06d84b04e117b23f3d067423d8343 changing defualt values for ensembl database diff -r 1f6dce3d34e0 -r a5976b2dce6f variant_effect_predictor/variant_effect_predictor.xml --- a/variant_effect_predictor/variant_effect_predictor.xml Thu Apr 11 02:01:53 2013 -0400 +++ b/variant_effect_predictor/variant_effect_predictor.xml Thu Apr 11 17:15:42 2013 +1000 @@ -1,7 +1,7 @@ to annotate variants using an ENSEMBL database - variant_effect_predictor.pl -i=$input -o=$output -species=$species + variant_effect_predictor.pl -i=$input -o=$output -species=$species --sift b --polyphen b #if $database_options.database_options_selector == "advanced" --host=$database_options.host --user=$database_options.username --port=$database_options.portnum #if $database_options.password @@ -9,103 +9,26 @@ #end if #else ## hardcoded default values - bad? - --host=www.ebi.edu.au --user=anonymous --port=3306 - #end if - #if $parameters.everything - --everything - #else - #if $parameters.sift_options.sift - --sift $parameters.sift_options.sift_value.value - #end if - #if $parameters.polyphen_options.polyphen - --polyphen $parameters.polyphen_options.polyphen_value.value - #end if - #if $parameters.ccds - --ccds - #end if - #if $parameters.hgvs - --hgvs - #end if - #if $parameters.hgnc - --hgnc - #end if - #if $parameters.numbers - --numbers - #end if - #if $parameters.domains - --domains - #end if - #if $parameters.regulatory - --regulatory - #end if - #if $parameters.canonical - --canonical - #end if - #if $parameters.protein - --protein - #end if - #if $parameters.gmaf - --gmaf - #end if + --host=ensembldb.ensembl.org --user=anonymous --port=5306 #end if - + - + - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - + + + + + + + + + + @@ -114,64 +37,7 @@ -============ -Description -============ This tool connects to the ENSEMBL database using ENSEMBL's Variant Effect Predictor script and retrieves annotations for an input variants file. - -============ -Parameters -============ -everything - Shortcut flag to switch on all of the following: - ``sift b - polyphen b - ccds - hgvs - hgnc - numbers - domains - regulatory - cell_type - canonical - protein - gmaf`` - -sift [both|score|prediction term] - **Human only** SIFT predicts whether an amino acid substitution affects protein function based on sequence homology and the physical properties of amino acids. The VEP can output the prediction term, score or both. *Not used by default* - -polyphen [both|score|prediction term] - **Human only** PolyPhen is a tool which predicts possible impact of an amino acid substitution on the structure and function of a human protein using straightforward physical and comparative considerations. The VEP can output the prediction term, score or both. *Not used by default* - -ccds - Adds the CCDS transcript identifier (where available) to the output. *Not used by default* - -hgvs - Add HGVS nomenclature based on Ensembl stable identifiers to the output. Both coding and protein sequence names are added where appropriate. Currently it is not possible to generate HGVS identifiers from the cache; a database connection must be made. *Not used by default* - -hgnc - Adds the HGNC gene identifer (where available) to the output. *Not used by default* - -numbers - Adds affected exon and intron numbering to to output. Format is Number/Total. *Not used by default* - -domains - Adds names of overlapping protein domains to output. *Not used by default* - -regulatory - Look for overlaps with regulatory regions. The script can also call if a variant falls in a high information position within a transcription factor binding site. Output lines have a Feature type of RegulatoryFeature or MotifFeature. *Not used by default* - -cell_type - Report only regulatory regions that are found in the given cell type(s). Can be a single cell type or a comma-separated list. The functional type in each cell type is reported under CELL_TYPE in the output. To retrieve a list of cell types, use ``--cell_type list``. *Not used by default* - -canonical - Adds a flag indicating if the transcript is the canonical transcript for the gene. *Not used by default* - -protein - Add the Ensembl protein identifier to the output where appropriate. *Not used by default* - -gmaf - Add the global minor allele frequency (MAF) from 1000 Genomes Phase 1 data for any existing variant to the output. *Not used by default*