comparison dir_plugins/plugin_config.txt @ 0:e545d0a25ffe draft

Uploaded
author dvanzessen
date Mon, 15 Jul 2019 05:17:17 -0400
parents
children
comparison
equal deleted inserted replaced
-1:000000000000 0:e545d0a25ffe
1 my $VEP_PLUGIN_CONFIG = {
2 "plugins" => [
3
4 ## PATHOGENICITY PREDICTIONS
5 ############################
6
7 # dbNSFP
8 # https://github.com/ensembl-variation/VEP_plugins/blob/master/dbNSFP.pm
9 # Requires tabix-indexed data file as first param
10 # Field names are listed below and rendered as a multi-selectable autocomplete text field
11 # Human, GRCh38 only (3.x), for GRCh37 use 2.9.x
12 {
13 "key" => "dbNSFP",
14 "label" => "dbNSFP",
15 "available" => 0,
16 "enabled" => 0,
17 "section" => "Pathogenicity predictions",
18 "helptip" => "dbNSFP provides pathogenicity predictions for missense variants from various algorithms",
19 "plugin_url" => "https://raw.githubusercontent.com/Ensembl/VEP_plugins/release/94/dbNSFP.pm",
20 "requires_data" => 1,
21 "requires_install" => 1,
22 "params" => [
23 #"/path/to/dbNSFP3.5a.txt.gz",
24 "@*"
25 ],
26 "species" => [
27 "homo_sapiens"
28 ],
29 "form" => [
30 {
31 "name" => "dbNSFP_fields",
32 "label" => "Fields to include",
33 "helptip" => "Fields to fetch from dbNSFP; hold down the Ctrl (Windows) / Command (Mac) button to select multiple options",
34 "value" => "",
35 'type' => 'dropdown',
36 'multiple' => 1,
37 'style' => 'height:150px',
38 'required' => 1,
39 'notes' => 'Field descriptions in <a rel="external" href="https://drive.google.com/file/d/0B60wROKy6OqcNGJ2STJlMTJONk0/view">dbNSFP README</a>',
40 # "class" => "jquery-multiselect",
41 "values" => [
42 # "chr",
43 # "pos(1-based)",
44 # "ref",
45 # "alt",
46 # "aaref",
47 # "aaalt",
48 # "rs_dbSNP150",
49 # "hg19_chr",
50 # "hg19_pos(1-based)",
51 # "hg18_chr",
52 # "hg18_pos(1-based)",
53 # "genename",
54 # "cds_strand",
55 # "refcodon",
56 # "codonpos",
57 "codon_degeneracy",
58 "Ancestral_allele",
59 "AltaiNeandertal",
60 "Denisova",
61 # "Ensembl_geneid",
62 # "Ensembl_transcriptid",
63 # "Ensembl_proteinid",
64 # "aapos",
65 # "SIFT_score",
66 # "SIFT_converted_rankscore",
67 # "SIFT_pred",
68 # "Uniprot_acc_Polyphen2",
69 # "Uniprot_id_Polyphen2",
70 # "Uniprot_aapos_Polyphen2",
71 # "Polyphen2_HDIV_score",
72 # "Polyphen2_HDIV_rankscore",
73 # "Polyphen2_HDIV_pred",
74 # "Polyphen2_HVAR_score",
75 # "Polyphen2_HVAR_rankscore",
76 # "Polyphen2_HVAR_pred",
77 "LRT_score",
78 "LRT_converted_rankscore",
79 "LRT_pred",
80 "LRT_Omega",
81 "MutationTaster_score",
82 "MutationTaster_converted_rankscore",
83 "MutationTaster_pred",
84 "MutationTaster_model",
85 "MutationTaster_AAE",
86 "MutationAssessor_UniprotID",
87 "MutationAssessor_variant",
88 "MutationAssessor_score",
89 "MutationAssessor_score_rankscore",
90 "MutationAssessor_pred",
91 "FATHMM_score",
92 "FATHMM_converted_rankscore",
93 "FATHMM_pred",
94 "PROVEAN_score",
95 "PROVEAN_converted_rankscore",
96 "PROVEAN_pred",
97 "Transcript_id_VEST3",
98 "Transcript_var_VEST3",
99 "VEST3_score",
100 "VEST3_rankscore",
101 "MetaSVM_score",
102 "MetaSVM_rankscore",
103 "MetaSVM_pred",
104 "MetaLR_score",
105 "MetaLR_rankscore",
106 "MetaLR_pred",
107 "Reliability_index",
108 "M-CAP_score",
109 "M-CAP_rankscore",
110 "M-CAP_pred",
111 "REVEL_score",
112 "REVEL_rankscore",
113 "MutPred_score",
114 "MutPred_rankscore",
115 "MutPred_protID",
116 "MutPred_AAchange",
117 "MutPred_Top5features",
118 "CADD_raw",
119 "CADD_raw_rankscore",
120 "CADD_phred",
121 "DANN_score",
122 "DANN_rankscore",
123 "fathmm-MKL_coding_score",
124 "fathmm-MKL_coding_rankscore",
125 "fathmm-MKL_coding_pred",
126 "fathmm-MKL_coding_group",
127 "Eigen_coding_or_noncoding",
128 "Eigen-raw",
129 "Eigen-phred",
130 "Eigen-PC-raw",
131 "Eigen-PC-phred",
132 "Eigen-PC-raw_rankscore",
133 "GenoCanyon_score",
134 "GenoCanyon_score_rankscore",
135 "integrated_fitCons_score",
136 "integrated_fitCons_score_rankscore",
137 "integrated_confidence_value",
138 "GM12878_fitCons_score",
139 "GM12878_fitCons_score_rankscore",
140 "GM12878_confidence_value",
141 "H1-hESC_fitCons_score",
142 "H1-hESC_fitCons_score_rankscore",
143 "H1-hESC_confidence_value",
144 "HUVEC_fitCons_score",
145 "HUVEC_fitCons_score_rankscore",
146 "HUVEC_confidence_value",
147 "GERP++_NR",
148 "GERP++_RS",
149 "GERP++_RS_rankscore",
150 "phyloP100way_vertebrate",
151 "phyloP100way_vertebrate_rankscore",
152 "phyloP20way_mammalian",
153 "phyloP20way_mammalian_rankscore",
154 "phastCons100way_vertebrate",
155 "phastCons100way_vertebrate_rankscore",
156 "phastCons20way_mammalian",
157 "phastCons20way_mammalian_rankscore",
158 "SiPhy_29way_pi",
159 "SiPhy_29way_logOdds",
160 "SiPhy_29way_logOdds_rankscore",
161 "1000Gp3_AC",
162 "1000Gp3_AF",
163 "1000Gp3_AFR_AC",
164 "1000Gp3_AFR_AF",
165 "1000Gp3_EUR_AC",
166 "1000Gp3_EUR_AF",
167 "1000Gp3_AMR_AC",
168 "1000Gp3_AMR_AF",
169 "1000Gp3_EAS_AC",
170 "1000Gp3_EAS_AF",
171 "1000Gp3_SAS_AC",
172 "1000Gp3_SAS_AF",
173 "TWINSUK_AC",
174 "TWINSUK_AF",
175 "ALSPAC_AC",
176 "ALSPAC_AF",
177 "ESP6500_AA_AC",
178 "ESP6500_AA_AF",
179 "ESP6500_EA_AC",
180 "ESP6500_EA_AF",
181 "ExAC_AC",
182 "ExAC_AF",
183 "ExAC_Adj_AC",
184 "ExAC_Adj_AF",
185 "ExAC_AFR_AC",
186 "ExAC_AFR_AF",
187 "ExAC_AMR_AC",
188 "ExAC_AMR_AF",
189 "ExAC_EAS_AC",
190 "ExAC_EAS_AF",
191 "ExAC_FIN_AC",
192 "ExAC_FIN_AF",
193 "ExAC_NFE_AC",
194 "ExAC_NFE_AF",
195 "ExAC_SAS_AC",
196 "ExAC_SAS_AF",
197 "ExAC_nonTCGA_AC",
198 "ExAC_nonTCGA_AF",
199 "ExAC_nonTCGA_Adj_AC",
200 "ExAC_nonTCGA_Adj_AF",
201 "ExAC_nonTCGA_AFR_AC",
202 "ExAC_nonTCGA_AFR_AF",
203 "ExAC_nonTCGA_AMR_AC",
204 "ExAC_nonTCGA_AMR_AF",
205 "ExAC_nonTCGA_EAS_AC",
206 "ExAC_nonTCGA_EAS_AF",
207 "ExAC_nonTCGA_FIN_AC",
208 "ExAC_nonTCGA_FIN_AF",
209 "ExAC_nonTCGA_NFE_AC",
210 "ExAC_nonTCGA_NFE_AF",
211 "ExAC_nonTCGA_SAS_AC",
212 "ExAC_nonTCGA_SAS_AF",
213 "ExAC_nonpsych_AC",
214 "ExAC_nonpsych_AF",
215 "ExAC_nonpsych_Adj_AC",
216 "ExAC_nonpsych_Adj_AF",
217 "ExAC_nonpsych_AFR_AC",
218 "ExAC_nonpsych_AFR_AF",
219 "ExAC_nonpsych_AMR_AC",
220 "ExAC_nonpsych_AMR_AF",
221 "ExAC_nonpsych_EAS_AC",
222 "ExAC_nonpsych_EAS_AF",
223 "ExAC_nonpsych_FIN_AC",
224 "ExAC_nonpsych_FIN_AF",
225 "ExAC_nonpsych_NFE_AC",
226 "ExAC_nonpsych_NFE_AF",
227 "ExAC_nonpsych_SAS_AC",
228 "ExAC_nonpsych_SAS_AF",
229 "gnomAD_exomes_AC",
230 "gnomAD_exomes_AN",
231 "gnomAD_exomes_AF",
232 "gnomAD_exomes_AFR_AC",
233 "gnomAD_exomes_AFR_AN",
234 "gnomAD_exomes_AFR_AF",
235 "gnomAD_exomes_AMR_AC",
236 "gnomAD_exomes_AMR_AN",
237 "gnomAD_exomes_AMR_AF",
238 "gnomAD_exomes_ASJ_AC",
239 "gnomAD_exomes_ASJ_AN",
240 "gnomAD_exomes_ASJ_AF",
241 "gnomAD_exomes_EAS_AC",
242 "gnomAD_exomes_EAS_AN",
243 "gnomAD_exomes_EAS_AF",
244 "gnomAD_exomes_FIN_AC",
245 "gnomAD_exomes_FIN_AN",
246 "gnomAD_exomes_FIN_AF",
247 "gnomAD_exomes_NFE_AC",
248 "gnomAD_exomes_NFE_AN",
249 "gnomAD_exomes_NFE_AF",
250 "gnomAD_exomes_SAS_AC",
251 "gnomAD_exomes_SAS_AN",
252 "gnomAD_exomes_SAS_AF",
253 "gnomAD_exomes_OTH_AC",
254 "gnomAD_exomes_OTH_AN",
255 "gnomAD_exomes_OTH_AF",
256 "gnomAD_genomes_AC",
257 "gnomAD_genomes_AN",
258 "gnomAD_genomes_AF",
259 "gnomAD_genomes_AFR_AC",
260 "gnomAD_genomes_AFR_AN",
261 "gnomAD_genomes_AFR_AF",
262 "gnomAD_genomes_AMR_AC",
263 "gnomAD_genomes_AMR_AN",
264 "gnomAD_genomes_AMR_AF",
265 "gnomAD_genomes_ASJ_AC",
266 "gnomAD_genomes_ASJ_AN",
267 "gnomAD_genomes_ASJ_AF",
268 "gnomAD_genomes_EAS_AC",
269 "gnomAD_genomes_EAS_AN",
270 "gnomAD_genomes_EAS_AF",
271 "gnomAD_genomes_FIN_AC",
272 "gnomAD_genomes_FIN_AN",
273 "gnomAD_genomes_FIN_AF",
274 "gnomAD_genomes_NFE_AC",
275 "gnomAD_genomes_NFE_AN",
276 "gnomAD_genomes_NFE_AF",
277 "gnomAD_genomes_OTH_AC",
278 "gnomAD_genomes_OTH_AN",
279 "gnomAD_genomes_OTH_AF",
280 "clinvar_rs",
281 "clinvar_clnsig",
282 "clinvar_trait",
283 "clinvar_golden_stars",
284 "Interpro_domain",
285 "GTEx_V6p_gene",
286 "GTEx_V6p_tissue"
287 ],
288 },
289 ]
290 },
291
292 # CADD
293 # https://github.com/ensembl-variation/VEP_plugins/blob/master/CADD.pm
294 # Requires tabix-indexed data file as first param
295 # No other parameters so no form required
296 # data file currently only available for GRCh37
297 {
298 "key" => "CADD",
299 "label" => "CADD",
300 "available" => 0,
301 "enabled" => 0,
302 "section" => "Pathogenicity predictions",
303 "helptip" => "Combined Annotation Dependent Depletion (CADD) is a tool for scoring the deleteriousness of single nucleotide variants and insertion/deletion variants in the human genome. CADD integrates multiple annotations into one metric by contrasting variants that survived natural selection with simulated mutations.",
304 "plugin_url" => "https://raw.githubusercontent.com/Ensembl/VEP_plugins/release/94/CADD.pm",
305 "requires_data" => 1,
306 "species" => [
307 "homo_sapiens"
308 ],
309 "params" => [
310 #"/path/to/whole_genome_SNVs.tsv.gz"
311 ]
312 },
313
314 # FATHMM-MKL
315 # https://github.com/ensembl-variation/VEP_plugins/blob/master/FATHMM_MKL.pm
316 # Requires tabix-indexed data file as first param
317 # No other parameters so no form required
318 # data file currently only available for GRCh37
319 {
320 "key" => "FATHMM_MKL",
321 "label" => "FATHMM-MKL",
322 "available" => 0,
323 "enabled" => 0,
324 "section" => "Pathogenicity predictions",
325 "helptip" => "FATHMM-MKL predicts functional consequences of variants, both coding and non-coding.",
326 "plugin_url" => "https://raw.githubusercontent.com/Ensembl/VEP_plugins/release/94/FATHMM_MKL.pm",
327 "requires_data" => 1,
328 "species" => [
329 "homo_sapiens"
330 ],
331 "params" => [
332 #"/path/to/fathmm-MKL_Current.tab.gz"
333 ]
334 },
335
336 # GWAVA
337 # https://www.sanger.ac.uk/sanger/StatGen_Gwava
338 # Requires tabix-indexed BED data file from ftp://ftp.sanger.ac.uk/pub/resources/software/gwava/v1.0/VEP_plugin/
339 # data file currently only available for GRCh37
340 {
341 "key" => "Gwava",
342 "label" => "GWAVA",
343 "available" => 0,
344 "enabled" => 0,
345 "section" => "Pathogenicity predictions",
346 "helptip" => "Retrieves precomputed Genome Wide Annotation of VAriants (GWAVA) scores for any variant that overlaps a known variant from the Ensembl variation database",
347 "plugin_url" => "ftp://ftp.sanger.ac.uk/pub/resources/software/gwava/v1.0/VEP_plugin/Gwava.pm",
348 "requires_data" => 1,
349 "species" => [
350 "homo_sapiens"
351 ],
352 "params" => [
353 "@*",
354 # "/path/to/gwava_scores.bed.gz"
355 ],
356 "form" => [
357 {
358 "name" => "model",
359 "label" => "Model",
360 "type" => "dropdown",
361 "values" => [
362 { "value" => "region", "caption" => "Region" },
363 { "value" => "tss", "caption" => "TSS" },
364 { "value" => "unmatched", "caption" => "Unmatched" }
365 ],
366 "value" => "region",
367 },
368 ],
369 },
370
371 # Carol
372 # https://github.com/ensembl-variation/VEP_plugins/blob/master/Carol.pm
373 # Requires Math/CDF Perl module
374 {
375 "key" => "Carol",
376 "helptip" => "Calculates the Combined Annotation scoRing toOL (CAROL) score for a missense mutation based on the pre-calculated SIFT and PolyPhen scores",
377 "available" => 0,
378 "enabled" => 0,
379 "section" => "Pathogenicity predictions",
380 "plugin_url" => "https://raw.githubusercontent.com/Ensembl/VEP_plugins/release/94/Carol.pm",
381 "requires_install" => 1,
382 "species" => [
383 "homo_sapiens"
384 ],
385 },
386
387 # Condel
388 # https://github.com/ensembl-variation/VEP_plugins/blob/master/Condel.pm
389 # Requires path to config directory as first param
390 # config directory is checked out as part of VEP_plugins repo, as /[path]/VEP_plugins/config/Condel/config
391 # Within that dir, edit condel_SP.conf so that condel.dir points to /[path]/VEP_plugins/config/Condel
392 {
393 "key" => "Condel",
394 "helptip" => "Calculates the Consensus Deleteriousness (Condel) score for a missense mutation based on the pre-calculated SIFT and PolyPhen scores",
395 "available" => 0,
396 "enabled" => 0,
397 "section" => "Pathogenicity predictions",
398 "plugin_url" => "https://raw.githubusercontent.com/Ensembl/VEP_plugins/release/94/Condel.pm",
399 "requires_install" => 1,
400 "species" => [
401 "homo_sapiens"
402 ],
403 "params" => [
404 # "/path/to/config/Condel/config",
405 "@*"
406 ],
407 "form" => [
408 {
409 "name" => "score_pred",
410 "label" => "Score/prediction",
411 "type" => "dropdown",
412 "values" => [
413 { "value" => "b", "caption" => "Prediction and score" },
414 { "value" => "p", "caption" => "Prediction only" },
415 { "value" => "s", "caption" => "Score only" }
416 ],
417 "value" => "b",
418 },
419 ],
420 },
421
422 # LOFTEE
423 # See https://github.com/konradjk/loftee for details
424 {
425 "key" => "LoF",
426 "helptip" => "LOFTEE identifies LoF (loss-of-function) variation",
427 "available" => 0,
428 "enabled" => 0,
429 "section" => "Pathogenicity predictions",
430 "plugin_url" => "https://raw.githubusercontent.com/konradjk/loftee/master/LoF.pm",
431 "requires_data" => 1,
432 "requires_install" => 1,
433 "params" => [
434 "@*"
435 ]
436 },
437
438 # LoFtool
439 # Requires LoFtool_scores.txt file as first param (available in VEP_plugins GitHub repo)
440 {
441 "key" => "LoFtool",
442 "helptip" => "Provides a per-gene rank of genic intolerance and consequent susceptibility to disease based on the ratio of Loss-of-function (LoF) to synonymous mutations in ExAC data",
443 "available" => 0,
444 "enabled" => 0,
445 "section" => "Pathogenicity predictions",
446 "plugin_url" => "https://raw.githubusercontent.com/Ensembl/VEP_plugins/release/94/LoFtool.pm",
447 "requires_data" => 1,
448 "species" => [
449 "homo_sapiens"
450 ],
451 "params" => [
452 # "/path/to/LoFtool_scores.txt"
453 ]
454 },
455
456 # ExACpLI
457 # Requires ExACpLI_values.txt file as first param (available in VEP_plugins GitHub repo)
458 {
459 "key" => "ExACpLI",
460 "helptip" => "Provides a per-gene probability of being loss-of-function intolerant (pLI) from ExAC data",
461 "available" => 0,
462 "enabled" => 0,
463 "section" => "Pathogenicity predictions",
464 "plugin_url" => "https://raw.githubusercontent.com/Ensembl/VEP_plugins/release/94/ExACpLI.pm",
465 "requires_data" => 1,
466 "species" => [
467 "homo_sapiens"
468 ],
469 "params" => [
470 # "/path/to/ExACpLI_values.txt"
471 ]
472 },
473
474 # MPC
475 # Requires fordist_constraint_official_mpc_values.txt.gz data file
476 {
477 "key" => "MPC",
478 "helptip" => "MPC is a missense deleteriousness metric based on the analysis of genic regions depleted of missense mutations in ExAC",
479 "available" => 0,
480 "enabled" => 0,
481 "section" => "Pathogenicity predictions",
482 "plugin_url" => "https://raw.githubusercontent.com/Ensembl/VEP_plugins/release/94/MPC.pm",
483 "requires_data" => 1,
484 "species" => [
485 "homo_sapiens"
486 ],
487 "params" => [
488 # "/path/to/fordist_constraint_official_mpc_values.txt.gz"
489 ]
490 },
491
492 # MTR
493 # Requires mtrflatfile_1.0.txt.gz data file from ftp://mtr-viewer.mdhs.unimelb.edu.au/pub
494 {
495 "key" => "MTR",
496 "helptip" => "MTR scores quantify the amount of purifying selection acting specifically on missense variants in a given window of protein-coding sequence",
497 "available" => 0,
498 "enabled" => 0,
499 "section" => "Pathogenicity predictions",
500 "plugin_url" => "https://raw.githubusercontent.com/Ensembl/VEP_plugins/release/94/MTR.pm",
501 "requires_data" => 1,
502 "species" => [
503 "homo_sapiens"
504 ],
505 "params" => [
506 # "/path/to/mtrflatfile_1.0.txt.gz"
507 ]
508 },
509
510 # REVEL
511 # Requires data file processed from revel_all_chromosomes.csv.zip
512 {
513 "key" => "REVEL",
514 "helptip" => "An ensemble method for predicting the pathogenicity of rare missense variants",
515 "available" => 0,
516 "enabled" => 0,
517 "section" => "Pathogenicity predictions",
518 "plugin_url" => "https://raw.githubusercontent.com/Ensembl/VEP_plugins/release/94/REVEL.pm",
519 "requires_data" => 1,
520 "species" => [
521 "homo_sapiens"
522 ],
523 "params" => [
524 # "/path/to/revel_all_chromosomes.tsv.gz"
525 ]
526 },
527
528
529
530 ## SPLICING PREDICTIONS
531 #######################
532
533 # dbscSNV
534 {
535 "key" => "dbscSNV",
536 "label" => "dbscSNV",
537 "available" => 0,
538 "enabled" => 0,
539 "section" => "Splicing predictions",
540 "helptip" => "Retrieves data for splicing variants from a tabix-indexed dbscSNV file",
541 "plugin_url" => "https://raw.githubusercontent.com/Ensembl/VEP_plugins/release/94/dbscSNV.pm",
542 "requires_data" => 1,
543 "requires_install" => 1,
544 "params" => [
545 #"/path/to/dbscSNV1.1.txt.gz"
546 ],
547 "species" => [
548 "homo_sapiens"
549 ],
550 },
551
552 # GeneSplicer
553 {
554 "key" => "GeneSplicer",
555 "label" => "GeneSplicer",
556 "helptip" => "Detects splice sites in genomic DNA",
557 "available" => 0,
558 "enabled" => 0,
559 "section" => "Splicing predictions",
560 "plugin_url" => "https://raw.githubusercontent.com/Ensembl/VEP_plugins/release/94/GeneSplicer.pm",
561 "requires_install" => 1,
562 "species" => [
563 "homo_sapiens"
564 ],
565 "params" => [
566 #"/path/to/genesplicer/bin/linux/genesplicer",
567 #"/path/to/genesplicer/human",
568 "@*"
569 ]
570 },
571
572 # MaxEntScan
573 {
574 "key" => "MaxEntScan",
575 "label" => "MaxEntScan",
576 "helptip" => "Sequence motif and maximum entropy based splice site consensus predictions",
577 "available" => 0,
578 "enabled" => 0,
579 "section" => "Splicing predictions",
580 "plugin_url" => "https://raw.githubusercontent.com/Ensembl/VEP_plugins/release/94/MaxEntScan.pm",
581 "requires_install" => 1,
582 "species" => [
583 "homo_sapiens"
584 ],
585 "params" => [
586 #"/path/to/maxentscan"
587 ]
588 },
589
590 # SpliceRegion
591 {
592 "key" => "SpliceRegion",
593 "label" => "SpliceRegion",
594 "helptip" => "More granular predictions of splicing effects",
595 "available" => 0,
596 "enabled" => 0,
597 "section" => "Splicing predictions",
598 "plugin_url" => "https://raw.githubusercontent.com/Ensembl/VEP_plugins/release/94/SpliceRegion.pm",
599 },
600
601
602 ## CONSERVATION
603 ###############
604
605 # Blosum62
606 {
607 "key" => "Blosum62",
608 "label" => "BLOSUM62",
609 "helptip" => "BLOSUM62 amino acid conservation score",
610 "available" => 0,
611 "enabled" => 0,
612 "section" => "Conservation",
613 "plugin_url" => "https://raw.githubusercontent.com/Ensembl/VEP_plugins/release/94/Blosum62.pm",
614 },
615
616 # Conservation
617 # Use the following query to get valid species sets:
618 #
619 # SELECT group_concat(concat("_stt_", gd.name) SEPARATOR ' '), REPLACE(mlss.name, "Gerp Conservation Scores ", ""), sst.value
620 # FROM method_link ml,
621 # method_link_species_set mlss,
622 # genome_db gd, species_set ss, species_set_tag sst
623 # WHERE mlss.method_link_id = ml.method_link_id AND
624 # mlss.species_set_id = ss.species_set_id AND
625 # ss.genome_db_id = gd.genome_db_id AND
626 # ss.species_set_id = sst.species_set_id AND
627 # (ml.class = "ConservationScore.conservation_score")
628 # GROUP BY mlss.species_set_id
629 {
630 "key" => "Conservation",
631 "helptip" => "Retrieves a conservation score from the Ensembl Compara databases for variant positions",
632 "available" => 0,
633 "enabled" => 0,
634 "section" => "Conservation",
635 "plugin_url" => "https://raw.githubusercontent.com/Ensembl/VEP_plugins/release/94/Conservation.pm",
636 "params" => [
637 "@*"
638 ],
639 "form" => [
640 {
641 "name" => "method_link_type",
642 "label" => "Method",
643 "type" => "dropdown",
644 "values" => [
645 { "value" => "GERP_CONSERVATION_SCORE", "caption" => "GERP"}
646 ]
647 },
648 {
649 "name" => "species_set",
650 "label" => "Species set",
651 "type" => "dropdown",
652 "values" => [
653 { "value" => "mammals", "caption" => "39 eutherian mammals" }, #"class" => "_stt_macaca_mulatta _stt_echinops_telfairi _stt_tupaia_belangeri _stt_erinaceus_europaeus _stt_sorex_araneus _stt_microcebus_murinus _stt_pongo_abelii _stt_equus_caballus _stt_ochotona_princeps _stt_cavia_porcellus _stt_choloepus_hoffmanni _stt_procavia_capensis _stt_tursiops_truncatus _stt_tarsius_syrichta _stt_dipodomys_ordii _stt_vicugna_pacos _stt_pteropus_vampyrus _stt_loxodonta_africana _stt_oryctolagus_cuniculus _stt_ailuropoda_melanoleuca _stt_nomascus_leucogenys _stt_callithrix_jacchus _stt_myotis_lucifugus _stt_bos_taurus _stt_gorilla_gorilla _stt_otolemur_garnettii _stt_pan_troglodytes _stt_ictidomys_tridecemlineatus _stt_sus_scrofa _stt_mus_musculus _stt_canis_familiaris _stt_mustela_putorius_furo _stt_felis_catus _stt_ovis_aries _stt_dasypus_novemcinctus _stt_homo_sapiens _stt_papio_anubis _stt_chlorocebus_sabaeus _stt_rattus_norvegicus" },
654 { "value" => "amniotes", "caption" => "23 amniota vertebrates" }, #"class" => "_stt_macaca_mulatta _stt_ornithorhynchus_anatinus _stt_monodelphis_domestica _stt_pongo_abelii _stt_equus_caballus _stt_taeniopygia_guttata _stt_oryctolagus_cuniculus _stt_anolis_carolinensis _stt_meleagris_gallopavo _stt_callithrix_jacchus _stt_bos_taurus _stt_gorilla_gorilla _stt_pan_troglodytes _stt_sus_scrofa _stt_mus_musculus _stt_canis_familiaris _stt_felis_catus _stt_gallus_gallus _stt_ovis_aries _stt_homo_sapiens _stt_papio_anubis _stt_chlorocebus_sabaeus _stt_rattus_norvegicus" },
655 { "value" => "sauropsids", "caption" => "7 sauropsids" }, #"class" => "_stt_taeniopygia_guttata _stt_anolis_carolinensis _stt_meleagris_gallopavo _stt_pelodiscus_sinensis _stt_gallus_gallus _stt_anas_platyrhynchos _stt_ficedula_albicollis" },
656 { "value" => "fish", "caption" => "11 fish" }, #"class" => "_stt_takifugu_rubripes _stt_gasterosteus_aculeatus _stt_oryzias_latipes _stt_tetraodon_nigroviridis _stt_gadus_morhua _stt_oreochromis_niloticus _stt_xiphophorus_maculatus _stt_astyanax_mexicanus _stt_lepisosteus_oculatus _stt_poecilia_formosa _stt_danio_rerio" },
657 ]
658 },
659 ]
660 },
661
662 # AncestralAllele
663 # Requires processed FASTA file from ftp://ftp.ensembl.org/pub/current_fasta/ancestral_alleles/
664 {
665 "key" => "AncestralAllele",
666 "label" => "Ancestral allele",
667 "helptip" => "Retrieves the ancestral allele for variants inferred from the Ensembl Compara Enredo-Pecan-Ortheus (EPO) pipeline",
668 "available" => 0,
669 "enabled" => 0,
670 "section" => "Conservation",
671 "plugin_url" => "https://raw.githubusercontent.com/Ensembl/VEP_plugins/release/94/AncestralAllele.pm",
672 "requires_data" => 1,
673 "species" => [
674 "homo_sapiens"
675 ],
676 "params" => [
677 # "/path/to/homo_sapiens_ancestor_GRCh38_e93.fa.gz"
678 ]
679 },
680
681
682 ## FREQUENCY DATA
683 #################
684
685 # ExAC
686 {
687 "key" => "ExAC",
688 "label" => "ExAC frequencies",
689 "helptip" => "Reports allele frequencies from the Exome Aggregation Consortium",
690 "available" => 0,
691 "enabled" => 0,
692 "plugin_url" => "https://raw.githubusercontent.com/Ensembl/VEP_plugins/release/94/ExAC.pm",
693 "section" => "Frequency data",
694 "requires_data" => 1,
695 "species" => [
696 "homo_sapiens"
697 ],
698 "params" => [
699 # "/path/to/ExAC.r0.3.sites.vep.vcf.gz"
700 ]
701 },
702
703
704 ## OTHER
705 ########
706
707 # CSN
708 {
709 "key" => "CSN",
710 "helptip" => "Reports Clinical Sequencing Nomenclature (CSN) for variants",
711 "available" => 0,
712 "enabled" => 0,
713 "plugin_url" => "https://raw.githubusercontent.com/Ensembl/VEP_plugins/release/94/CSN.pm",
714 },
715
716 # miRNA
717 {
718 "key" => "miRNA",
719 "label" => "miRNA structure",
720 "helptip" => "Determines where in the secondary structure of a miRNA a variant falls",
721 "available" => 0,
722 "enabled" => 0,
723 "plugin_url" => "https://raw.githubusercontent.com/Ensembl/VEP_plugins/release/94/miRNA.pm",
724 },
725
726
727
728 # NearestGene
729 {
730 "key" => "NearestGene",
731 "label" => "Nearest gene",
732 "helptip" => "Finds the nearest gene to non-genic variants",
733 "available" => 0,
734 "enabled" => 0,
735 "plugin_url" => "https://raw.githubusercontent.com/Ensembl/VEP_plugins/release/94/NearestGene.pm",
736 },
737
738 # LD
739 {
740 "key" => "LD",
741 "label" => "Linkage disequilibrium",
742 "helptip" => "Finds variants in linkage disequilibrium with any overlapping existing variants from the Ensembl variation databases",
743 "available" => 0,
744 "enabled" => 0,
745 "plugin_url" => "https://raw.githubusercontent.com/Ensembl/VEP_plugins/release/94/LD.pm",
746 "section" => "Variant data",
747 "params" => [
748 "@*"
749 ],
750 "form" => [
751 {
752 "name" => "population",
753 "label" => "Population",
754 "type" => "dropdown",
755 "values" => [
756 { "value" => "1000GENOMES:phase_3:ACB", "caption" => "African Caribbean in Barbados" },
757 { "value" => "1000GENOMES:phase_3:ASW", "caption" => "African Ancestry in Southwest US" },
758 { "value" => "1000GENOMES:phase_3:BEB", "caption" => "Bengali in Bangladesh" },
759 { "value" => "1000GENOMES:phase_3:CDX", "caption" => "Chinese Dai in Xishuangbanna, China" },
760 { "value" => "1000GENOMES:phase_3:CEU", "caption" => "Utah residents with Northern and Western European ancestry" },
761 { "value" => "1000GENOMES:phase_3:CHB", "caption" => "Han Chinese in Bejing, China" },
762 { "value" => "1000GENOMES:phase_3:CHS", "caption" => "Southern Han Chinese, China" },
763 { "value" => "1000GENOMES:phase_3:CLM", "caption" => "Colombian in Medellin, Colombia" },
764 { "value" => "1000GENOMES:phase_3:ESN", "caption" => "Esan in Nigeria" },
765 { "value" => "1000GENOMES:phase_3:FIN", "caption" => "Finnish in Finland" },
766 { "value" => "1000GENOMES:phase_3:GBR", "caption" => "British in England and Scotland" },
767 { "value" => "1000GENOMES:phase_3:GIH", "caption" => "Gujarati Indian in Houston, TX" },
768 { "value" => "1000GENOMES:phase_3:IBS", "caption" => "Iberian populations in Spain" },
769 { "value" => "1000GENOMES:phase_3:ITU", "caption" => "Indian Telugu in the UK" },
770 { "value" => "1000GENOMES:phase_3:JPT", "caption" => "Japanese in Tokyo, Japan" },
771 { "value" => "1000GENOMES:phase_3:KHV", "caption" => "Kinh in Ho Chi Minh City, Vietnam" },
772 { "value" => "1000GENOMES:phase_3:LWK", "caption" => "Luhya in Webuye, Kenya" },
773 { "value" => "1000GENOMES:phase_3:MAG", "caption" => "Mandinka in The Gambia" },
774 { "value" => "1000GENOMES:phase_3:MSL", "caption" => "Mende in Sierra Leone" },
775 { "value" => "1000GENOMES:phase_3:MXL", "caption" => "Mexican Ancestry in Los Angeles, California" },
776 { "value" => "1000GENOMES:phase_3:PEL", "caption" => "Peruvian in Lima, Peru" },
777 { "value" => "1000GENOMES:phase_3:PJL", "caption" => "Punjabi in Lahore, Pakistan" },
778 { "value" => "1000GENOMES:phase_3:PUR", "caption" => "Puerto Rican in Puerto Rico" },
779 { "value" => "1000GENOMES:phase_3:STU", "caption" => "Sri Lankan Tamil in the UK" },
780 { "value" => "1000GENOMES:phase_3:TSI", "caption" => "Toscani in Italy" },
781 { "value" => "1000GENOMES:phase_3:YRI", "caption" => "Yoruba in Ibadan, Nigeria" },
782 ],
783 "value" => "1000GENOMES:phase_3:CEU",
784 },
785 {
786 "name" => "threshold",
787 "label" => "r2 cutoff",
788 "type" => "string",
789 "value" => 0.8,
790 },
791 ]
792 },
793
794 # SameCodon
795 {
796 "key" => "SameCodon",
797 "label" => "Variants in same codon",
798 "helptip" => "Reports existing variants that fall in the same codon",
799 "available" => 0,
800 "enabled" => 0,
801 "plugin_url" => "https://raw.githubusercontent.com/Ensembl/VEP_plugins/release/94/SameCodon.pm",
802 "section" => "Variant data",
803 },
804 # LOVD
805 {
806 "key" => "LOVD",
807 "label" => "LOVD",
808 "helptip" => "Retrieves LOVD variation data",
809 "available" => 0,
810 "enabled" => 0,
811 "plugin_url" => "https://raw.githubusercontent.com/Ensembl/VEP_plugins/release/94/LOVD.pm",
812 "section" => "Variant data",
813 },
814
815 # GO
816 {
817 "key" => "GO",
818 "label" => "Gene Ontology",
819 "helptip" => "Retrieves Gene Ontology terms associated with transcripts/translations via the Ensembl API",
820 "available" => 0,
821 "enabled" => 0,
822 "plugin_url" => "https://raw.githubusercontent.com/Ensembl/VEP_plugins/release/94/GO.pm",
823 "section" => "Gene data",
824 },
825
826 # Downstream
827 {
828 "key" => "Downstream",
829 "label" => "Downstream",
830 "helptip" => "Predicts the downstream effects of a frameshift variant on the protein sequence of a transcript",
831 "available" => 0,
832 "enabled" => 0,
833 "plugin_url" => "https://raw.githubusercontent.com/Ensembl/VEP_plugins/release/94/Downstream.pm",
834 },
835
836 # ProteinSeqs
837 {
838 "key" => "ProteinSeqs",
839 "label" => "Protein sequences",
840 "helptip" => "Prints out the reference and mutated protein sequences of any proteins found with non-synonymous mutations",
841 "available" => 0,
842 "enabled" => 0,
843 "plugin_url" => "https://raw.githubusercontent.com/Ensembl/VEP_plugins/release/94/ProteinSeqs.pm",
844 },
845
846 # TSSDistance
847 {
848 "key" => "TSSDistance",
849 "label" => "TSS distance",
850 "helptip" => "Calculates the distance from the transcription start site for upstream variants ",
851 "available" => 0,
852 "enabled" => 0,
853 "plugin_url" => "https://raw.githubusercontent.com/Ensembl/VEP_plugins/release/94/TSSDistance.pm",
854 },
855
856 # Phenotypes
857 {
858 "key" => "Phenotypes",
859 "label" => "Phenotypes",
860 "helptip" => "Retrieves overlapping phenotype annotations",
861 "available" => 0,
862 "enabled" => 0,
863 "plugin_url" => "https://raw.githubusercontent.com/Ensembl/VEP_plugins/release/94/Phenotypes.pm",
864 },
865 # Draw
866 {
867 "key" => "Draw",
868 "label" => "Draw",
869 "helptip" => "Creates images of the transcript model showing variant location",
870 "available" => 0,
871 "enabled" => 0,
872 "requires_install" => 1,
873 "plugin_url" => "https://raw.githubusercontent.com/Ensembl/VEP_plugins/release/94/Draw.pm",
874 },
875 # G2P
876 {
877 "key" => "G2P",
878 "label" => "G2P",
879 "helptip" => "Assesses variants using G2P allelic requirements for potential phenotype involvement.",
880 "available" => 0,
881 "enabled" => 0,
882 "requires_data" => 1,
883 "plugin_url" => "https://raw.githubusercontent.com/Ensembl/VEP_plugins/release/94/G2P.pm",
884 },
885
886 # LocalID
887 {
888 "key" => "LocalID",
889 "label" => "LocalID",
890 "helptip" => "Allows you to use variant IDs as VEP input without making a database connection.",
891 "available" => 0,
892 "enabled" => 0,
893 "plugin_url" => "https://raw.githubusercontent.com/Ensembl/VEP_plugins/release/94/LocalID.pm",
894 },
895
896
897 ]
898 };