annotate dir_plugins/PolyPhen_SIFT.pm @ 3:49397129aec0 draft

Uploaded
author dvanzessen
date Mon, 15 Jul 2019 05:20:39 -0400
parents e545d0a25ffe
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
1 =head1 LICENSE
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
2
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
3 Copyright [1999-2015] Wellcome Trust Sanger Institute and the EMBL-European Bioinformatics Institute
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
4 Copyright [2016-2018] EMBL-European Bioinformatics Institute
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
5
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
6 Licensed under the Apache License, Version 2.0 (the "License");
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
7 you may not use this file except in compliance with the License.
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
8 You may obtain a copy of the License at
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
9
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
10 http://www.apache.org/licenses/LICENSE-2.0
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
11
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
12 Unless required by applicable law or agreed to in writing, software
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
13 distributed under the License is distributed on an "AS IS" BASIS,
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
14 WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
15 See the License for the specific language governing permissions and
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
16 limitations under the License.
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
17
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
18 =head1 CONTACT
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
19
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
20 Ensembl <http://www.ensembl.org/info/about/contact/index.html>
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
21
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
22 =cut
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
23
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
24 =head1 NAME
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
25
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
26 PolyPhen_SIFT
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
27
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
28 =head1 SYNOPSIS
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
29
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
30 mv PolyPhen_SIFT.pm ~/.vep/Plugins
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
31 ./vep -i variations.vcf -cache --plugin PolyPhen_SIFT
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
32
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
33 =head1 DESCRIPTION
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
34
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
35 A VEP plugin that retrieves PolyPhen and SIFT predictions from a
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
36 locally constructed sqlite database. It can be used when your main
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
37 source of VEP transcript annotation (e.g. a GFF file or GFF-based cache)
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
38 does not contain these predictions.
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
39
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
40 You must either download or create a sqlite database of the predictions.
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
41 You may point to the file by adding db=[file] as a parameter:
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
42
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
43 --plugin PolyPhen_SIFT,db=[file]
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
44
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
45 Human predictions (assembly-independent) are available here:
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
46
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
47 https://dl.dropboxusercontent.com/u/12936195/homo_sapiens.PolyPhen_SIFT.db
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
48
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
49 (Please note the download location of this file may change)
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
50
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
51 Place this file in $HOME/.vep to have the plugin find it automatically.
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
52 You may change this directory by adding dir=[dir] as a parameter:
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
53
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
54 --plugin PolyPhen_SIFT,dir=[dir]
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
55
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
56 To create the database, you must have an active database connection
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
57 (i.e. not using --offline) and add create_db=1 as a parameter:
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
58
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
59 --plugin PolyPhen_SIFT,create_db=1
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
60
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
61 *** NB: this will take some time!!! ***
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
62
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
63 By default the file is created as:
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
64
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
65 ${HOME}/.vep/[species].PolyPhen_SIFT.db
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
66
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
67 =cut
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
68
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
69 package PolyPhen_SIFT;
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
70
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
71 use strict;
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
72 use warnings;
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
73 use DBI;
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
74 use Digest::MD5 qw(md5_hex);
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
75 use Bio::EnsEMBL::Variation::ProteinFunctionPredictionMatrix;
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
76
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
77 use Bio::EnsEMBL::Variation::Utils::BaseVepPlugin;
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
78
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
79 use base qw(Bio::EnsEMBL::Variation::Utils::BaseVepPlugin);
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
80
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
81 sub new {
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
82 my $class = shift;
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
83
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
84 my $self = $class->SUPER::new(@_);
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
85
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
86 my $param_hash = $self->params_to_hash();
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
87
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
88 my $species = $self->config->{species} || 'homo_sapiens';
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
89 my $dir = $param_hash->{dir} || $self->{config}->{dir};
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
90 my $db = $param_hash->{db} || $dir.'/'.$species.'.PolyPhen_SIFT.db';
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
91
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
92 # create DB?
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
93 if($param_hash->{create_db}) {
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
94 die("ERROR: DB file $db already exists - remove and re-run to overwrite\n") if -e $db;
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
95
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
96 $self->{dbh} = DBI->connect("dbi:SQLite:dbname=$db","","");
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
97 $self->{dbh}->do("CREATE TABLE predictions(md5, analysis, matrix)");
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
98
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
99 my $sth = $self->{dbh}->prepare("INSERT INTO predictions VALUES(?, ?, ?)");
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
100
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
101 my $mysql = Bio::EnsEMBL::Registry->get_adaptor($species, 'variation', 'variation')->db->dbc->prepare(qq{
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
102 SELECT m.translation_md5, a.value, p.prediction_matrix
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
103 FROM translation_md5 m, attrib a, protein_function_predictions p
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
104 WHERE m.translation_md5_id = p.translation_md5_id
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
105 AND p.analysis_attrib_id = a.attrib_id
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
106 }, {mysql_use_result => 1});
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
107
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
108 my ($md5, $attrib, $matrix);
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
109 $mysql->execute();
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
110 $mysql->bind_columns(\$md5, \$attrib, \$matrix);
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
111 $sth->execute($md5, $attrib, $matrix) while $mysql->fetch();
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
112 $sth->finish();
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
113 $mysql->finish();
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
114
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
115 $self->{dbh}->do("CREATE INDEX md5_idx ON predictions(md5)");
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
116 }
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
117
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
118 die("ERROR: DB file $db not found - you need to download or create it first, see documentation in plugin file\n") unless -e $db;
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
119
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
120 $self->{initial_pid} = $$;
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
121 $self->{db_file} = $db;
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
122
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
123 $self->{dbh} ||= DBI->connect("dbi:SQLite:dbname=$db","","");
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
124 $self->{get_sth} = $self->{dbh}->prepare("SELECT md5, analysis, matrix FROM predictions WHERE md5 = ?");
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
125
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
126 return $self;
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
127 }
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
128
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
129 sub feature_types {
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
130 return ['Transcript'];
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
131 }
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
132
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
133 sub get_header_info {
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
134 return {
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
135 PolyPhen_humdiv_score => 'PolyPhen humdiv score from PolyPhen_SIFT plugin',
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
136 PolyPhen_humdiv_pred => 'PolyPhen humdiv prediction from PolyPhen_SIFT plugin',
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
137 PolyPhen_humvar_score => 'PolyPhen humvar score from PolyPhen_SIFT plugin',
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
138 PolyPhen_humvar_pred => 'PolyPhen humvar prediction from PolyPhen_SIFT plugin',
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
139 SIFT_score => 'SIFT score from PolyPhen_SIFT plugin',
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
140 SIFT_pred => 'SIFT prediction from PolyPhen_SIFT plugin',
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
141 };
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
142 }
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
143
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
144 sub run {
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
145 my ($self, $tva) = @_;
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
146
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
147 # only for missense variants
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
148 return {} unless grep {$_->SO_term eq 'missense_variant'} @{$tva->get_all_OverlapConsequences};
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
149
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
150 my $tr = $tva->transcript;
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
151 my $tr_vep_cache = $tr->{_variation_effect_feature_cache} ||= {};
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
152
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
153 ## if predictions are not available for both tools in the cache, look in the SQLite database
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
154 unless(exists($tr_vep_cache->{protein_function_predictions}) &&
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
155 $tva->sift_prediction() && $tva->polyphen_prediction()
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
156 ){
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
157
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
158 # get peptide
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
159 unless($tr_vep_cache->{peptide}) {
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
160 my $translation = $tr->translate;
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
161 return {} unless $translation;
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
162 $tr_vep_cache->{peptide} = $translation->seq;
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
163 }
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
164
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
165 # get data, indexed on md5 of peptide sequence
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
166 my $md5 = md5_hex($tr_vep_cache->{peptide});
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
167
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
168 my $data = $self->fetch_from_cache($md5);
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
169
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
170 unless($data) {
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
171
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
172 # forked, reconnect to DB
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
173 if($$ != $self->{initial_pid}) {
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
174 $self->{dbh} = DBI->connect("dbi:SQLite:dbname=".$self->{db_file},"","");
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
175 $self->{get_sth} = $self->{dbh}->prepare("SELECT md5, analysis, matrix FROM predictions WHERE md5 = ?");
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
176
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
177 # set this so only do once per fork
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
178 $self->{initial_pid} = $$;
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
179 }
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
180
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
181 $self->{get_sth}->execute($md5);
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
182
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
183 $data = {};
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
184
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
185 while(my $arrayref = $self->{get_sth}->fetchrow_arrayref) {
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
186 my $analysis = $arrayref->[1];
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
187 my ($super_analysis, $sub_analysis) = split('_', $arrayref->[1]);
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
188
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
189 $data->{$analysis} = Bio::EnsEMBL::Variation::ProteinFunctionPredictionMatrix->new(
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
190 -translation_md5 => $arrayref->[0],
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
191 -analysis => $super_analysis,
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
192 -sub_analysis => $sub_analysis,
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
193 -matrix => $arrayref->[2]
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
194 );
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
195 }
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
196
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
197 $self->add_to_cache($md5, $data);
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
198 }
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
199
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
200 $tr_vep_cache->{protein_function_predictions} = $data;
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
201 }
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
202
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
203 my $return = {};
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
204
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
205 foreach my $tool_string(qw(SIFT PolyPhen_humdiv PolyPhen_humvar)) {
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
206 my ($tool, $analysis) = split('_', $tool_string);
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
207 my $lc_tool = lc($tool);
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
208
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
209 my $pred_meth = $lc_tool.'_prediction';
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
210 my $score_meth = $lc_tool.'_score';
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
211
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
212 my $pred = $tva->$pred_meth($analysis);
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
213
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
214 if($pred) {
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
215 $pred =~ s/\s+/\_/g;
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
216 $pred =~ s/\_\-\_/\_/g;
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
217 $return->{$tool_string.'_pred'} = $pred;
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
218
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
219 my $score = $tva->$score_meth($analysis);
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
220 $return->{$tool_string.'_score'} = $score if defined($score);
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
221 }
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
222 }
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
223
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
224 return $return;
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
225 }
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
226
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
227 sub fetch_from_cache {
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
228 my $self = shift;
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
229 my $md5 = shift;
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
230
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
231 my $cache = $self->{_cache} ||= [];
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
232
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
233 my ($data) = map {$_->{data}} grep {$_->{md5} eq $md5} @$cache;
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
234 return $data;
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
235 }
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
236
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
237 sub add_to_cache {
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
238 my $self = shift;
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
239 my $md5 = shift;
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
240 my $data = shift;
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
241
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
242 my $cache = $self->{_cache} ||= [];
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
243 push @$cache, {md5 => $md5, data => $data};
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
244
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
245 shift @$cache while scalar @$cache > 50;
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
246 }
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
247
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
248 1;
e545d0a25ffe Uploaded
dvanzessen
parents:
diff changeset
249