annotate variant_effect_predictor/Bio/EnsEMBL/Variation/BaseTranscriptVariation.pm @ 1:d6778b5d8382 draft default tip

Deleted selected files
author willmclaren
date Fri, 03 Aug 2012 10:05:43 -0400
parents 21066c0abaf5
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
1 =head1 LICENSE
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
2
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
3 Copyright (c) 1999-2012 The European Bioinformatics Institute and
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
4 Genome Research Limited. All rights reserved.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
5
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
6 This software is distributed under a modified Apache license.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
7 For license details, please see
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
8
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
9 http://www.ensembl.org/info/about/code_licence.html
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
10
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
11 =head1 CONTACT
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
12
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
13 Please email comments or questions to the public Ensembl
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
14 developers list at <dev@ensembl.org>.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
15
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
16 Questions may also be sent to the Ensembl help desk at
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
17 <helpdesk@ensembl.org>.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
18
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
19 =cut
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
20
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
21 =head1 NAME
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
22
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
23 Bio::EnsEMBL::Variation::BaseTranscriptVariation
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
24
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
25 =head1 SYNOPSIS
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
26
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
27 use Bio::EnsEMBL::Variation::BaseTranscriptVariation;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
28
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
29 =head1 DESCRIPTION
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
30
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
31 A helper class for representing an overlap of a Transcript and a
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
32 Variation (either sequence or structural). Should not be invoked directly.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
33
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
34 =cut
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
35
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
36 package Bio::EnsEMBL::Variation::BaseTranscriptVariation;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
37
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
38 use strict;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
39 use warnings;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
40
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
41 use Digest::MD5 qw(md5_hex);
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
42
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
43 use Bio::EnsEMBL::Utils::Scalar qw(assert_ref check_ref);
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
44 use Bio::EnsEMBL::Variation::Utils::VariationEffect qw(overlap within_cds);
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
45
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
46 use base qw(Bio::EnsEMBL::Variation::VariationFeatureOverlap);
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
47
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
48 =head2 transcript_stable_id
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
49
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
50 Description: Returns the stable_id of the associated Transcript
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
51 Returntype : string
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
52 Exceptions : none
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
53 Status : At Risk
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
54
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
55 =cut
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
56
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
# Accessor for the stable id of the associated transcript.
# All work is delegated to the superclass's _feature_stable_id method; any
# extra arguments are forwarded unchanged and its return value is returned.
sub transcript_stable_id {
    my ($self, @args) = @_;

    return $self->SUPER::_feature_stable_id(@args);
}
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
61
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
62 =head2 transcript
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
63
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
64 Arg [1] : (optional) Bio::EnsEMBL::Transcript
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
65 Description: Get/set the associated Transcript
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
66 Returntype : Bio::EnsEMBL::Transcript
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
67 Exceptions : throws if argument is wrong type
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
68 Status : At Risk
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
69
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
70 =cut
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
71
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
# Get/set the associated Transcript.
# A true argument is first checked with assert_ref against
# 'Bio::EnsEMBL::Transcript'; storage and retrieval are delegated to the
# superclass feature() method, which is also told the feature type
# ('Transcript').
sub transcript {
    my $self       = shift;
    my $transcript = shift;

    if ($transcript) {
        assert_ref($transcript, 'Bio::EnsEMBL::Transcript');
    }

    return $self->SUPER::feature($transcript, 'Transcript');
}
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
77
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
78 =head2 feature
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
79
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
80 Arg [1] : (optional) Bio::EnsEMBL::Transcript
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
81 Description: Get/set the associated Transcript (overriding the superclass feature method)
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
82 Returntype : Bio::EnsEMBL::Transcript
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
83 Exceptions : throws if argument is wrong type
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
84 Status : At Risk
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
85
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
86 =cut
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
87
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
# Override of the superclass feature() accessor: every call is routed through
# transcript(), so the argument handling done there applies here as well.
sub feature {
    my ($self, @args) = @_;

    return $self->transcript(@args);
}
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
92
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
93 =head2 cdna_start
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
94
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
95 Arg [1] : (optional) int $start
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
96 Example : $cdna_start = $tv->cdna_start;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
97 Description: Getter/Setter for the start position of this variation on the
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
98 transcript in cDNA coordinates.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
99 Returntype : int
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
100 Exceptions : None
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
101 Caller : general
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
102 Status : Stable
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
103
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
104 =cut
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
105
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
# Getter/setter for the start of the variation in cDNA coordinates.
#
# A defined argument is stored as the new start. When no start is cached, the
# value is derived from the first element of cdna_coords: undef if that
# element is a Bio::EnsEMBL::Mapper::Gap, otherwise its start. The matching
# end is derived from the last element in the same pass, but only when no end
# is cached yet, so a value supplied through the cdna_end setter is never
# silently overwritten by this lazy computation.
#
# Returns the cached start (may be undef).
sub cdna_start {
    my ($self, $cdna_start) = @_;

    $self->{cdna_start} = $cdna_start if defined $cdna_start;

    unless (exists $self->{cdna_start}) {
        my $cdna_coords = $self->cdna_coords;

        my ($first, $last) = ($cdna_coords->[0], $cdna_coords->[-1]);

        $self->{cdna_start} = $first->isa('Bio::EnsEMBL::Mapper::Gap') ? undef : $first->start;

        # Keep an end that is already cached (e.g. set explicitly by the caller).
        unless (exists $self->{cdna_end}) {
            $self->{cdna_end} = $last->isa('Bio::EnsEMBL::Mapper::Gap') ? undef : $last->end;
        }
    }

    return $self->{cdna_start};
}
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
122
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
123 =head2 cdna_end
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
124
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
125 Arg [1] : (optional) int $end
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
126 Example : $cdna_end = $tv->cdna_end;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
127 Description: Getter/Setter for the end position of this variation on the
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
128 transcript in cDNA coordinates.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
129 Returntype : int
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
130 Exceptions : None
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
131 Caller : general
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
132 Status : Stable
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
133
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
134 =cut
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
135
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
# Getter/setter for the end of the variation in cDNA coordinates.
#
# A defined argument is stored as the new end. When no end is cached,
# cdna_start is called first because it computes start and end together. That
# call does nothing if a start is already cached (for example one set
# explicitly by the caller), which previously left the end undefined forever;
# in that case the end is now derived here from the last element of
# cdna_coords: undef for a Bio::EnsEMBL::Mapper::Gap, otherwise its end.
#
# Returns the cached end (may be undef).
sub cdna_end {
    my ($self, $cdna_end) = @_;

    $self->{cdna_end} = $cdna_end if defined $cdna_end;

    unless (exists $self->{cdna_end}) {
        # call cdna_start to calculate the start and end
        $self->cdna_start;

        # Fallback: cdna_start skipped the calculation because a start was
        # already cached, so work out the end on its own.
        unless (exists $self->{cdna_end}) {
            my $last = $self->cdna_coords->[-1];
            $self->{cdna_end} = $last->isa('Bio::EnsEMBL::Mapper::Gap') ? undef : $last->end;
        }
    }

    return $self->{cdna_end};
}
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
146
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
147 =head2 cds_start
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
148
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
149 Arg [1] : (optional) int $start
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
150 Example : $cds_start = $tv->cds_start;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
151 Description: Getter/Setter for the start position of this variation on the
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
152 transcript in CDS coordinates.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
153 Returntype : int
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
154 Exceptions : None
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
155 Caller : general
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
156 Status : Stable
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
157
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
158 =cut
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
159
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
# Getter/setter for the start of the variation in CDS coordinates.
#
# A defined argument is stored as the new start. When no start is cached, it
# is derived from the first element of cds_coords: undef if that element is a
# Bio::EnsEMBL::Mapper::Gap, otherwise its start plus the phase of the
# transcript's start exon when that phase is positive. The end is derived from
# the last element in the same way, but only when no end is cached yet, so a
# value supplied through the cds_end setter is not overwritten.
#
# Returns the cached start (may be undef).
sub cds_start {
    my ($self, $cds_start) = @_;

    $self->{cds_start} = $cds_start if defined $cds_start;

    unless (exists $self->{cds_start}) {
        my $cds_coords = $self->cds_coords;

        my ($first, $last) = ($cds_coords->[0], $cds_coords->[-1]);
        my $exon_phase = $self->transcript->start_Exon->phase;

        # Only a positive start-exon phase shifts the coordinates.
        my $offset = $exon_phase > 0 ? $exon_phase : 0;

        $self->{cds_start} = $first->isa('Bio::EnsEMBL::Mapper::Gap') ? undef : $first->start + $offset;

        # Keep an end that is already cached (e.g. set explicitly by the caller).
        unless (exists $self->{cds_end}) {
            $self->{cds_end} = $last->isa('Bio::EnsEMBL::Mapper::Gap') ? undef : $last->end + $offset;
        }
    }

    return $self->{cds_start};
}
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
177
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
178 =head2 cds_end
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
179
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
180 Arg [1] : (optional) int $end
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
181 Example : $cds_end = $tv->cds_end;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
182 Description: Getter/Setter for the end position of this variation on the
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
183 transcript in CDS coordinates.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
184 Returntype : int
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
185 Exceptions : None
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
186 Caller : general
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
187 Status : Stable
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
188
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
189 =cut
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
190
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
# Getter/setter for the end of the variation in CDS coordinates.
#
# A defined argument is stored as the new end. When no end is cached,
# cds_start is called first because it computes start and end together. That
# call does nothing if a start is already cached (for example one set
# explicitly), which previously left the end undefined; in that case the end
# is derived here from the last element of cds_coords: undef for a
# Bio::EnsEMBL::Mapper::Gap, otherwise its end plus the start exon's phase
# when that phase is positive (the same adjustment cds_start applies).
#
# Returns the cached end (may be undef).
sub cds_end {
    my ($self, $cds_end) = @_;

    $self->{cds_end} = $cds_end if defined $cds_end;

    unless (exists $self->{cds_end}) {
        # call cds_start to calculate the start and end
        $self->cds_start;

        # Fallback: cds_start skipped the calculation because a start was
        # already cached, so work out the end on its own.
        unless (exists $self->{cds_end}) {
            my $last       = $self->cds_coords->[-1];
            my $exon_phase = $self->transcript->start_Exon->phase;

            $self->{cds_end} = $last->isa('Bio::EnsEMBL::Mapper::Gap')
                ? undef
                : $last->end + ($exon_phase > 0 ? $exon_phase : 0);
        }
    }

    return $self->{cds_end};
}
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
201
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
202 =head2 translation_start
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
203
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
204 Arg [1] : (optional) int $start
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
205 Example : $translation_start = $tv->translation_start;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
206 Description: Getter/Setter for the start position of this variation on the
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
207 transcript in peptide coordinates.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
208 Returntype : int
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
209 Exceptions : None
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
210 Caller : general
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
211 Status : Stable
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
212
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
213 =cut
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
214
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
# Getter/setter for the start of the variation in peptide coordinates.
#
# A defined argument is stored as the new start. When no start is cached, it
# is derived from the first element of translation_coords: undef if that
# element is a Bio::EnsEMBL::Mapper::Gap, otherwise its start. The end is
# derived from the last element in the same pass, but only when no end is
# cached yet, so a value supplied through the translation_end setter is not
# overwritten.
#
# Returns the cached start (may be undef).
sub translation_start {
    my ($self, $translation_start) = @_;

    $self->{translation_start} = $translation_start if defined $translation_start;

    unless (exists $self->{translation_start}) {
        my $translation_coords = $self->translation_coords;

        my ($first, $last) = ($translation_coords->[0], $translation_coords->[-1]);

        $self->{translation_start} = $first->isa('Bio::EnsEMBL::Mapper::Gap') ? undef : $first->start;

        # Keep an end that is already cached (e.g. set explicitly by the caller).
        unless (exists $self->{translation_end}) {
            $self->{translation_end} = $last->isa('Bio::EnsEMBL::Mapper::Gap') ? undef : $last->end;
        }
    }

    return $self->{translation_start};
}
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
231
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
232
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
233 =head2 translation_end
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
234
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
235 Arg [1] : (optional) int $end
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
236 Example : $translation_end = $tv->translation_end;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
237 Description: Getter/Setter for the end position of this variation on the
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
238 transcript in peptide coordinates.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
239 Returntype : int
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
240 Exceptions : None
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
241 Caller : general
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
242 Status : Stable
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
243
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
244 =cut
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
245
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
# Getter/setter for the end of the variation in peptide coordinates.
#
# A defined argument is stored as the new end. When no end is cached,
# translation_start is called first because it computes start and end
# together. That call does nothing if a start is already cached (for example
# one set explicitly), which previously left the end undefined; in that case
# the end is derived here from the last element of translation_coords: undef
# for a Bio::EnsEMBL::Mapper::Gap, otherwise its end.
#
# Returns the cached end (may be undef).
sub translation_end {
    my ($self, $translation_end) = @_;

    $self->{translation_end} = $translation_end if defined $translation_end;

    unless (exists $self->{translation_end}) {
        # call translation_start to calculate the start and end
        $self->translation_start;

        # Fallback: translation_start skipped the calculation because a start
        # was already cached, so work out the end on its own.
        unless (exists $self->{translation_end}) {
            my $last = $self->translation_coords->[-1];
            $self->{translation_end} = $last->isa('Bio::EnsEMBL::Mapper::Gap') ? undef : $last->end;
        }
    }

    return $self->{translation_end};
}
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
256
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
257 =head2 cdna_coords
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
258
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
259 Description: Use the TranscriptMapper to calculate the cDNA
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
260 coordinates of this variation
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
261 Returntype : listref of Bio::EnsEMBL::Mapper::Coordinate and Bio::EnsEMBL::Mapper::Gap objects
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
262 Exceptions : None
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
263 Caller : general
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
264 Status : Stable
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
265
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
266 =cut
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
267
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
# Lazily computes and caches the cDNA coordinates of the variation.
# On the first call the variation feature's start/end and the transcript's
# strand are passed to the mapper's genomic2cdna method and the resulting
# list is stored as an array reference under _cdna_coords; later calls return
# that cached reference.
sub cdna_coords {
    my ($self) = @_;

    return $self->{_cdna_coords} if $self->{_cdna_coords};

    my $variation_feature = $self->base_variation_feature;
    my $transcript        = $self->transcript;

    my @mapped = $self->_mapper->genomic2cdna(
        $variation_feature->start,
        $variation_feature->end,
        $transcript->strand,
    );

    $self->{_cdna_coords} = \@mapped;

    return $self->{_cdna_coords};
}
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
279
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
280 =head2 cds_coords
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
281
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
282 Description: Use the TranscriptMapper to calculate the CDS
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
283 coordinates of this variation
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
284 Returntype : listref of Bio::EnsEMBL::Mapper::Coordinate and Bio::EnsEMBL::Mapper::Gap objects
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
285 Exceptions : None
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
286 Caller : general
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
287 Status : Stable
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
288
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
289 =cut
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
290
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
# Lazily computes and caches the CDS coordinates of the variation.
# On the first call the variation feature's start/end and the transcript's
# strand are passed to the mapper's genomic2cds method and the resulting list
# is stored as an array reference under _cds_coords; later calls return that
# cached reference.
sub cds_coords {
    my ($self) = @_;

    return $self->{_cds_coords} if $self->{_cds_coords};

    my $variation_feature = $self->base_variation_feature;
    my $transcript        = $self->transcript;

    my @mapped = $self->_mapper->genomic2cds(
        $variation_feature->start,
        $variation_feature->end,
        $transcript->strand,
    );

    $self->{_cds_coords} = \@mapped;

    return $self->{_cds_coords};
}
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
302
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
303 =head2 translation_coords
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
304
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
305 Description: Use the TranscriptMapper to calculate the peptide
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
306 coordinates of this variation
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
307 Returntype : listref of Bio::EnsEMBL::Mapper::Coordinate and Bio::EnsEMBL::Mapper::Gap objects
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
308 Exceptions : None
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
309 Caller : general
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
310 Status : Stable
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
311
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
312 =cut
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
313
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
# Lazily computes and caches the peptide coordinates of the variation.
# On the first call the variation feature's start/end and the transcript's
# strand are passed to the mapper's genomic2pep method and the resulting list
# is stored as an array reference under _translation_coords; later calls
# return that cached reference.
sub translation_coords {
    my ($self) = @_;

    return $self->{_translation_coords} if $self->{_translation_coords};

    my $variation_feature = $self->base_variation_feature;
    my $transcript        = $self->transcript;

    my @mapped = $self->_mapper->genomic2pep(
        $variation_feature->start,
        $variation_feature->end,
        $transcript->strand,
    );

    $self->{_translation_coords} = \@mapped;

    return $self->{_translation_coords};
}
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
325
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
326
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
327 =head2 distance_to_transcript
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
328
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
329 Arg [1] : (optional) int $distance
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
330 Example : $distance = $tv->distance_to_transcript;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
331 Description: Getter/Setter for the distance of this variant to the transcript.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
332 This is the shortest distance between variant start/end and
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
333 transcript start/end, so if a variant falls 5' of a transcript
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
334 on the forward strand this distance will be that between the
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
335 variant end and the transcript start; if it falls 3' it will be
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
336 the distance between the variant start and the transcript end.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
337 Returntype : int
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
338 Exceptions : None
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
339 Caller : general
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
340 Status : Stable
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
341
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
342 =cut
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
343
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
# Getter/setter for the distance between the variant and the transcript.
# A defined argument is stored as the distance. Otherwise, on first use, the
# distance is the smallest absolute difference between either end of the
# variation feature (start, end) and either end of the transcript (start,
# end); the result is cached under distance_to_transcript.
sub distance_to_transcript {
    my ($self, $distance) = @_;

    if (defined $distance) {
        $self->{distance_to_transcript} = $distance;
    }

    if (!exists $self->{distance_to_transcript}) {
        my $vf = $self->base_variation_feature;
        my $tr = $self->transcript;

        my @vf_ends = ($vf->start, $vf->end);
        my @tr_ends = ($tr->start, $tr->end);

        # Track the smallest of the four end-to-end separations.
        my $shortest;
        for my $vf_pos (@vf_ends) {
            for my $tr_pos (@tr_ends) {
                my $gap = abs($vf_pos - $tr_pos);
                $shortest = $gap if !defined $shortest || $gap < $shortest;
            }
        }

        $self->{distance_to_transcript} = $shortest;
    }

    return $self->{distance_to_transcript};
}
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
368
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
369 =head2 get_overlapping_ProteinFeatures
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
370
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
371 Description: Find any ProteinFeatures (e.g. pfam or interpro domains etc.) that
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
372 the associated variation feature lies in
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
373 Returntype : listref of Bio::EnsEMBL::ProteinFeatures (possibly empty)
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
374 Exceptions : None
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
375 Caller : general
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
376 Status : At Risk
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
377
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
378 =cut
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
379
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
sub get_overlapping_ProteinFeatures {
    my ($self) = @_;

    # The list is built once per object and then served from
    # $self->{_protein_features}; an empty list is cached as well.
    return $self->{_protein_features} if exists $self->{_protein_features};

    my $overlapping = $self->{_protein_features} = [];

    # without a translation there are no protein features to report
    my $translation = $self->transcript->translation;
    return $overlapping unless defined $translation;

    # both peptide coordinates of the variant are needed for the comparison
    my $pep_start = $self->translation_start;
    my $pep_end   = $self->translation_end;
    return $overlapping unless defined($pep_start) && defined($pep_end);

    # keep every protein feature whose range overlaps the variant's
    # peptide coordinates
    push @$overlapping,
        grep { overlap($_->start, $_->end, $pep_start, $pep_end) }
        @{ $translation->get_all_ProteinFeatures };

    return $overlapping;
}
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
406
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
407 =head2 exon_number
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
408
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
409 Description: Identify which exon(s) this variant falls in
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
410 Returntype : '/'-separated string containing the exon number(s) and the total
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
411 number of exons in this transcript, or undef if this variant
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
412 does not fall in any exons
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
413 Exceptions : None
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
414 Caller : general
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
415 Status : At Risk
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
416
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
417 =cut
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
418
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
sub exon_number {
    my ($self) = @_;

    # _exon_intron_number always creates the exon_number key (possibly with
    # an undef value), so the exon scan runs at most once per object.
    if (!exists $self->{exon_number}) {
        $self->_exon_intron_number;
    }

    return $self->{exon_number};
}
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
424
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
425 =head2 intron_number
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
426
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
427 Description: Identify which intron(s) this variant falls in
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
428 Returntype : '/'-separated string containing the intron number(s) and the total
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
429 number of introns in this transcript, or undef if this variant
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
430 does not fall in any introns
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
431 Exceptions : None
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
432 Caller : general
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
433 Status : At Risk
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
434
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
435 =cut
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
436
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
sub intron_number {
    my ($self) = @_;

    # _exon_intron_number always creates the intron_number key (possibly with
    # an undef value), so the scan runs at most once per object.
    if (!exists $self->{intron_number}) {
        $self->_exon_intron_number;
    }

    return $self->{intron_number};
}
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
442
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
sub _exon_intron_number {
    my ($self) = @_;

    # Work out which exon(s) and intron(s) this variant overlaps and store
    # the results in $self->{exon_number} and $self->{intron_number}.
    #
    # Both keys are created up front (as undef) so that, even when the
    # variant overlaps neither an exon nor an intron, the public accessors
    # only ever trigger this scan once.
    $self->{exon_number}   = undef;
    $self->{intron_number} = undef;

    my $vf = $self->base_variation_feature;

    my $var_start = $vf->start;
    my $var_end   = $vf->end;

    my $strand = $self->transcript->strand;

    my $exons   = $self->_exons;
    my $n_exons = scalar @$exons;

    my (@exon_hits, @intron_hits);

    for my $idx (0 .. $#$exons) {

        my $exon   = $exons->[$idx];
        my $number = $idx + 1;          # exons are numbered from 1

        push @exon_hits, $number
            if overlap($var_start, $var_end, $exon->start, $exon->end);

        # every exon after the first closes the intron that precedes it;
        # that intron carries the number of the previous exon, i.e. $idx
        next if $idx == 0;

        my $prev = $exons->[$idx - 1];

        my ($intron_start, $intron_end);

        if ($strand == 1) {
            $intron_start = $prev->end + 1;
            $intron_end   = $exon->start - 1;
        }
        else {
            # on the other strand the previous exon has the higher coordinates
            $intron_start = $exon->end + 1;
            $intron_end   = $prev->start - 1;
        }

        push @intron_hits, $idx
            if overlap($var_start, $var_end, $intron_start, $intron_end);
    }

    # format is "N/total" for a single hit or "first-last/total" for several
    if (@exon_hits) {
        my $span = @exon_hits > 1
            ? join('-', $exon_hits[0], $exon_hits[-1])
            : $exon_hits[0];

        $self->{exon_number} = $span . '/' . $n_exons;
    }

    # a transcript with N exons has N - 1 introns
    if (@intron_hits) {
        my $span = @intron_hits > 1
            ? join('-', $intron_hits[0], $intron_hits[-1])
            : $intron_hits[0];

        $self->{intron_number} = $span . '/' . ($n_exons - 1);
    }
}
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
499
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
sub _intron_effects {
    my ($self) = @_;

    # Internal method used by Bio::EnsEMBL::Variation::Utils::VariationEffect
    # when calculating various consequence types.
    #
    # Returns a hashref in which a key is set to 1 for every effect found
    # across all introns of the transcript: within_frameshift_intron,
    # start_splice_site, end_splice_site, intronic, splice_region.
    #
    # This method is a major bottleneck in the effect calculation code, so
    # the result is cached on the object and local variables are used instead
    # of method calls where possible to speed things up - caveat bug-fixer!

    return $self->{_intron_effects} if $self->{_intron_effects};

    my $vf = $self->base_variation_feature;

    my $intron_effects = {};

    my $vf_start = $vf->start;
    my $vf_end   = $vf->end;

    # insertions are recognised by a start coordinate one past the end
    my $insertion = $vf_start == $vf_end+1;

    for my $intron (@{ $self->_introns }) {

        my $intron_start = $intron->start;
        my $intron_end   = $intron->end;

        # under various circumstances the genebuild process can introduce
        # artificial short (<= 12 nucleotide) introns into transcripts
        # (e.g. to deal with errors in the reference sequence etc.), we
        # don't want to categorise variations that fall in these introns
        # as intronic, or as any kind of splice variant
        #
        # NOTE(review): with inclusive coordinates, end - start <= 12 also
        # admits 13-base introns - confirm which limit is intended

        my $frameshift_intron = ( abs($intron_end - $intron_start) <= 12 );

        if ($frameshift_intron) {
            if (overlap($vf_start, $vf_end, $intron_start, $intron_end)) {
                $intron_effects->{within_frameshift_intron} = 1;
                next;
            }
        }

        # the first two bases of the intron
        if (overlap($vf_start, $vf_end, $intron_start, $intron_start+1)) {
            $intron_effects->{start_splice_site} = 1;
        }

        # the last two bases of the intron
        if (overlap($vf_start, $vf_end, $intron_end-1, $intron_end)) {
            $intron_effects->{end_splice_site} = 1;
        }

        # we need to special case insertions between the donor and acceptor sites

        if (overlap($vf_start, $vf_end, $intron_start+2, $intron_end-2) or
            ($insertion && ($vf_start == $intron_start+2 || $vf_end == $intron_end-2)) ) {
            $intron_effects->{intronic} = 1;
        }

        # the definition of splice_region (SO:0001630) is "within 1-3 bases
        # of the exon or 3-8 bases of the intron", the intron start is the
        # first base of the intron so we only need to add or subtract 7 from
        # it to get the correct coordinate. We also need to special case
        # insertions between the edge of an exon and a donor or acceptor site
        # and between a donor or acceptor site and the intron

        if ( overlap($vf_start, $vf_end, $intron_start-3, $intron_start-1) or
             overlap($vf_start, $vf_end, $intron_start+2, $intron_start+7) or
             overlap($vf_start, $vf_end, $intron_end-7,   $intron_end-2  ) or
             overlap($vf_start, $vf_end, $intron_end+1,   $intron_end+3  ) or
             ($insertion && (
                 $vf_start == $intron_start   ||
                 $vf_end   == $intron_end     ||
                 $vf_start == $intron_start+2 ||
                 $vf_end   == $intron_end-2
             ) )) {

            $intron_effects->{splice_region} = 1;
        }
    }

    $self->{_intron_effects} = $intron_effects;

    return $intron_effects;
}
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
585
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
586 # NB: the methods below all cache their data in the associated transcript itself, this
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
587 # gives a significant speed up when you are calculating the effect of all variations
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
588 # on a transcript, and means that the cache will be freed when the transcript itself
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
589 # is garbage collected rather than us having to maintain a transcript feature cache
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
590 # ourselves
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
591
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
sub _introns {
    my ($self) = @_;

    my $tran = $self->transcript;

    # fetch the introns once and keep them on the transcript itself, so
    # later calls for the same transcript reuse them
    unless ($tran->{_variation_effect_feature_cache}->{introns}) {
        $tran->{_variation_effect_feature_cache}->{introns} = $tran->get_all_Introns;
    }

    return $tran->{_variation_effect_feature_cache}->{introns};
}
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
601
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
sub _exons {
    my ($self) = @_;

    my $tran = $self->transcript;

    # fetch the exons once and keep them on the transcript itself, so
    # later calls for the same transcript reuse them
    unless ($tran->{_variation_effect_feature_cache}->{exons}) {
        $tran->{_variation_effect_feature_cache}->{exons} = $tran->get_all_Exons;
    }

    return $tran->{_variation_effect_feature_cache}->{exons};
}
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
611
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
sub _mapper {
    my ($self) = @_;

    my $tran = $self->transcript;

    # build the transcript mapper once and keep it on the transcript itself,
    # so later calls for the same transcript reuse it
    unless ($tran->{_variation_effect_feature_cache}->{mapper}) {
        $tran->{_variation_effect_feature_cache}->{mapper} = $tran->get_TranscriptMapper;
    }

    return $tran->{_variation_effect_feature_cache}->{mapper};
}
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
sub _translateable_seq {
    my ($self) = @_;

    my $tran = $self->transcript;

    # fetch the translateable sequence once and keep it on the transcript
    # itself; a false value is not treated as cached and is fetched again
    unless ($tran->{_variation_effect_feature_cache}->{translateable_seq}) {
        $tran->{_variation_effect_feature_cache}->{translateable_seq} = $tran->translateable_seq;
    }

    return $tran->{_variation_effect_feature_cache}->{translateable_seq};
}
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
630
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
sub _peptide {
    my ($self) = @_;

    my $tran = $self->transcript;

    # serve the peptide sequence from the transcript-level cache when present
    my $cached = $tran->{_variation_effect_feature_cache}->{peptide};
    return $cached if $cached;

    # translate() may return nothing, in which case the peptide is undef
    my $translation = $tran->translate;
    my $sequence    = $translation ? $translation->seq : undef;

    # NOTE(review): the cache test above is a truth test, so an undef result
    # stored here is recomputed on the next call - confirm this is intended
    $tran->{_variation_effect_feature_cache}->{peptide} = $sequence;

    return $sequence;
}
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
646
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
sub _translation_md5 {
    my ($self) = @_;

    my $tran = $self->transcript;

    # The key is tested with exists, so an undef digest (no peptide) is
    # cached too and the peptide is not looked up again.
    if (!exists $tran->{_variation_effect_feature_cache}->{translation_md5}) {
        my $peptide = $self->_peptide;
        my $digest  = $peptide ? md5_hex($peptide) : undef;

        $tran->{_variation_effect_feature_cache}->{translation_md5} = $digest;
    }

    return $tran->{_variation_effect_feature_cache}->{translation_md5};
}
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
659
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
sub _codon_table {
    my ($self) = @_;

    my $tran = $self->transcript;

    # serve the codon table id from the transcript-level cache when present
    my $table = $tran->{_variation_effect_feature_cache}->{codon_table};
    return $table if $table;

    # for mitochondrial DNA we need to use a different codon table; it is
    # read from the first 'codon_table' attribute of the transcript's slice
    my $attrib = $tran->slice->get_all_Attributes('codon_table')->[0];

    # default to the vertebrate codon table, which is denoted as 1
    $table = $attrib ? $attrib->value : 1;

    $tran->{_variation_effect_feature_cache}->{codon_table} = $table;

    return $table;
}
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
679
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
680 1;