annotate variant_effect_predictor/Bio/EnsEMBL/Intron.pm @ 0:1f6dce3d34e0

Uploaded
author mahtabm
date Thu, 11 Apr 2013 02:01:53 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
1 =head1 LICENSE
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
2
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
3 Copyright (c) 1999-2012 The European Bioinformatics Institute and
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
4 Genome Research Limited. All rights reserved.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
5
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
6 This software is distributed under a modified Apache license.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
7 For license details, please see
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
8
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
9 http://www.ensembl.org/info/about/code_licence.html
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
10
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
11 =head1 CONTACT
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
12
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
13 Please email comments or questions to the public Ensembl
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
14 developers list at <dev@ensembl.org>.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
15
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
16 Questions may also be sent to the Ensembl help desk at
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
17 <helpdesk@ensembl.org>.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
18
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
19 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
20
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
21 =head1 NAME

Bio::EnsEMBL::Intron - A class representing an Intron
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
22
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
23 =head1 SYNOPSIS
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
24
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
25 $intron = Bio::EnsEMBL::Intron->new( $exon1, $exon2, $analysis );
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
26
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
27 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
28
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
29
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
30 package Bio::EnsEMBL::Intron;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
31 use strict;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
32 use warnings;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
33
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
34 use Bio::EnsEMBL::Utils::Exception qw( warning throw );
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
35
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
36 use base qw(Bio::EnsEMBL::Feature);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
37
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
=head2 new

  Arg [1]    : Bio::EnsEMBL::Exon The 5' exon for the intron; required
  Arg [2]    : Bio::EnsEMBL::Exon The 3' exon for the intron; required
  Arg [3]    : Bio::EnsEMBL::Analysis Analysis to link to this Intron;
               optional
  Example    : $intron = Bio::EnsEMBL::Intron->new( $exon1, $exon2 );
  Description: Create an Intron object spanning the gap between two exons,
               with an optional analysis.  The intron starts one base
               after the end of the lower-coordinate exon and ends one
               base before the start of the other; which exon is which
               is decided by the strand of the 5' exon.
               The strand is only set when both exons agree on it, and
               the slice is only set when both exons return the same
               slice reference.
  Returntype : Bio::EnsEMBL::Intron
  Exceptions : thrown if either exon is undefined;
               thrown if the exons' slices differ in seq_region name or
               in coordinate system name;
               warning if the exons hold different slice references to
               the same seq_region (the intron's slice is left unset).
               Exons on different strands do not raise an exception.
  Caller     : general
  Status     : Stable

=cut

sub new {
  my ( $proto, $e1, $e2, $analysis ) = @_;

  # Both exons are documented as required; fail with a readable message
  # rather than a "Can't call method on undefined value" error.
  if ( !defined $e1 || !defined $e2 ) {
    throw("Both a 5' and a 3' exon are required to create an Intron");
  }

  my $class = ref $proto || $proto;
  my $self  = $class->SUPER::new();

  # The intron occupies the gap between the exons.  On the reverse
  # strand the 5' exon has the higher coordinates, so the roles of the
  # two exons are swapped.
  my $strand = $e1->strand();
  if ( $strand == -1 ) {
    $self->{'end'}   = $e1->start() - 1;
    $self->{'start'} = $e2->end() + 1;
  }
  else {
    $self->{'start'} = $e1->end() + 1;
    $self->{'end'}   = $e2->start() - 1;
  }

  # Exons on different strands are tolerated (the throw for this case is
  # disabled in the code); the strand is simply left unset then.
  if ( $strand == $e2->strand() ) {
    $self->{'strand'} = $strand;
  }

  my $slice1 = $e1->slice();
  my $slice2 = $e2->slice();

  if ( $slice1 ne $slice2 ) {
    # Different slice objects are only acceptable when they describe the
    # same seq_region, i.e. BOTH the seq_region name and the coordinate
    # system name match.  A mismatch in either one is an error.
    if ( $slice1->seq_region_name() ne $slice2->seq_region_name()
      || $slice1->coord_system_name() ne $slice2->coord_system_name() )
    {
      throw("Exons on different slices. Not allowed");
    }

    warning("Exons have different slice references to the same seq_region");
  }
  else {
    $self->{'slice'} = $slice1;
  }

  if ($analysis) {
    $self->analysis($analysis);
  }

  # Remember the flanking exons for prev_Exon() / next_Exon().
  $self->{'prev'} = $e1;
  $self->{'next'} = $e2;

  return $self;
} ## end sub new
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
96
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
=head2 length

  Args       : none
  Example    : $length = $intron->length();
  Description: Returns the number of bases covered by this intron,
               computed as end - start + 1.  An intron whose end is one
               less than its start therefore has length zero.
  Returntype : Integer
  Exceptions : none
  Caller     : general
  Status     : Stable

=cut

sub length {
  my $self = shift;

  # TODO: Introns on circular slices, see Feature.pm but allow for
  # zero-length introns.

  my ( $first_base, $last_base ) = @{$self}{ 'start', 'end' };

  return $last_base - $first_base + 1;
}
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
117
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
118
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
=head2 prev_Exon

  Args       : none
  Example    : $exon = $intron->prev_Exon();
  Description: Returns the exon preceding this Intron, i.e. the object
               stored under the 'prev' key (the 5' exon handed to new()).
  Returntype : Bio::EnsEMBL::Exon
  Exceptions : none
  Caller     : general
  Status     : Stable

=cut

sub prev_Exon {
  my ($self) = @_;

  my $upstream_exon = $self->{'prev'};

  return $upstream_exon;
}
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
136
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
137
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
=head2 next_Exon

  Args       : none
  Example    : $exon = $intron->next_Exon();
  Description: Returns the exon following this Intron, i.e. the object
               stored under the 'next' key (the 3' exon handed to new()).
  Returntype : Bio::EnsEMBL::Exon
  Exceptions : none
  Caller     : general
  Status     : Stable

=cut

sub next_Exon {
  my ($self) = @_;

  my $downstream_exon = $self->{'next'};

  return $downstream_exon;
}
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
155
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
=head2 is_splice_canonical

  Example     : my $canonical = $intron->is_splice_canonical();
  Description : Indicates if the splice site is considered normal. The
                donor (D) and acceptor (A) sequences returned by
                splice_seq() are concatenated and must form one of
                  GT (D) => AG (A)
                  AT (D) => AC (A)
                  GC (D) => AG (A)
  Returntype  : Boolean; 1 if the splice site pair is one of the above,
                0 otherwise
  Exceptions  : See splice_seq

=cut

sub is_splice_canonical {
  my $self = shift;

  # Donor + acceptor dinucleotides that count as canonical.
  my %is_canonical = map { $_ => 1 } qw( GTAG ATAC GCAG );

  my $motif = join q{}, @{ $self->splice_seq() };

  return $is_canonical{$motif} ? 1 : 0;
}
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
177
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
=head2 splice_seq

  Example     : my ($donor, $acceptor) = @{$intron->splice_seq};
  Description : Get the donor and acceptor splice sites for this intron.
                The donor is read from positions 1-2 of the intron's
                feature slice and the acceptor from its last two
                positions (length-1 to length); both are upper-cased.
  Returntype  : ArrayRef[String] The donor and acceptor sequences as Strings
  Exceptions  : Thrown if a feature Slice cannot be found

=cut

sub splice_seq {
  my $self = shift;

  my $intron_slice = $self->feature_Slice()
    or throw("Cannot retrieve feature_Slice() for this Intron");

  my $last_base = $self->length();

  # Donor first, acceptor second: [from, to] pairs on the feature slice.
  my @site_ranges = ( [ 1, 2 ], [ $last_base - 1, $last_base ] );

  my @sites;
  for my $range (@site_ranges) {
    my ( $from, $to ) = @{$range};
    push @sites, uc( $intron_slice->subseq( $from, $to ) );
  }

  return \@sites;
}
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
196
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
197 1;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
198
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
199