annotate variant_effect_predictor/Bio/LiveSeq/Translation.pm @ 0:2bc9b66ada89 draft default tip

Uploaded
author mahtabm
date Thu, 11 Apr 2013 06:29:17 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
1 # $Id: Translation.pm,v 1.12 2002/09/25 08:57:52 heikki Exp $
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
2 #
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
3 # bioperl module for Bio::LiveSeq::Translation
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
4 #
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
5 # Cared for by Joseph Insana <insana@ebi.ac.uk> <jinsana@gmx.net>
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
6 #
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
7 # Copyright Joseph Insana
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
8 #
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
9 # You may distribute this module under the same terms as perl itself
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
10 #
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
11 # POD documentation - main docs before the code
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
12
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
13 =head1 NAME
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
14
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
15 Bio::LiveSeq::Translation - Translation class for LiveSeq
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
16
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
17 =head1 SYNOPSIS
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
18
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
19 #documentation needed
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
20
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
21 =head1 DESCRIPTION
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
22
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
23 This stores informations about aminoacids translations of transcripts.
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
24 The implementation is that a Translation object is the translation of
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
25 a Transcript object, with different possibilities of manipulation,
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
26 different coordinate system and eventually its own ranges (protein domains).
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
27
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
28 =head1 AUTHOR - Joseph A.L. Insana
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
29
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
30 Email: Insana@ebi.ac.uk, jinsana@gmx.net
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
31
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
32 Address:
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
33
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
34 EMBL Outstation, European Bioinformatics Institute
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
35 Wellcome Trust Genome Campus, Hinxton
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
36 Cambs. CB10 1SD, United Kingdom
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
37
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
38 =head1 APPENDIX
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
39
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
40 The rest of the documentation details each of the object
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
41 methods. Internal methods are usually preceded with a _
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
42
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
43 =cut
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
44
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
45 # Let the code begin...
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
46
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
47 package Bio::LiveSeq::Translation;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
48 $VERSION=1.8;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
49
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
50 # Version history:
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
51 # Thu Mar 23 14:41:52 GMT 2000 v.1.0 begun
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
52 # Sat Mar 25 04:08:59 GMT 2000 v 1.2 valid(), label(), position()
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
53 # Tue Mar 28 03:37:17 BST 2000 v 1.3 added inheritance from Transcript, subseq relies on it!
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
54 # Fri Mar 31 16:53:53 BST 2000 v 1.4 new seq() function that checks for stop codons: it now returns only up to the stop but doesn't continue if stop not found
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
55 # Fri Mar 31 18:45:07 BST 2000 v 1.41 now it asks for Transcript->downstream_seq
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
56 # Fri Mar 31 19:20:04 BST 2000 v 1.49 seq() now works correctly
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
57 # Thu Apr 13 00:10:29 BST 2000 v 1.5 start and end now take the information from Transcript
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
58 # Thu Apr 27 16:18:55 BST 2000 v 1.6 translation_table info added
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
59 # Thu May 11 17:30:41 BST 2000 v 1.66 position method updated so to return a position also for labels not in frame (not at 1st triplet position)
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
60 # Mon May 22 14:59:14 BST 2000 v 1.7 labelsubseq added
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
61 # Mon May 22 15:22:12 BST 2000 v 1.71 labelsubseq tweaked for cases where startlabel==endlabel (no useless follow() query!)
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
62 # Mon May 22 15:28:49 BST 2000 v 1.74 modified seq() so that the "*" is printed
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
63 # Wed Jun 7 04:02:18 BST 2000 v 1.75 added offset()
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
64 # Thu Jun 29 15:10:22 BST 2000 v 1.76 bug corrected for elongation mutations, if stop codon is not found downstream
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
65 # Wed Mar 28 16:37:37 BST 2001 v 1.8 carp -> warn,throw (coded methods in SeqI)
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
66
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
67 use strict;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
68 #use Carp qw(croak carp cluck);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
69 use vars qw($VERSION @ISA);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
70 use Bio::LiveSeq::SeqI 3.2; # uses SeqI, inherits from it
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
71 use Bio::PrimarySeq;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
72 @ISA=qw(Bio::LiveSeq::Transcript );
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
73
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
74
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
75 =head2 new
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
76
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
77 Title : new
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
78 Usage : $protein = Bio::LiveSeq::Translation->new(-transcript => $transcr);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
79
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
80 Function: generates a new Bio::LiveSeq::Translation
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
81 Returns : reference to a new object of class Translation
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
82 Errorcode -1
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
83 Args : reference to an object of class Transcript
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
84
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
85 =cut
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
86
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
87 sub new {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
88 my ($thing, %args) = @_;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
89 my $class = ref($thing) || $thing;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
90 my ($obj,%translation);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
91
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
92 my $transcript=$args{-transcript};
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
93
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
94 $obj = \%translation;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
95 $obj = bless $obj, $class;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
96
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
97 unless ($transcript) {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
98 $obj->throw("$class not initialised because no -transcript given");
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
99 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
100 unless (ref($transcript) eq "Bio::LiveSeq::Transcript") {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
101 $obj->throw("$class not initialised because no object of class Transcript given");
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
102 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
103
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
104 #my $startbase = $transcript->start;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
105 #my $endbase = $transcript->end;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
106 my $strand = $transcript->strand;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
107 my $seq = $transcript->{'seq'};
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
108
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
109 $obj->{'strand'}=$strand;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
110 $obj->{'seq'}=$seq;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
111 $obj->{'transcript'}=$transcript;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
112 $obj->{'alphabet'}="protein";
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
113
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
114 $transcript->{'translation'}=$obj;# set the Translation ref into its Transcript
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
115 return $obj;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
116 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
117
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
118 =head2 get_Transcript
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
119
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
120 Title : valid
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
121 Usage : $transcript = $obj->get_Transcript()
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
122 Function: retrieves the reference to the object of class Transcript (if any)
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
123 attached to a LiveSeq object
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
124 Returns : object reference
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
125 Args : none
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
126
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
127 =cut
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
128
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
129 sub get_Transcript {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
130 my $self=shift;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
131 return ($self->{'transcript'});
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
132 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
133
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
134 # These get redefined here, overriding the SeqI ones
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
135
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
136 sub change {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
137 my ($self)=@_;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
138 $self->warn("Cannot change a Translation object!\nChanges have to be issued at the nucleotide level!");
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
139 return (-1);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
140 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
141 sub positionchange {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
142 my ($self)=@_;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
143 $self->warn("Cannot change a Translation object!\nChanges have to be issued at the nucleotide level!");
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
144 return (-1);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
145 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
146 sub labelchange {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
147 my ($self)=@_;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
148 $self->warn("Cannot change a Translation object!\nChanges have to be issued at the nucleotide level!");
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
149 return (-1);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
150 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
151
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
152 # this just returns the translation of the transcript, without checking for
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
153 # stop codons
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
154 sub transl_seq {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
155 my $self=shift;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
156 my $transcript=$self->get_Transcript;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
157 my $translation=$transcript->translate(undef, undef, undef,
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
158 $self->translation_table)->seq;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
159 return $translation;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
160 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
161
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
162 # version 1.74 -> now the "*" is printed
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
163 sub seq {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
164 my $self=shift;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
165 my $proteinseq;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
166 my $transcript=$self->get_Transcript;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
167 my $translation=$transcript->translate(undef, undef, undef,
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
168 $self->translation_table)->seq;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
169 my $stop_pos=index($translation,"*");
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
170 if ($stop_pos == -1) { # no stop present, continue downstream
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
171 my $downstreamseq=$transcript->downstream_seq();
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
172 #carp "the downstream is: $downstreamseq"; # debug
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
173 my $cdnaseq=$transcript->seq();
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
174 my $extendedseq = new Bio::PrimarySeq(-seq => "$cdnaseq$downstreamseq",
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
175 -alphabet => 'dna'
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
176 );
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
177
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
178 $translation=$extendedseq->translate(undef, undef, undef,
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
179 $self->translation_table)->seq;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
180 #carp "the new translation is: $translation"; # debug
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
181 $stop_pos=index($translation,"*");
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
182 if ($stop_pos == -1) { # still no stop present, return warning
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
183 $self->warn("Warning: no stop codon found in the retrieved sequence downstream of Transcript ",1);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
184 undef $stop_pos;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
185 $proteinseq=$translation;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
186 } else {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
187 $proteinseq=substr($translation,0,$stop_pos+1);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
188 #carp "the new stopped translation is: $proteinseq, because the stop is at position $stop_pos"; # debug
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
189 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
190 } else {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
191 $proteinseq=substr($translation,0,$stop_pos+1);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
192 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
193 return $proteinseq;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
194 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
195
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
196 sub length {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
197 my $self=shift;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
198 my $seq=$self->seq;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
199 my $length=length($seq);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
200 return $length;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
201 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
202
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
203 sub all_labels {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
204 my $self=shift;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
205 return $self->get_Transcript->all_labels;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
206 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
207
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
208 # counts in triplet. Only a label matching the beginning of a triplet coding
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
209 # for an aminoacid is considered valid when setting coordinate_start
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
210 # (i.e. only in frame!)
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
211 sub valid {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
212 my ($self,$label)=@_;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
213 my $i;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
214 my @labels=$self->get_Transcript->all_labels;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
215 my $length=$#labels;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
216 while ($i <= $length) {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
217 if ($label == $labels[$i]) {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
218 return (1); # found
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
219 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
220 $i=$i+3;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
221 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
222 return (0); # not found
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
223 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
224
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
225 # returns the label to the first nucleotide of the triplet coding for $position aminoacid
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
226 sub label {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
227 my ($self,$position)=@_;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
228 my $firstlabel=$self->coordinate_start; # this is in_frame checked
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
229 if ($position > 0) {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
230 $position=$position*3-2;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
231 } else { # if position = 0 this will be caught by Transcript, error thrown
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
232 $position=$position*3;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
233 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
234 return $self->get_Transcript->label($position,$firstlabel);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
235 # check for coord_start different
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
236 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
237
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
238 # returns position (aminoacids numbering) of a particular label
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
239 # used to return 0 for not in frame labels
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
240 # now returns the position anyway (after version 1.66)
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
241 sub position {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
242 my ($self,$label)=@_;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
243 my $firstlabel=$self->coordinate_start; # this is in_frame checked
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
244 my $position=$self->get_Transcript->position($label,$firstlabel);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
245 use integer;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
246 my $modulus=$position % 3;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
247 if ($position == 0) {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
248 return (0);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
249 } elsif ($position > 0) {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
250 if ($modulus != 1) {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
251 $self->warn("Attention! Label $label is not in frame ".
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
252 "(1st position of triplet) with protein",1) if $self->verbose > 0; # ignorable
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
253 if ($modulus == 2) {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
254 return ($position / 3 + 1);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
255 } else { # i.e. modulus == 0
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
256 return ($position / 3);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
257 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
258 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
259 return ($position / 3 + 1);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
260 } else { # pos < 0
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
261 if ($modulus != 0) {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
262 $self->warn("Attention! Label $label is not in frame ".
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
263 "(1st position of triplet) with protein",1) if $self->verbose > 0; # ignorable
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
264 return ($position / 3 - 1); # ok for both other positions
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
265 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
266 return ($position / 3);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
267 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
268 $self->throw( "WEIRD: execution shouldn't have reached here");
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
269 return (0); # this should never happen, but just in case
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
270 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
271
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
272 # note: it inherits subseq and labelsubseq from Transcript!
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
273
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
274 sub start {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
275 my $self=shift;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
276 return ($self->{'transcript'}->start);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
277 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
278
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
279 sub end {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
280 my $self=shift;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
281 return ($self->{'transcript'}->end);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
282 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
283
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
284 =head2 aa_ranges
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
285
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
286 Title : aa_ranges
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
287 Usage : @proteinfeatures = $translation->aa_ranges()
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
288 Function: to retrieve all the LiveSeq AARange objects attached to a
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
289 Translation, usually created out of a SwissProt database entry
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
290 crossreferenced from an EMBL CDS feature.
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
291 Returns : an array
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
292 Args : none
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
293
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
294 =cut
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
295
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
296 # returns an array of obj_ref of AARange objects attached to the Translation
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
297 sub aa_ranges {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
298 my $self=shift;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
299 return ($self->{'aa_ranges'});
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
300 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
301
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
302 sub translation_table {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
303 my $self=shift;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
304 $self->get_Transcript->translation_table(@_);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
305 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
306
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
307 # returns all aminoacids "affected" i.e. all aminoacids coded by any codon
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
308 # "touched" by the range selected between the labels, even if only partially.
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
309
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
310 # it's not optimized for performance but it's useful
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
311
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
312 sub labelsubseq {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
313 my ($self,$start,$length,$end)=@_;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
314 my ($pos1,$pos2);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
315 my $transcript=$self->get_Transcript;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
316 if ($start) {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
317 unless ($transcript->valid($start)) {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
318 $self->warn("Start label not valid"); return (-1);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
319 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
320 $pos1=$self->position($start);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
321 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
322 if ($end) {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
323 if ($end == $start) {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
324 $length=1;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
325 } else {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
326 unless ($transcript->valid($end)) {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
327 $self->warn("End label not valid"); return (-1);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
328 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
329 unless ($transcript->follows($start,$end) == 1) {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
330 $self->warn("End label does not follow Start label!"); return (-1);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
331 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
332 $pos2=$self->position($end);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
333 $length=$pos2-$pos1+1;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
334 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
335 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
336 my $sequence=$self->seq;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
337 return (substr($sequence,$pos1-1,$length));
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
338 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
339
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
340 # return the offset in aminoacids from LiveSeq protein sequence and SwissProt
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
341 # sequence (usually as a result of an INIT_MET or a gap)
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
342 sub offset {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
343 my $self=shift;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
344 return ($self->{'offset'});
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
345 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
346
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
347 1;