annotate variant_effect_predictor/Bio/LiveSeq/Translation.pm @ 0:1f6dce3d34e0

Uploaded
author mahtabm
date Thu, 11 Apr 2013 02:01:53 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
1 # $Id: Translation.pm,v 1.12 2002/09/25 08:57:52 heikki Exp $
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
2 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
3 # bioperl module for Bio::LiveSeq::Translation
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
4 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
5 # Cared for by Joseph Insana <insana@ebi.ac.uk> <jinsana@gmx.net>
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
6 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
7 # Copyright Joseph Insana
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
8 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
9 # You may distribute this module under the same terms as perl itself
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
10 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
11 # POD documentation - main docs before the code
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
12
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
13 =head1 NAME
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
14
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
15 Bio::LiveSeq::Translation - Translation class for LiveSeq
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
16
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
17 =head1 SYNOPSIS
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
18
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
19 #documentation needed
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
20
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
21 =head1 DESCRIPTION
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
22
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
23 This stores informations about aminoacids translations of transcripts.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
24 The implementation is that a Translation object is the translation of
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
25 a Transcript object, with different possibilities of manipulation,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
26 different coordinate system and eventually its own ranges (protein domains).
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
27
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
28 =head1 AUTHOR - Joseph A.L. Insana
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
29
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
30 Email: Insana@ebi.ac.uk, jinsana@gmx.net
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
31
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
32 Address:
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
33
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
34 EMBL Outstation, European Bioinformatics Institute
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
35 Wellcome Trust Genome Campus, Hinxton
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
36 Cambs. CB10 1SD, United Kingdom
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
37
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
38 =head1 APPENDIX
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
39
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
40 The rest of the documentation details each of the object
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
41 methods. Internal methods are usually preceded with a _
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
42
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
43 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
44
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
45 # Let the code begin...
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
46
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
47 package Bio::LiveSeq::Translation;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
48 $VERSION=1.8;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
49
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
50 # Version history:
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
51 # Thu Mar 23 14:41:52 GMT 2000 v.1.0 begun
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
52 # Sat Mar 25 04:08:59 GMT 2000 v 1.2 valid(), label(), position()
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
53 # Tue Mar 28 03:37:17 BST 2000 v 1.3 added inheritance from Transcript, subseq relies on it!
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
54 # Fri Mar 31 16:53:53 BST 2000 v 1.4 new seq() function that checks for stop codons: it now returns only up to the stop but doesn't continue if stop not found
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
55 # Fri Mar 31 18:45:07 BST 2000 v 1.41 now it asks for Transcript->downstream_seq
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
56 # Fri Mar 31 19:20:04 BST 2000 v 1.49 seq() now works correctly
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
57 # Thu Apr 13 00:10:29 BST 2000 v 1.5 start and end now take the information from Transcript
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
58 # Thu Apr 27 16:18:55 BST 2000 v 1.6 translation_table info added
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
59 # Thu May 11 17:30:41 BST 2000 v 1.66 position method updated so to return a position also for labels not in frame (not at 1st triplet position)
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
60 # Mon May 22 14:59:14 BST 2000 v 1.7 labelsubseq added
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
61 # Mon May 22 15:22:12 BST 2000 v 1.71 labelsubseq tweaked for cases where startlabel==endlabel (no useless follow() query!)
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
62 # Mon May 22 15:28:49 BST 2000 v 1.74 modified seq() so that the "*" is printed
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
63 # Wed Jun 7 04:02:18 BST 2000 v 1.75 added offset()
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
64 # Thu Jun 29 15:10:22 BST 2000 v 1.76 bug corrected for elongation mutations, if stop codon is not found downstream
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
65 # Wed Mar 28 16:37:37 BST 2001 v 1.8 carp -> warn,throw (coded methods in SeqI)
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
66
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
67 use strict;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
68 #use Carp qw(croak carp cluck);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
69 use vars qw($VERSION @ISA);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
70 use Bio::LiveSeq::SeqI 3.2; # uses SeqI, inherits from it
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
71 use Bio::PrimarySeq;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
72 @ISA=qw(Bio::LiveSeq::Transcript );
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
73
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
74
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
75 =head2 new
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
76
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
77 Title : new
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
78 Usage : $protein = Bio::LiveSeq::Translation->new(-transcript => $transcr);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
79
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
80 Function: generates a new Bio::LiveSeq::Translation
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
81 Returns : reference to a new object of class Translation
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
82 Errorcode -1
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
83 Args : reference to an object of class Transcript
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
84
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
85 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
86
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
87 sub new {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
88 my ($thing, %args) = @_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
89 my $class = ref($thing) || $thing;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
90 my ($obj,%translation);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
91
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
92 my $transcript=$args{-transcript};
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
93
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
94 $obj = \%translation;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
95 $obj = bless $obj, $class;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
96
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
97 unless ($transcript) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
98 $obj->throw("$class not initialised because no -transcript given");
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
99 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
100 unless (ref($transcript) eq "Bio::LiveSeq::Transcript") {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
101 $obj->throw("$class not initialised because no object of class Transcript given");
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
102 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
103
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
104 #my $startbase = $transcript->start;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
105 #my $endbase = $transcript->end;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
106 my $strand = $transcript->strand;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
107 my $seq = $transcript->{'seq'};
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
108
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
109 $obj->{'strand'}=$strand;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
110 $obj->{'seq'}=$seq;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
111 $obj->{'transcript'}=$transcript;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
112 $obj->{'alphabet'}="protein";
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
113
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
114 $transcript->{'translation'}=$obj;# set the Translation ref into its Transcript
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
115 return $obj;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
116 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
117
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
118 =head2 get_Transcript
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
119
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
120 Title : valid
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
121 Usage : $transcript = $obj->get_Transcript()
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
122 Function: retrieves the reference to the object of class Transcript (if any)
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
123 attached to a LiveSeq object
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
124 Returns : object reference
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
125 Args : none
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
126
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
127 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
128
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
129 sub get_Transcript {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
130 my $self=shift;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
131 return ($self->{'transcript'});
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
132 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
133
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
134 # These get redefined here, overriding the SeqI ones
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
135
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
136 sub change {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
137 my ($self)=@_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
138 $self->warn("Cannot change a Translation object!\nChanges have to be issued at the nucleotide level!");
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
139 return (-1);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
140 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
141 sub positionchange {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
142 my ($self)=@_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
143 $self->warn("Cannot change a Translation object!\nChanges have to be issued at the nucleotide level!");
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
144 return (-1);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
145 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
146 sub labelchange {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
147 my ($self)=@_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
148 $self->warn("Cannot change a Translation object!\nChanges have to be issued at the nucleotide level!");
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
149 return (-1);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
150 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
151
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
152 # this just returns the translation of the transcript, without checking for
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
153 # stop codons
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
154 sub transl_seq {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
155 my $self=shift;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
156 my $transcript=$self->get_Transcript;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
157 my $translation=$transcript->translate(undef, undef, undef,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
158 $self->translation_table)->seq;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
159 return $translation;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
160 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
161
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
162 # version 1.74 -> now the "*" is printed
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
163 sub seq {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
164 my $self=shift;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
165 my $proteinseq;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
166 my $transcript=$self->get_Transcript;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
167 my $translation=$transcript->translate(undef, undef, undef,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
168 $self->translation_table)->seq;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
169 my $stop_pos=index($translation,"*");
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
170 if ($stop_pos == -1) { # no stop present, continue downstream
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
171 my $downstreamseq=$transcript->downstream_seq();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
172 #carp "the downstream is: $downstreamseq"; # debug
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
173 my $cdnaseq=$transcript->seq();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
174 my $extendedseq = new Bio::PrimarySeq(-seq => "$cdnaseq$downstreamseq",
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
175 -alphabet => 'dna'
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
176 );
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
177
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
178 $translation=$extendedseq->translate(undef, undef, undef,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
179 $self->translation_table)->seq;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
180 #carp "the new translation is: $translation"; # debug
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
181 $stop_pos=index($translation,"*");
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
182 if ($stop_pos == -1) { # still no stop present, return warning
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
183 $self->warn("Warning: no stop codon found in the retrieved sequence downstream of Transcript ",1);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
184 undef $stop_pos;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
185 $proteinseq=$translation;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
186 } else {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
187 $proteinseq=substr($translation,0,$stop_pos+1);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
188 #carp "the new stopped translation is: $proteinseq, because the stop is at position $stop_pos"; # debug
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
189 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
190 } else {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
191 $proteinseq=substr($translation,0,$stop_pos+1);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
192 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
193 return $proteinseq;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
194 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
195
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
196 sub length {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
197 my $self=shift;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
198 my $seq=$self->seq;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
199 my $length=length($seq);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
200 return $length;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
201 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
202
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
203 sub all_labels {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
204 my $self=shift;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
205 return $self->get_Transcript->all_labels;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
206 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
207
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
208 # counts in triplet. Only a label matching the beginning of a triplet coding
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
209 # for an aminoacid is considered valid when setting coordinate_start
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
210 # (i.e. only in frame!)
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
211 sub valid {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
212 my ($self,$label)=@_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
213 my $i;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
214 my @labels=$self->get_Transcript->all_labels;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
215 my $length=$#labels;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
216 while ($i <= $length) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
217 if ($label == $labels[$i]) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
218 return (1); # found
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
219 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
220 $i=$i+3;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
221 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
222 return (0); # not found
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
223 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
224
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
225 # returns the label to the first nucleotide of the triplet coding for $position aminoacid
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
226 sub label {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
227 my ($self,$position)=@_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
228 my $firstlabel=$self->coordinate_start; # this is in_frame checked
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
229 if ($position > 0) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
230 $position=$position*3-2;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
231 } else { # if position = 0 this will be caught by Transcript, error thrown
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
232 $position=$position*3;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
233 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
234 return $self->get_Transcript->label($position,$firstlabel);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
235 # check for coord_start different
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
236 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
237
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
238 # returns position (aminoacids numbering) of a particular label
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
239 # used to return 0 for not in frame labels
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
240 # now returns the position anyway (after version 1.66)
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
241 sub position {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
242 my ($self,$label)=@_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
243 my $firstlabel=$self->coordinate_start; # this is in_frame checked
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
244 my $position=$self->get_Transcript->position($label,$firstlabel);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
245 use integer;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
246 my $modulus=$position % 3;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
247 if ($position == 0) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
248 return (0);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
249 } elsif ($position > 0) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
250 if ($modulus != 1) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
251 $self->warn("Attention! Label $label is not in frame ".
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
252 "(1st position of triplet) with protein",1) if $self->verbose > 0; # ignorable
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
253 if ($modulus == 2) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
254 return ($position / 3 + 1);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
255 } else { # i.e. modulus == 0
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
256 return ($position / 3);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
257 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
258 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
259 return ($position / 3 + 1);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
260 } else { # pos < 0
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
261 if ($modulus != 0) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
262 $self->warn("Attention! Label $label is not in frame ".
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
263 "(1st position of triplet) with protein",1) if $self->verbose > 0; # ignorable
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
264 return ($position / 3 - 1); # ok for both other positions
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
265 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
266 return ($position / 3);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
267 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
268 $self->throw( "WEIRD: execution shouldn't have reached here");
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
269 return (0); # this should never happen, but just in case
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
270 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
271
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
272 # note: it inherits subseq and labelsubseq from Transcript!
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
273
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
274 sub start {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
275 my $self=shift;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
276 return ($self->{'transcript'}->start);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
277 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
278
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
279 sub end {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
280 my $self=shift;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
281 return ($self->{'transcript'}->end);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
282 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
283
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
284 =head2 aa_ranges
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
285
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
286 Title : aa_ranges
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
287 Usage : @proteinfeatures = $translation->aa_ranges()
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
288 Function: to retrieve all the LiveSeq AARange objects attached to a
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
289 Translation, usually created out of a SwissProt database entry
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
290 crossreferenced from an EMBL CDS feature.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
291 Returns : an array
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
292 Args : none
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
293
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
294 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
295
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
296 # returns an array of obj_ref of AARange objects attached to the Translation
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
297 sub aa_ranges {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
298 my $self=shift;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
299 return ($self->{'aa_ranges'});
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
300 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
301
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
302 sub translation_table {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
303 my $self=shift;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
304 $self->get_Transcript->translation_table(@_);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
305 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
306
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
307 # returns all aminoacids "affected" i.e. all aminoacids coded by any codon
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
308 # "touched" by the range selected between the labels, even if only partially.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
309
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
310 # it's not optimized for performance but it's useful
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
311
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
312 sub labelsubseq {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
313 my ($self,$start,$length,$end)=@_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
314 my ($pos1,$pos2);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
315 my $transcript=$self->get_Transcript;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
316 if ($start) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
317 unless ($transcript->valid($start)) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
318 $self->warn("Start label not valid"); return (-1);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
319 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
320 $pos1=$self->position($start);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
321 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
322 if ($end) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
323 if ($end == $start) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
324 $length=1;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
325 } else {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
326 unless ($transcript->valid($end)) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
327 $self->warn("End label not valid"); return (-1);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
328 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
329 unless ($transcript->follows($start,$end) == 1) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
330 $self->warn("End label does not follow Start label!"); return (-1);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
331 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
332 $pos2=$self->position($end);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
333 $length=$pos2-$pos1+1;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
334 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
335 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
336 my $sequence=$self->seq;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
337 return (substr($sequence,$pos1-1,$length));
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
338 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
339
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
340 # return the offset in aminoacids from LiveSeq protein sequence and SwissProt
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
341 # sequence (usually as a result of an INIT_MET or a gap)
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
342 sub offset {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
343 my $self=shift;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
344 return ($self->{'offset'});
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
345 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
346
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
347 1;