annotate variant_effect_predictor/Bio/SeqFeature/Gene/Transcript.pm @ 3:d30fa12e4cc5 default tip

Merge heads 2:a5976b2dce6f and 1:09613ce8151e which were created as a result of a recently fixed bug.
author devteam <devteam@galaxyproject.org>
date Mon, 13 Jan 2014 10:38:30 -0500
parents 1f6dce3d34e0
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
1 # $Id: Transcript.pm,v 1.25 2002/12/29 09:37:51 lapp Exp $
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
2 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
3 # BioPerl module for Bio::SeqFeature::Gene::Transcript
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
4 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
5 # Cared for by Hilmar Lapp <hlapp@gmx.net>
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
6 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
7 # Copyright Hilmar Lapp
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
8 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
9 # You may distribute this module under the same terms as perl itself
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
10
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
11 # POD documentation - main docs before the code
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
12
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
13 =head1 NAME
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
14
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
15 Bio::SeqFeature::Gene::Transcript - A feature representing a transcript
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
16
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
17 =head1 SYNOPSIS
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
18
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
19 See documentation of methods.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
20
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
21 =head1 DESCRIPTION
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
22
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
23 A feature representing a transcript.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
24
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
25
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
26 =head1 FEEDBACK
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
27
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
28 =head2 Mailing Lists
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
29
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
30 User feedback is an integral part of the evolution of this
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
31 and other Bioperl modules. Send your comments and suggestions preferably
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
32 to one of the Bioperl mailing lists.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
33 Your participation is much appreciated.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
34
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
35 bioperl-l@bioperl.org - General discussion
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
36 http://bio.perl.org/MailList.html - About the mailing lists
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
37
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
38 =head2 Reporting Bugs
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
39
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
40 Report bugs to the Bioperl bug tracking system to help us keep track
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
41 the bugs and their resolution.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
42 Bug reports can be submitted via email or the web:
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
43
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
44 bioperl-bugs@bio.perl.org
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
45 http://bugzilla.bioperl.org/
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
46
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
47 =head1 AUTHOR - Hilmar Lapp
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
48
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
49 Email hlapp@gmx.net
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
50
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
51 Describe contact details here
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
52
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
53 =head1 APPENDIX
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
54
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
55 The rest of the documentation details each of the object methods. Internal methods are usually preceded with a _
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
56
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
57 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
58
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
59
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
60 # Let the code begin...
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
61
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
62 package Bio::SeqFeature::Gene::Transcript;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
63 use vars qw(@ISA);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
64 use strict;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
65
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
66 # Object preamble - inherits from Bio::Root::Object
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
67
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
68 use Bio::SeqFeature::Gene::TranscriptI;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
69 use Bio::SeqFeature::Generic;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
70 use Bio::PrimarySeq;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
71
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
72 @ISA = qw(Bio::SeqFeature::Generic Bio::SeqFeature::Gene::TranscriptI);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
73
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
74 sub new {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
75 my ($caller, @args) = @_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
76 my $self = $caller->SUPER::new(@args);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
77 my ($primary) = $self->_rearrange([qw(PRIMARY)],@args);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
78
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
79 $primary = 'transcript' unless $primary;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
80 $self->primary_tag($primary);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
81 $self->strand(0) if(! defined($self->strand()));
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
82 return $self;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
83 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
84
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
85
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
86 =head2 promoters
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
87
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
88 Title : promoters()
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
89 Usage : @proms = $transcript->promoters();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
90 Function: Get the promoter features/sites of this transcript.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
91
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
92 Note that OO-modeling of regulatory elements is not stable yet.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
93 This means that this method might change or even disappear in a
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
94 future release. Be aware of this if you use it.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
95
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
96 Returns : An array of Bio::SeqFeatureI implementing objects representing the
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
97 promoter regions or sites.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
98 Args :
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
99
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
100
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
101 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
102
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
103 sub promoters {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
104 my ($self) = @_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
105 return $self->get_feature_type('Bio::SeqFeature::Gene::Promoter');
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
106 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
107
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
108 =head2 add_promoter
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
109
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
110 Title : add_promoter()
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
111 Usage : $transcript->add_promoter($feature);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
112 Function: Add a promoter feature/site to this transcript.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
113
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
114
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
115 Note that OO-modeling of regulatory elements is not stable yet.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
116 This means that this method might change or even disappear in a
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
117 future release. Be aware of this if you use it.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
118
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
119 Returns :
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
120 Args : A Bio::SeqFeatureI implementing object.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
121
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
122
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
123 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
124
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
125 sub add_promoter {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
126 my ($self, $fea) = @_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
127 $self->_add($fea,'Bio::SeqFeature::Gene::Promoter');
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
128 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
129
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
130 =head2 flush_promoters
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
131
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
132 Title : flush_promoters()
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
133 Usage : $transcript->flush_promoters();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
134 Function: Remove all promoter features/sites from this transcript.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
135
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
136 Note that OO-modeling of regulatory elements is not stable yet.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
137 This means that this method might change or even disappear in a
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
138 future release. Be aware of this if you use it.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
139
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
140 Returns : the removed features as a list
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
141 Args : none
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
142
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
143
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
144 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
145
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
146 sub flush_promoters {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
147 my ($self) = @_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
148 return $self->_flush('Bio::SeqFeature::Gene::Promoter');
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
149 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
150
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
151 =head2 exons
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
152
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
153 Title : exons()
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
154 Usage : @exons = $gene->exons();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
155 ($inital_exon) = $gene->exons('Initial');
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
156 Function: Get all exon features or all exons of specified type of this
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
157 transcript.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
158
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
159 Exon type is treated as a case-insensitive regular expression and
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
160 is optional. For consistency, use only the following types:
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
161 initial, internal, terminal.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
162
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
163 Returns : An array of Bio::SeqFeature::Gene::ExonI implementing objects.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
164 Args : An optional string specifying the primary_tag of the feature.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
165
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
166
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
167 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
168
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
169 sub exons {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
170 my ($self, $type) = @_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
171 return $self->get_unordered_feature_type('Bio::SeqFeature::Gene::ExonI',
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
172 $type);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
173 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
174
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
175 =head2 exons_ordered
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
176
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
177 Title : exons_ordered
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
178 Usage : @exons = $gene->exons_ordered();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
179 @exons = $gene->exons_ordered("Internal");
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
180 Function: Get an ordered list of all exon features or all exons of specified
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
181 type of this transcript.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
182
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
183 Exon type is treated as a case-insensitive regular expression and
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
184 is optional. For consistency, use only the following types:
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
185
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
186 Returns : An array of Bio::SeqFeature::Gene::ExonI implementing objects.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
187 Args : An optional string specifying the primary_tag of the feature.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
188
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
189 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
190
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
191 sub exons_ordered {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
192 my ($self,$type) = @_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
193 return $self->get_feature_type('Bio::SeqFeature::Gene::ExonI', $type);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
194 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
195
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
196 =head2 add_exon
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
197
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
198 Title : add_exon()
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
199 Usage : $transcript->add_exon($exon,'initial');
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
200 Function: Add a exon feature to this transcript.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
201
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
202 The second argument denotes the type of exon. Mixing exons with and
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
203 without a type is likely to cause trouble in exons(). Either
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
204 leave out the type for all exons or for none.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
205
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
206 Presently, the following types are known: initial, internal,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
207 terminal, utr, utr5prime, and utr3prime (all case-insensitive).
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
208 UTR should better be added through utrs()/add_utr().
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
209
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
210 If you wish to use other or additional types, you will almost
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
211 certainly have to call exon_type_sortorder() in order to replace
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
212 the default sort order, or mrna(), cds(), protein(), and exons()
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
213 may yield unexpected results.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
214
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
215 Returns :
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
216 Args : A Bio::SeqFeature::Gene::ExonI implementing object.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
217 A string indicating the type of the exon (optional).
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
218
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
219
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
220 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
221
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
222 sub add_exon {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
223 my ($self, $fea) = @_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
224 if(! $fea->isa('Bio::SeqFeature::Gene::ExonI') ) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
225 $self->throw("$fea does not implement Bio::SeqFeature::Gene::ExonI");
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
226 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
227 $self->_add($fea,'Bio::SeqFeature::Gene::Exon');
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
228 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
229
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
230 =head2 flush_exons
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
231
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
232 Title : flush_exons()
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
233 Usage : $transcript->flush_exons();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
234 $transcript->flush_exons('terminal');
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
235 Function: Remove all or a certain type of exon features from this transcript.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
236
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
237 See add_exon() for documentation about types.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
238
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
239 Calling without a type will not flush UTRs. Call flush_utrs() for
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
240 this purpose.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
241 Returns : the deleted features as a list
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
242 Args : A string indicating the type of the exon (optional).
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
243
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
244
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
245 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
246
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
247 sub flush_exons {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
248 my ($self, $type) = @_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
249 return $self->_flush('Bio::SeqFeature::Gene::Exon',$type);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
250 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
251
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
252 =head2 introns
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
253
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
254 Title : introns()
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
255 Usage : @introns = $gene->introns();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
256 Function: Get all intron features this gene structure.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
257
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
258 Note that this implementation generates these features
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
259 on-the-fly, that is, it simply treats all regions between
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
260 exons as introns, assuming that exons do not overlap. A
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
261 consequence is that a consistent correspondence between the
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
262 elements in the returned array and the array that exons()
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
263 returns will exist only if the exons are properly sorted
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
264 within their types (forward for plus- strand and reverse
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
265 for minus-strand transcripts). To ensure correctness the
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
266 elements in the array returned will always be sorted.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
267
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
268 Returns : An array of Bio::SeqFeature::Gene::Intron objects representing
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
269 the intron regions.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
270 Args :
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
271
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
272
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
273 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
274
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
275 sub introns {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
276 my ($self) = @_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
277 my @introns = ();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
278 my @exons = $self->exons();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
279 my ($strand, $rev_order);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
280
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
281 # if there's 1 or less exons we're done
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
282 return () unless($#exons > 0);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
283 # record strand and order (a minus-strand transcript is likely to have
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
284 # the exons stacked in reverse order)
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
285 foreach my $exon (@exons) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
286 $strand = $exon->strand();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
287 last if $strand; # we're done if we've got 1 or -1
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
288 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
289 $rev_order = ($exons[0]->end() < $exons[1]->start() ? 0 : 1);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
290
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
291 # Make sure exons are sorted. Because we assume they don't overlap, we
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
292 # simply sort by start position.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
293 if((! defined($strand)) || ($strand != -1) || (! $rev_order)) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
294 # always sort forward for plus-strand transcripts, and for negative-
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
295 # strand transcripts that appear to be unsorted or forward sorted
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
296 @exons = map { $_->[0] } sort { $a->[1] <=> $b->[1] } map { [ $_, $_->start()] } @exons;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
297 } else {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
298 # sort in reverse order for transcripts on the negative strand and
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
299 # found to be in reverse order
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
300 @exons = map { $_->[0] } sort { $b->[1] <=> $a->[1] } map { [ $_, $_->start()] } @exons;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
301 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
302 # loop over all intervening gaps
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
303 for(my $i = 0; $i < $#exons; $i++) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
304 my ($start, $end);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
305 my $intron;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
306
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
307 if(defined($exons[$i]->strand()) &&
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
308 (($exons[$i]->strand() * $strand) < 0)) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
309 $self->throw("Transcript mixes plus and minus strand exons. ".
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
310 "Computing introns makes no sense then.");
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
311 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
312 $start = $exons[$i+$rev_order]->end() + 1; # $i or $i+1
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
313 $end = $exons[$i+1-$rev_order]->start() - 1; # $i+1 or $i
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
314 $intron = Bio::SeqFeature::Gene::Intron->new(
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
315 '-start' => $start,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
316 '-end' => $end,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
317 '-strand' => $strand,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
318 '-primary' => 'intron',
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
319 '-source' => ref($self));
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
320 my $seq = $self->entire_seq();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
321 $intron->attach_seq($seq) if $seq;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
322 $intron->seq_id($self->seq_id());
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
323 push(@introns, $intron);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
324 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
325 return @introns;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
326 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
327
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
328 =head2 poly_A_site
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
329
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
330 Title : poly_A_site()
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
331 Usage : $polyAsite = $transcript->poly_A_site();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
332 Function: Get/set the poly-adenylation feature/site of this transcript.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
333 Returns : A Bio::SeqFeatureI implementing object representing the
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
334 poly-adenylation region.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
335 Args : A Bio::SeqFeatureI implementing object on set, or FALSE to flush
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
336 a previously set object.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
337
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
338
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
339 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
340
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
341 sub poly_A_site {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
342 my ($self, $fea) = @_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
343 if ($fea) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
344 $self->_add($fea,'Bio::SeqFeature::Gene::Poly_A_site');
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
345 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
346 return ($self->get_feature_type('Bio::SeqFeature::Gene::Poly_A_site'))[0];
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
347 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
348
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
349 =head2 utrs
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
350
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
351 Title : utrs()
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
352 Usage : @utr_sites = $transcript->utrs('utr3prime');
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
353 @utr_sites = $transcript->utrs('utr5prime');
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
354 @utr_sites = $transcript->utrs();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
355 Function: Get the features representing untranslated regions (UTR) of this
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
356 transcript.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
357
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
358 You may provide an argument specifying the type of UTR. Currently
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
359 the following types are recognized: utr5prime utr3prime for UTR on the
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
360 5' and 3' end of the CDS, respectively.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
361
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
362 Returns : An array of Bio::SeqFeature::Gene::UTR objects
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
363 representing the UTR regions or sites.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
364 Args : Optionally, either utr3prime, or utr5prime for the the type of UTR
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
365 feature.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
366
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
367
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
368 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
369
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
370 sub utrs {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
371 my ($self, $type) = @_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
372 return $self->get_feature_type('Bio::SeqFeature::Gene::UTR',$type);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
373
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
374 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
375
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
376 =head2 add_utr
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
377
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
378 Title : add_utr()
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
379 Usage : $transcript->add_utr($utrobj, 'utr3prime');
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
380 $transcript->add_utr($utrobj);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
381 Function: Add a UTR feature/site to this transcript.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
382
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
383 The second parameter is optional and denotes the type of the UTR
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
384 feature. Presently recognized types include 'utr5prime' and 'utr3prime'
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
385 for UTR on the 5' and 3' end of a gene, respectively.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
386
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
387 Calling this method is the same as calling
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
388 add_exon($utrobj, 'utr'.$type). In this sense a UTR object is a
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
389 special exon object, which is transcribed, not spliced out, but
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
390 not translated.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
391
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
392 Note that the object supplied should return FALSE for is_coding().
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
393 Otherwise cds() and friends will become confused.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
394
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
395 Returns :
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
396 Args : A Bio::SeqFeature::Gene::UTR implementing object.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
397
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
398
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
399 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
400
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
401 sub add_utr {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
402 my ($self, $fea, $type) = @_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
403 $self->_add($fea,'Bio::SeqFeature::Gene::UTR',$type);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
404 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
405
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
406 =head2 flush_utrs
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
407
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
408 Title : flush_utrs()
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
409 Usage : $transcript->flush_utrs();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
410 $transcript->flush_utrs('utr3prime');
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
411 Function: Remove all or a specific type of UTR features/sites from this
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
412 transcript.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
413
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
414 Cf. add_utr() for documentation about recognized types.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
415 Returns : a list of the removed features
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
416 Args : Optionally a string denoting the type of UTR feature.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
417
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
418
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
419 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
420
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
421 sub flush_utrs {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
422 my ($self, $type) = @_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
423 return $self->_flush('Bio::SeqFeature::Gene::UTR',$type);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
424 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
425
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
426 =head2 sub_SeqFeature
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
427
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
428 Title : sub_SeqFeature
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
429 Usage : @feats = $transcript->sub_SeqFeature();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
430 Function: Returns an array of all subfeatures.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
431
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
432 This method is defined in Bio::SeqFeatureI. We override this here
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
433 to include the exon etc features.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
434
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
435 Returns : An array Bio::SeqFeatureI implementing objects.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
436 Args : none
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
437
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
438
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
439 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
440
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
441 sub sub_SeqFeature {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
442 my ($self) = @_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
443 my @feas;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
444
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
445 # get what the parent already has
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
446 @feas = $self->SUPER::sub_SeqFeature();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
447 # add the features we have in addition
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
448 push(@feas, $self->exons()); # this includes UTR features
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
449 push(@feas, $self->promoters());
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
450 push(@feas, $self->poly_A_site()) if($self->poly_A_site());
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
451 return @feas;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
452 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
453
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
454 =head2 flush_sub_SeqFeature
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
455
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
456 Title : flush_sub_SeqFeature
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
457 Usage : $transcript->flush_sub_SeqFeature();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
458 $transcript->flush_sub_SeqFeature(1);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
459 Function: Removes all subfeatures.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
460
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
461 This method is overridden from Bio::SeqFeature::Generic to flush
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
462 all additional subfeatures like exons, promoters, etc., which is
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
463 almost certainly not what you want. To remove only features added
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
464 through $transcript->add_sub_SeqFeature($feature) pass any
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
465 argument evaluating to TRUE.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
466
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
467 Example :
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
468 Returns : none
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
469 Args : Optionally, an argument evaluating to TRUE will suppress flushing
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
470 of all transcript-specific subfeatures (exons etc.).
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
471
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
472
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
473 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
474
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
475 sub flush_sub_SeqFeature {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
476 my ($self,$fea_only) = @_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
477
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
478 $self->SUPER::flush_sub_SeqFeature();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
479 if(! $fea_only) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
480 $self->flush_promoters();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
481 $self->flush_exons();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
482 $self->flush_utrs();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
483 $self->poly_A_site(0);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
484 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
485 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
486
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
487
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
488 =head2 cds
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
489
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
490 Title : cds
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
491 Usage : $seq = $transcript->cds();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
492 Function: Returns the CDS (coding sequence) as defined by the exons
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
493 of this transcript and the attached sequence.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
494
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
495 If no sequence is attached this method will return undef.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
496
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
497 Note that the implementation provided here returns a
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
498 concatenation of all coding exons, thereby assuming that
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
499 exons do not overlap.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
500
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
501 Note also that you cannot set the CDS via this method. Set
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
502 a single CDS feature as a single exon, or derive your own
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
503 class if you want to store a predicted CDS.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
504
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
505 Example :
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
506 Returns : A Bio::PrimarySeqI implementing object.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
507 Args :
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
508
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
509 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
510
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
511 sub cds {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
512 my ($self) = @_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
513 my @exons = $self->exons_ordered(); #this is always sorted properly according to strand
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
514 my $strand;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
515
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
516 return undef unless(@exons);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
517 # record strand (a minus-strand transcript must have the exons sorted in
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
518 # reverse order)
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
519 foreach my $exon (@exons) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
520 if(defined($exon->strand()) && (! $strand)) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
521 $strand = $exon->strand();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
522 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
523 if($exon->strand() && (($exon->strand() * $strand) < 0)) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
524 $self->throw("Transcript mixes coding exons on plus and minus ".
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
525 "strand. This makes no sense.");
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
526 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
527 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
528 my $cds = $self->_make_cds(@exons);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
529 return undef unless $cds;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
530 return Bio::PrimarySeq->new('-id' => $self->seq_id(),
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
531 '-seq' => $cds,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
532 '-alphabet' => "dna");
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
533 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
534
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
535 =head2 protein
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
536
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
537 Title : protein()
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
538 Usage : $protein = $transcript->protein();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
539 Function: Get the protein encoded by the transcript as a sequence object.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
540
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
541 The implementation provided here simply calls translate() on the
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
542 object returned by cds().
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
543
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
544 Returns : A Bio::PrimarySeqI implementing object.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
545 Args :
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
546
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
547
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
548 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
549
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
550 sub protein {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
551 my ($self) = @_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
552 my $seq;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
553
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
554 $seq = $self->cds();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
555 return $seq->translate() if $seq;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
556 return undef;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
557 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
558
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
559 =head2 mrna
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
560
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
561 Title : mrna()
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
562 Usage : $mrna = $transcript->mrna();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
563 Function: Get the mRNA of the transcript as a sequence object.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
564
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
565 The difference to cds() is that the sequence object returned by
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
566 this methods will also include UTR and the poly-adenylation site,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
567 but not promoter sequence (TBD).
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
568
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
569 HL: do we really need this method?
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
570
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
571 Returns : A Bio::PrimarySeqI implementing object.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
572 Args :
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
573
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
574
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
575 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
576
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
577 sub mrna {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
578 my ($self) = @_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
579 my ($seq, $mrna, $elem);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
580
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
581 # get the coding part
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
582 $seq = $self->cds();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
583 if(! $seq) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
584 $seq = Bio::PrimarySeq->new('-id' => $self->seq_id(),
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
585 '-alphabet' => "rna",
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
586 '-seq' => "");
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
587 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
588 # get and add UTR sequences
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
589 $mrna = "";
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
590 foreach $elem ($self->utrs('utr5prime')) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
591 $mrna .= $elem->seq()->seq();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
592 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
593 $seq->seq($mrna . $seq->seq());
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
594 $mrna = "";
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
595 foreach $elem ($self->utrs('utr3prime')) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
596 $mrna .= $elem->seq()->seq();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
597 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
598 $seq->seq($seq->seq() . $mrna);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
599 if($self->poly_A_site()) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
600 $seq->seq($seq->seq() . $self->poly_A_site()->seq()->seq());
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
601 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
602 return undef if($seq->length() == 0);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
603 return $seq;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
604 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
605
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
606 sub _get_typed_keys {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
607 my ($self, $keyprefix, $type) = @_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
608 my @keys = ();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
609 my @feas = ();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
610
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
611 # make case-insensitive
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
612 $type = ($type ? lc($type) : "");
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
613 # pull out all feature types that exist and match
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
614 @keys = grep { /^_$keyprefix$type/i; } (keys(%{$self}));
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
615 return @keys;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
616 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
617
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
618 sub _make_cds {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
619 my ($self,@exons) = @_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
620 my $cds = "";
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
621
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
622 foreach my $exon (@exons) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
623 next if((! defined($exon->seq())) || (! $exon->is_coding()));
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
624 my $phase = length($cds) % 3;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
625 # let's check the simple case
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
626 if((! defined($exon->frame())) || ($phase == $exon->frame())) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
627 # this one fits exactly, or frame of the exon is undefined (should
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
628 # we warn about that?); we bypass the $exon->cds() here (hmm,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
629 # not very clean style, but I don't see where this screws up)
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
630 $cds .= $exon->seq()->seq();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
631 } else {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
632 # this one is probably from exon shuffling and needs some work
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
633 my $seq = $exon->cds(); # now $seq is guaranteed to be in frame 0
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
634 next if(! $seq);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
635 $seq = $seq->seq();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
636 # adjustment needed?
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
637 if($phase > 0) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
638 # how many Ns can we chop off the piece to be added?
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
639 my $n_crop = 0;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
640 if($seq =~ /^(n+)/i) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
641 $n_crop = length($1);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
642 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
643 if($n_crop >= $phase) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
644 # chop off to match the phase
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
645 $seq = substr($seq, $phase);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
646 } else {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
647 # fill in Ns
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
648 $seq = ("n" x (3-$phase)) . $seq;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
649 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
650 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
651 $cds .= $seq;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
652 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
653 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
654 return $cds;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
655 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
656
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
657 =head2 features
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
658
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
659 Title : features
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
660 Usage : my @features=$transcript->features;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
661 Function: returns all the features associated with this transcript
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
662 Returns : a list of SeqFeatureI implementing objects
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
663 Args : none
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
664
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
665
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
666 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
667
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
668
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
669 sub features {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
670 my ($self) = shift;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
671 $self->{'_features'} = [] unless defined $self->{'_features'};
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
672 return @{$self->{'_features'}};
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
673 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
674
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
675 =head2 features_ordered
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
676
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
677 Title : features_ordered
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
678 Usage : my @features=$transcript->features_ordered;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
679 Function: returns all the features associated with this transcript,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
680 in order by feature start, according to strand
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
681 Returns : a list of SeqFeatureI implementing objects
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
682 Args : none
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
683
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
684
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
685 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
686
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
687 sub features_ordered{
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
688 my ($self) = @_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
689 return $self->_stranded_sort(@{$self->{'_features'}});
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
690 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
691
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
692
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
693 sub get_unordered_feature_type{
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
694 my ($self, $type, $pri)=@_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
695 my @list;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
696 foreach ($self->features) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
697 if ($_->isa($type)) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
698 if ($pri && $_->primary_tag !~ /$pri/i) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
699 next;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
700 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
701 push @list,$_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
702 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
703 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
704 return @list;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
705
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
706 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
707
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
708 sub get_feature_type {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
709 my ($self)=shift;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
710 return $self->_stranded_sort($self->get_unordered_feature_type(@_));
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
711 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
712
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
713 #This was fixed by Gene Cutler - the indexing on the list being reversed
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
714 #fixed a bad bug. Thanks Gene!
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
715 sub _flush {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
716 my ($self, $type, $pri)=@_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
717 my @list=$self->features;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
718 my @cut;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
719 for (reverse (0..$#list)) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
720 if ($list[$_]->isa($type)) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
721 if ($pri && $list[$_]->primary_tag !~ /$pri/i) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
722 next;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
723 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
724 push @cut, splice @list, $_, 1; #remove the element of $type from @list
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
725 #and return each of them in @cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
726 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
727 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
728 $self->{'_features'}=\@list;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
729 return reverse @cut;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
730 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
731
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
732 sub _add {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
733 my ($self, $fea, $type)=@_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
734 require Bio::SeqFeature::Gene::Promoter;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
735 require Bio::SeqFeature::Gene::UTR;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
736 require Bio::SeqFeature::Gene::Exon;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
737 require Bio::SeqFeature::Gene::Intron;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
738 require Bio::SeqFeature::Gene::Poly_A_site;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
739
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
740 if(! $fea->isa('Bio::SeqFeatureI') ) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
741 $self->throw("$fea does not implement Bio::SeqFeatureI");
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
742 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
743 if(! $fea->isa($type) ) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
744 $fea=$self->_new_of_type($fea,$type);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
745 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
746 if (! $self->strand) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
747 $self->strand($fea->strand);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
748 } else {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
749 if ($self->strand * $fea->strand == -1) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
750 $self->throw("$fea is on opposite strand from $self");
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
751 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
752 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
753
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
754 $self->_expand_region($fea);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
755 if(defined($self->entire_seq()) && (! defined($fea->entire_seq())) &&
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
756 $fea->can('attach_seq')) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
757 $fea->attach_seq($self->entire_seq());
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
758 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
759 if (defined $self->parent) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
760 $self->parent->_expand_region($fea);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
761 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
762 push(@{$self->{'_features'}}, $fea);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
763 1;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
764 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
765
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
766 sub _stranded_sort {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
767 my ($self,@list)=@_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
768 my $strand;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
769 foreach my $fea (@list) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
770 if($fea->strand()) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
771 # defined and != 0
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
772 $strand = $fea->strand() if(! $strand);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
773 if(($fea->strand() * $strand) < 0) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
774 $strand = undef;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
775 last;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
776 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
777 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
778 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
779 if (defined $strand && $strand == - 1) { #reverse strand
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
780 return map { $_->[0] } sort {$b->[1] <=> $a->[1]} map { [$_, $_->start] } @list;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
781 } else { #undef or forward strand
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
782 return map { $_->[0] } sort {$a->[1] <=> $b->[1]} map { [$_, $_->start] } @list;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
783 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
784 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
785
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
786 sub _new_of_type {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
787 my ($self, $fea, $type, $pri)= @_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
788 my $primary;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
789 if ($pri) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
790 $primary = $pri; #can set new primary tag if desired
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
791 } else {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
792 ($primary) = $type =~ /.*::(.+)/; #or else primary is just end of type string
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
793 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
794 bless $fea,$type;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
795 $fea->primary_tag($primary);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
796 return $fea;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
797 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
798
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
799 1;