annotate variant_effect_predictor/Bio/EnsEMBL/DBSQL/ProteinAlignFeatureAdaptor.pm @ 3:d30fa12e4cc5 default tip

Merge heads 2:a5976b2dce6f and 1:09613ce8151e which were created as a result of a recently fixed bug.
author devteam <devteam@galaxyproject.org>
date Mon, 13 Jan 2014 10:38:30 -0500
parents 1f6dce3d34e0
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
1 =head1 LICENSE
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
2
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
3 Copyright (c) 1999-2012 The European Bioinformatics Institute and
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
4 Genome Research Limited. All rights reserved.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
5
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
6 This software is distributed under a modified Apache license.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
7 For license details, please see
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
8
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
9 http://www.ensembl.org/info/about/code_licence.html
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
10
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
11 =head1 CONTACT
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
12
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
13 Please email comments or questions to the public Ensembl
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
14 developers list at <dev@ensembl.org>.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
15
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
16 Questions may also be sent to the Ensembl help desk at
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
17 <helpdesk@ensembl.org>.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
18
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
19 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
20
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
21 =head1 NAME
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
22
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
23 Bio::EnsEMBL::DBSQL::ProteinAlignFeatureAdaptor -
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
24 Adaptor for ProteinAlignFeatures
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
25
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
26 =head1 SYNOPSIS
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
27
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
28 $pafa =
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
29 $registry->get_adaptor( 'Human', 'Core', 'ProteinAlignFeature' );
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
30
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
31 my @features = @{ $pafa->fetch_all_by_Slice($slice) };
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
32
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
33 $pafa->store(@features);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
34
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
35 =head1 METHODS
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
36
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
37 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
38
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
39
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
40 package Bio::EnsEMBL::DBSQL::ProteinAlignFeatureAdaptor;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
41 use vars qw(@ISA);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
42 use strict;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
43
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
44 use Bio::EnsEMBL::DBSQL::BaseAlignFeatureAdaptor;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
45 use Bio::EnsEMBL::DnaPepAlignFeature;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
46 use Bio::EnsEMBL::Utils::Exception qw(throw warning);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
47 @ISA = qw(Bio::EnsEMBL::DBSQL::BaseAlignFeatureAdaptor);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
48
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
49
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
50 =head2 store
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
51
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
52 Arg [1] : list of Bio::EnsEMBL::DnaPepAlignFeature @feats
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
53 Example : $protein_align_feature_adaptor->store(@feats);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
54 Description: stores a list of ProteinAlignFeatures in the database
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
55 Returntype : none
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
56 Exceptions : throw if any of the provided features cannot be stored
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
57 which may occur if:
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
58 * The feature does not have an associated Slice
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
59 * The feature does not have an associated analysis
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
60 * The Slice the feature is associated with is on a seq_region
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
61 unknown to this database
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
62 A warning is given if:
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
63 * The feature has already been stored in this db
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
64 Caller : Pipeline
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
65 Status : Stable
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
66
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
67 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
68
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
69
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
70 sub store{
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
71 my ($self, @feats) = @_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
72
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
73 throw("Must call store with features") if( scalar(@feats) == 0 );
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
74
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
75 my @tabs = $self->_tables;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
76 my ($tablename) = @{$tabs[0]};
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
77
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
78 my $db = $self->db();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
79 my $slice_adaptor = $db->get_SliceAdaptor();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
80 my $analysis_adaptor = $db->get_AnalysisAdaptor();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
81
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
82 my $sth = $self->prepare(
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
83 "INSERT INTO $tablename (seq_region_id, seq_region_start, seq_region_end,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
84 seq_region_strand, hit_start, hit_end,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
85 hit_name, cigar_line,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
86 analysis_id, score, evalue, perc_ident, external_db_id, hcoverage)
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
87 VALUES (?,?,?,?,?,?,?,?,?,?, ?, ?, ?, ?)");
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
88
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
89 FEATURE: foreach my $feat ( @feats ) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
90 if( !ref $feat || !$feat->isa("Bio::EnsEMBL::DnaPepAlignFeature") ) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
91 throw("feature must be a Bio::EnsEMBL::DnaPepAlignFeature,"
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
92 . " not a [".ref($feat)."].");
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
93 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
94
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
95 if($feat->is_stored($db)) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
96 warning("PepDnaAlignFeature [".$feat->dbID."] is already stored" .
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
97 " in this database.");
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
98 next FEATURE;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
99 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
100
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
101 #sanity check the hstart and hend
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
102 my $hstart = $feat->hstart();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
103 my $hend = $feat->hend();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
104 $self->_check_start_end_strand($hstart,$hend,1);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
105
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
106 my $cigar_string = $feat->cigar_string();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
107 if(!$cigar_string) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
108 $cigar_string = $feat->length() . 'M';
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
109 warning("DnaPepAlignFeature does not define a cigar_string.\n" .
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
110 "Assuming ungapped block with cigar_string=$cigar_string\n");
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
111 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
112
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
113 my $hseqname = $feat->hseqname();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
114 if(!$hseqname) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
115 throw("DnaPepAlignFeature must define an hseqname.");
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
116 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
117
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
118 if(!defined($feat->analysis)) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
119 throw("An analysis must be attached to the features to be stored.");
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
120 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
121
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
122 #store the analysis if it has not been stored yet
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
123 if(!$feat->analysis->is_stored($db)) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
124 $analysis_adaptor->store($feat->analysis());
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
125 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
126
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
127 my $slice = $feat->slice();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
128 if(!defined($slice) || !($slice->isa("Bio::EnsEMBL::Slice") or $slice->isa('Bio::EnsEMBL::LRGSlice')) ) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
129 throw("A slice must be attached to the features to be stored.");
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
130 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
131
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
132 my $original = $feat;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
133 my $seq_region_id;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
134 ($feat, $seq_region_id) = $self->_pre_store($feat);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
135
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
136 $sth->bind_param(1,$seq_region_id,SQL_INTEGER);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
137 $sth->bind_param(2,$feat->start,SQL_INTEGER);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
138 $sth->bind_param(3,$feat->end,SQL_INTEGER);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
139 $sth->bind_param(4,$feat->strand,SQL_TINYINT);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
140 $sth->bind_param(5,$feat->hstart,SQL_INTEGER);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
141 $sth->bind_param(6,$feat->hend,SQL_INTEGER);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
142 $sth->bind_param(7,$feat->hseqname,SQL_VARCHAR);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
143 $sth->bind_param(8,$feat->cigar_string,SQL_LONGVARCHAR);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
144 $sth->bind_param(9,$feat->analysis->dbID,SQL_INTEGER);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
145 $sth->bind_param(10,$feat->score,SQL_DOUBLE);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
146 $sth->bind_param(11,$feat->p_value,SQL_DOUBLE);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
147 $sth->bind_param(12,$feat->percent_id,SQL_REAL);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
148 $sth->bind_param(13,$feat->external_db_id,SQL_INTEGER);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
149 $sth->bind_param(14,$feat->hcoverage,SQL_DOUBLE);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
150
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
151 $sth->execute();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
152 $original->dbID($sth->{'mysql_insertid'});
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
153 $original->adaptor($self);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
154 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
155
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
156 $sth->finish();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
157 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
158
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
159
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
160 =head2 _objs_from_sth
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
161
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
162 Arg [1] : DBI statement handle $sth
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
163 an exectuted DBI statement handle generated by selecting
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
164 the columns specified by _columns() from the table specified
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
165 by _table()
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
166 Example : @dna_dna_align_feats = $self->_obj_from_hashref
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
167 Description: PROTECTED implementation of superclass abstract method.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
168 Creates DnaDnaAlignFeature objects from a DBI hashref
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
169 Returntype : listref of Bio::EnsEMBL::ProteinAlignFeatures
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
170 Exceptions : none
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
171 Caller : Bio::EnsEMBL::BaseFeatureAdaptor::generic_fetch
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
172 Status : Stable
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
173
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
174 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
175
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
176 sub _objs_from_sth {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
177 my ($self, $sth, $mapper, $dest_slice) = @_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
178
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
179 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
180 # This code is ugly because an attempt has been made to remove as many
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
181 # function calls as possible for speed purposes. Thus many caches and
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
182 # a fair bit of gymnastics is used.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
183 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
184
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
185 my $sa = $self->db()->get_SliceAdaptor();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
186 my $aa = $self->db->get_AnalysisAdaptor();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
187
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
188 my @features;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
189 my %analysis_hash;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
190 my %slice_hash;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
191 my %sr_name_hash;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
192 my %sr_cs_hash;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
193
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
194 my ($protein_align_feature_id, $seq_region_id, $seq_region_start,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
195 $seq_region_end, $analysis_id, $seq_region_strand, $hit_start,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
196 $hit_end, $hit_name, $cigar_line, $evalue, $perc_ident, $score,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
197 $external_db_id, $hcoverage, $external_db_name, $external_display_db_name );
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
198
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
199 $sth->bind_columns(\$protein_align_feature_id, \$seq_region_id,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
200 \$seq_region_start,\$seq_region_end, \$analysis_id,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
201 \$seq_region_strand, \$hit_start,\$hit_end, \$hit_name,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
202 \$cigar_line, \$evalue, \$perc_ident, \$score,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
203 \$external_db_id, \$hcoverage, \$external_db_name, \$external_display_db_name );
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
204
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
205 my $asm_cs;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
206 my $cmp_cs;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
207 my $asm_cs_vers;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
208 my $asm_cs_name;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
209 my $cmp_cs_vers;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
210 my $cmp_cs_name;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
211 if($mapper) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
212 $asm_cs = $mapper->assembled_CoordSystem();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
213 $cmp_cs = $mapper->component_CoordSystem();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
214 $asm_cs_name = $asm_cs->name();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
215 $asm_cs_vers = $asm_cs->version();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
216 $cmp_cs_name = $cmp_cs->name();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
217 $cmp_cs_vers = $cmp_cs->version();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
218 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
219
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
220 my $dest_slice_start;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
221 my $dest_slice_end;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
222 my $dest_slice_strand;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
223 my $dest_slice_length;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
224 my $dest_slice_sr_name;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
225 my $dest_slice_sr_id;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
226 if($dest_slice) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
227 $dest_slice_start = $dest_slice->start();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
228 $dest_slice_end = $dest_slice->end();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
229 $dest_slice_strand = $dest_slice->strand();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
230 $dest_slice_length = $dest_slice->length();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
231 $dest_slice_sr_name = $dest_slice->seq_region_name();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
232 $dest_slice_sr_id = $dest_slice->get_seq_region_id();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
233 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
234
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
235 FEATURE: while($sth->fetch()) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
236 #get the analysis object
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
237 my $analysis = $analysis_hash{$analysis_id} ||=
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
238 $aa->fetch_by_dbID($analysis_id);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
239
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
240 #get the slice object
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
241 my $slice = $slice_hash{"ID:".$seq_region_id};
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
242
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
243 if(!$slice) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
244 $slice = $sa->fetch_by_seq_region_id($seq_region_id);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
245 $slice_hash{"ID:".$seq_region_id} = $slice;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
246 $sr_name_hash{$seq_region_id} = $slice->seq_region_name();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
247 $sr_cs_hash{$seq_region_id} = $slice->coord_system();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
248 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
249
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
250 my $sr_name = $sr_name_hash{$seq_region_id};
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
251 my $sr_cs = $sr_cs_hash{$seq_region_id};
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
252 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
253 # remap the feature coordinates to another coord system
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
254 # if a mapper was provided
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
255 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
256 if($mapper) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
257
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
258 if (defined $dest_slice && $mapper->isa('Bio::EnsEMBL::ChainedAssemblyMapper') ) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
259 ( $seq_region_id, $seq_region_start,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
260 $seq_region_end, $seq_region_strand )
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
261 =
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
262 $mapper->map( $sr_name, $seq_region_start, $seq_region_end,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
263 $seq_region_strand, $sr_cs, 1, $dest_slice);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
264
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
265 } else {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
266
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
267 ( $seq_region_id, $seq_region_start,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
268 $seq_region_end, $seq_region_strand )
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
269 =
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
270 $mapper->fastmap( $sr_name, $seq_region_start, $seq_region_end,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
271 $seq_region_strand, $sr_cs );
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
272 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
273
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
274 #skip features that map to gaps or coord system boundaries
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
275 next FEATURE if(!defined($seq_region_id));
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
276
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
277 # #get a slice in the coord system we just mapped to
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
278 # if($asm_cs == $sr_cs || ($cmp_cs != $sr_cs && $asm_cs->equals($sr_cs))) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
279 $slice = $slice_hash{"ID:".$seq_region_id} ||=
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
280 $sa->fetch_by_seq_region_id($seq_region_id);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
281 # } else {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
282 # $slice = $slice_hash{"ID:".$seq_region_id} ||=
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
283 # $sa->fetch_by_seq_region_id($asm_cs_name, $sr_name, undef, undef, undef,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
284 # $asm_cs_vers);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
285 # }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
286 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
287
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
288 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
289 # If a destination slice was provided convert the coords
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
290 # If the dest_slice starts at 1 and is foward strand, nothing needs doing
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
291 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
292 if($dest_slice) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
293 if($dest_slice_start != 1 || $dest_slice_strand != 1) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
294 if($dest_slice_strand == 1) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
295 $seq_region_start = $seq_region_start - $dest_slice_start + 1;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
296 $seq_region_end = $seq_region_end - $dest_slice_start + 1;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
297 } else {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
298 my $tmp_seq_region_start = $seq_region_start;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
299 $seq_region_start = $dest_slice_end - $seq_region_end + 1;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
300 $seq_region_end = $dest_slice_end - $tmp_seq_region_start + 1;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
301 $seq_region_strand *= -1;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
302 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
303 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
304
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
305 #throw away features off the end of the requested slice
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
306 if($seq_region_end < 1 || $seq_region_start > $dest_slice_length ||
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
307 ( $dest_slice_sr_id ne $seq_region_id )) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
308 next FEATURE;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
309 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
310 $slice = $dest_slice;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
311 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
312
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
313 # Finally, create the new ProteinAlignFeature.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
314 push(
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
315 @features,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
316 $self->_create_feature_fast(
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
317 'Bio::EnsEMBL::DnaPepAlignFeature', {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
318 'slice' => $slice,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
319 'start' => $seq_region_start,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
320 'end' => $seq_region_end,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
321 'strand' => $seq_region_strand,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
322 'hseqname' => $hit_name,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
323 'hstart' => $hit_start,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
324 'hend' => $hit_end,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
325 'hstrand' => 1, # dna_pep_align features
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
326 # are always hstrand 1
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
327 'score' => $score,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
328 'p_value' => $evalue,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
329 'percent_id' => $perc_ident,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
330 'cigar_string' => $cigar_line,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
331 'analysis' => $analysis,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
332 'adaptor' => $self,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
333 'dbID' => $protein_align_feature_id,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
334 'external_db_id' => $external_db_id,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
335 'hcoverage' => $hcoverage,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
336 'dbname' => $external_db_name,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
337 'db_display_name' => $external_display_db_name
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
338 } ) );
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
339
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
340 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
341
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
342 return \@features;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
343 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
344
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
345
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
346
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
347 sub _tables {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
348 my $self = shift;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
349
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
350 return (['protein_align_feature', 'paf'], ['external_db','exdb']);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
351 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
352
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
353
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
354 sub _columns {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
355 my $self = shift;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
356
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
357 #warning _objs_from_hashref method depends on ordering of this list
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
358 return qw( paf.protein_align_feature_id
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
359 paf.seq_region_id
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
360 paf.seq_region_start
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
361 paf.seq_region_end
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
362 paf.analysis_id
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
363 paf.seq_region_strand
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
364 paf.hit_start
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
365 paf.hit_end
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
366 paf.hit_name
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
367 paf.cigar_line
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
368 paf.evalue
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
369 paf.perc_ident
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
370 paf.score
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
371 paf.external_db_id
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
372 paf.hcoverage
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
373 exdb.db_name
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
374 exdb.db_display_name);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
375 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
376
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
377 sub _left_join{
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
378 return (['external_db',"exdb.external_db_id = paf.external_db_id"]);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
379 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
380
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
381 =head2 list_dbIDs
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
382
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
383 Arg [1] : none
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
384 Example : @feature_ids = @{$protein_align_feature_adaptor->list_dbIDs()};
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
385 Description: Gets an array of internal ids for all protein align
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
386 features in the current db
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
387 Arg[1] : <optional> int. not 0 for the ids to be sorted by the seq_region.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
388 Returntype : listref of ints
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
389 Exceptions : none
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
390 Caller : ?
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
391 Status : Stable
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
392
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
393 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
394
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
395 sub list_dbIDs {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
396 my ($self,$ordered) = @_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
397
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
398 return $self->_list_dbIDs("protein_align_feature", undef, $ordered);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
399 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
400
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
401
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
402
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
403
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
404
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
405
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
406 1;