annotate variant_effect_predictor/Bio/DB/GenBank.pm @ 3:d30fa12e4cc5 default tip

Merge heads 2:a5976b2dce6f and 1:09613ce8151e which were created as a result of a recently fixed bug.
author devteam <devteam@galaxyproject.org>
date Mon, 13 Jan 2014 10:38:30 -0500
parents 1f6dce3d34e0
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
1 # $Id: GenBank.pm,v 1.47.2.2 2003/07/03 12:31:31 heikki Exp $
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
2 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
3 # BioPerl module for Bio::DB::GenBank
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
4 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
5 # Cared for by Aaron Mackey <amackey@virginia.edu>
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
6 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
7 # Copyright Aaron Mackey
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
8 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
9 # You may distribute this module under the same terms as perl itself
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
10 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
11 # POD documentation - main docs before the code
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
12 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
13 # Added LWP support - Jason Stajich 2000-11-6
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
14 # completely reworked by Jason Stajich 2000-12-8
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
15 # to use WebDBSeqI
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
16
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
17 # Added batch entrez back when determined that new entrez cgi will
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
18 # essentially work (there is a limit to the number of characters in a
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
19 # GET request so I am not sure how we can get around this). The NCBI
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
20 # Batch Entrez form has changed some and it does not support retrieval
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
21 # of text only data. Still should investigate POST-ing (tried and
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
22 # failed) a message to the entrez cgi to get around the GET
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
23 # limitations.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
24
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
25 =head1 NAME
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
26
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
27 Bio::DB::GenBank - Database object interface to GenBank
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
28
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
29 =head1 SYNOPSIS
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
30
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
31 use Bio::DB::GenBank;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
32 $gb = new Bio::DB::GenBank;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
33
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
34 $seq = $gb->get_Seq_by_id('MUSIGHBA1'); # Unique ID
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
35
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
36 # or ...
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
37
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
38 $seq = $gb->get_Seq_by_acc('J00522'); # Accession Number
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
39 $seq = $gb->get_Seq_by_version('J00522.1'); # Accession.version
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
40 $seq = $gb->get_Seq_by_gi('405830'); # GI Number
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
41
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
42 # get a stream via a query string
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
43 my $query = Bio::DB::Query::GenBank->new
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
44 (-query =>'Oryza sativa[Organism] AND EST',
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
45 -reldate => '30',
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
46 -db => 'nucleotide');
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
47 my $seqio = $gb->get_Stream_by_query($query);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
48
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
49 while( my $seq = $seqio->next_seq ) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
50 print "seq length is ", $seq->length,"\n";
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
51 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
52
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
53 # or ... best when downloading very large files, prevents
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
54 # keeping all of the file in memory
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
55
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
56 # also don't want features, just sequence so let's save bandwith
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
57 # and request Fasta sequence
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
58 $gb = new Bio::DB::GenBank(-retrievaltype => 'tempfile' ,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
59 -format => 'Fasta');
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
60 my $seqio = $gb->get_Stream_by_acc(['AC013798', 'AC021953'] );
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
61 while( my $clone = $seqio->next_seq ) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
62 print "cloneid is ", $clone->display_id, " ",
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
63 $clone->accession_number, "\n";
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
64 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
65 # note that get_Stream_by_version is not implemented
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
66
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
67 =head1 DESCRIPTION
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
68
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
69 Allows the dynamic retrieval of Sequence objects (Bio::Seq) from the
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
70 GenBank database at NCBI, via an Entrez query.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
71
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
72 WARNING: Please do NOT spam the Entrez web server with multiple
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
73 requests. NCBI offers Batch Entrez for this purpose.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
74
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
75 Note that when querying for GenBank accessions starting with 'NT_' you
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
76 will need to call $gb-E<gt>request_format('fasta') beforehand, because
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
77 in GenBank format (the default) the sequence part will be left out
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
78 (the reason is that NT contigs are rather annotation with references
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
79 to clones).
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
80
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
81 Some work has been done to automatically detect and retrieve whole NT_
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
82 clones when the data is in that format (NCBI RefSeq clones). More
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
83 testing and feedback from users is needed to achieve a good fit of
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
84 functionality and ease of use.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
85
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
86 =head1 FEEDBACK
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
87
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
88 =head2 Mailing Lists
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
89
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
90 User feedback is an integral part of the evolution of this and other
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
91 Bioperl modules. Send your comments and suggestions preferably to one
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
92 of the Bioperl mailing lists. Your participation is much appreciated.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
93
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
94 bioperl-l@bioperl.org - General discussion
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
95 http://bioperl.org/MailList.shtml - About the mailing lists
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
96
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
97 =head2 Reporting Bugs
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
98
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
99 Report bugs to the Bioperl bug tracking system to help us keep track
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
100 the bugs and their resolution. Bug reports can be submitted via email
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
101 or the web:
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
102
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
103 bioperl-bugs@bio.perl.org
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
104 http://bugzilla.bioperl.org/
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
105
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
106 =head1 AUTHOR - Aaron Mackey, Jason Stajich
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
107
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
108 Email amackey@virginia.edu
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
109 Email jason@bioperl.org
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
110
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
111 =head1 APPENDIX
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
112
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
113 The rest of the documentation details each of the
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
114 object methods. Internal methods are usually
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
115 preceded with a _
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
116
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
117 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
118
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
119 # Let the code begin...
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
120
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
121 package Bio::DB::GenBank;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
122 use strict;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
123 use vars qw(@ISA %PARAMSTRING $DEFAULTFORMAT $DEFAULTMODE);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
124 use Bio::DB::NCBIHelper;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
125
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
126 @ISA = qw(Bio::DB::NCBIHelper);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
127 BEGIN {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
128 $DEFAULTMODE = 'single';
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
129 $DEFAULTFORMAT = 'gp';
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
130 %PARAMSTRING = (
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
131 'batch' => { 'db' => 'nucleotide',
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
132 'usehistory' => 'n',
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
133 'tool' => 'bioperl',
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
134 'retmode' => 'text'},
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
135 'query' => { 'usehistory' => 'y',
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
136 'tool' => 'bioperl',
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
137 'retmode' => 'text'},
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
138 'gi' => { 'db' => 'nucleotide',
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
139 'usehistory' => 'n',
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
140 'tool' => 'bioperl',
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
141 'retmode' => 'text'},
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
142 'version' => { 'db' => 'nucleotide',
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
143 'usehistory' => 'n',
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
144 'tool' => 'bioperl',
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
145 'retmode' => 'text'},
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
146 'single' => { 'db' => 'nucleotide',
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
147 'usehistory' => 'n',
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
148 'tool' => 'bioperl',
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
149 'retmode' => 'text'},
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
150 );
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
151 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
152
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
153 # new is in NCBIHelper
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
154
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
155 # helper method to get db specific options
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
156
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
157 =head2 new
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
158
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
159 Title : new
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
160 Usage : $gb = Bio::DB::GenBank->new(@options)
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
161 Function: Creates a new genbank handle
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
162 Returns : New genbank handle
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
163 Args : -delay number of seconds to delay between fetches (3s)
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
164
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
165 NOTE: There are other options that are used internally. By NCBI policy, this
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
166 module introduces a 3s delay between fetches. If you are fetching multiple genbank
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
167 ids, it is a good idea to use get
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
168
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
169 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
170
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
171 =head2 get_params
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
172
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
173 Title : get_params
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
174 Usage : my %params = $self->get_params($mode)
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
175 Function: Returns key,value pairs to be passed to NCBI database
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
176 for either 'batch' or 'single' sequence retrieval method
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
177 Returns : a key,value pair hash
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
178 Args : 'single' or 'batch' mode for retrieval
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
179
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
180 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
181
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
182 sub get_params {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
183 my ($self, $mode) = @_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
184 return defined $PARAMSTRING{$mode} ?
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
185 %{$PARAMSTRING{$mode}} : %{$PARAMSTRING{$DEFAULTMODE}};
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
186 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
187
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
188 # from Bio::DB::WebDBSeqI from Bio::DB::RandomAccessI
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
189
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
190 =head1 Routines Bio::DB::WebDBSeqI from Bio::DB::RandomAccessI
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
191
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
192 =head2 get_Seq_by_id
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
193
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
194 Title : get_Seq_by_id
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
195 Usage : $seq = $db->get_Seq_by_id('ROA1_HUMAN')
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
196 Function: Gets a Bio::Seq object by its name
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
197 Returns : a Bio::Seq object
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
198 Args : the id (as a string) of a sequence
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
199 Throws : "id does not exist" exception
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
200
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
201 =head2 get_Seq_by_acc
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
202
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
203 Title : get_Seq_by_acc
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
204 Usage : $seq = $db->get_Seq_by_acc($acc);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
205 Function: Gets a Seq object by accession numbers
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
206 Returns : a Bio::Seq object
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
207 Args : the accession number as a string
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
208 Note : For GenBank, this just calls the same code for get_Seq_by_id()
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
209 Throws : "id does not exist" exception
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
210
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
211 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
212
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
213
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
214 sub get_Seq_by_acc {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
215 my ($self,$seqid) = @_;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
216 $self->SUPER::get_Seq_by_acc("gb|$seqid");
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
217 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
218
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
219 =head2 get_Seq_by_gi
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
220
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
221 Title : get_Seq_by_gi
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
222 Usage : $seq = $db->get_Seq_by_gi('405830');
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
223 Function: Gets a Bio::Seq object by gi number
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
224 Returns : A Bio::Seq object
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
225 Args : gi number (as a string)
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
226 Throws : "gi does not exist" exception
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
227
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
228 =head2 get_Seq_by_version
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
229
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
230 Title : get_Seq_by_version
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
231 Usage : $seq = $db->get_Seq_by_version('X77802.1');
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
232 Function: Gets a Bio::Seq object by sequence version
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
233 Returns : A Bio::Seq object
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
234 Args : accession.version (as a string)
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
235 Throws : "acc.version does not exist" exception
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
236
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
237 =head1 Routines implemented by Bio::DB::NCBIHelper
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
238
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
239 =head2 get_Stream_by_query
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
240
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
241 Title : get_Stream_by_query
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
242 Usage : $seq = $db->get_Stream_by_query($query);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
243 Function: Retrieves Seq objects from Entrez 'en masse', rather than one
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
244 at a time. For large numbers of sequences, this is far superior
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
245 than get_Stream_by_[id/acc]().
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
246 Example :
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
247 Returns : a Bio::SeqIO stream object
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
248 Args : $query : An Entrez query string or a
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
249 Bio::DB::Query::GenBank object. It is suggested that you
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
250 create a Bio::DB::Query::GenBank object and get the entry
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
251 count before you fetch a potentially large stream.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
252
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
253 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
254
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
255 =head2 get_Stream_by_id
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
256
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
257 Title : get_Stream_by_id
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
258 Usage : $stream = $db->get_Stream_by_id( [$uid1, $uid2] );
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
259 Function: Gets a series of Seq objects by unique identifiers
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
260 Returns : a Bio::SeqIO stream object
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
261 Args : $ref : a reference to an array of unique identifiers for
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
262 the desired sequence entries
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
263
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
264 =head2 get_Stream_by_acc
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
265
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
266 Title : get_Stream_by_acc
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
267 Usage : $seq = $db->get_Stream_by_acc([$acc1, $acc2]);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
268 Function: Gets a series of Seq objects by accession numbers
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
269 Returns : a Bio::SeqIO stream object
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
270 Args : $ref : a reference to an array of accession numbers for
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
271 the desired sequence entries
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
272 Note : For GenBank, this just calls the same code for get_Stream_by_id()
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
273
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
274 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
275
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
276 =head2 get_Stream_by_gi
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
277
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
278 Title : get_Stream_by_gi
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
279 Usage : $seq = $db->get_Seq_by_gi([$gi1, $gi2]);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
280 Function: Gets a series of Seq objects by gi numbers
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
281 Returns : a Bio::SeqIO stream object
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
282 Args : $ref : a reference to an array of gi numbers for
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
283 the desired sequence entries
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
284 Note : For GenBank, this just calls the same code for get_Stream_by_id()
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
285
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
286 =head2 get_Stream_by_batch
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
287
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
288 Title : get_Stream_by_batch
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
289 Usage : $seq = $db->get_Stream_by_batch($ref);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
290 Function: Retrieves Seq objects from Entrez 'en masse', rather than one
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
291 at a time.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
292 Example :
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
293 Returns : a Bio::SeqIO stream object
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
294 Args : $ref : either an array reference, a filename, or a filehandle
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
295 from which to get the list of unique ids/accession numbers.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
296
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
297 NOTE: This method is redundant and deprecated. Use get_Stream_by_id()
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
298 instead.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
299
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
300 =head2 get_request
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
301
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
302 Title : get_request
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
303 Usage : my $url = $self->get_request
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
304 Function: HTTP::Request
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
305 Returns :
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
306 Args : %qualifiers = a hash of qualifiers (ids, format, etc)
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
307
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
308 1;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
309 __END__