annotate variant_effect_predictor/Bio/Biblio/IO.pm @ 0:2bc9b66ada89 draft default tip

Uploaded
author mahtabm
date Thu, 11 Apr 2013 06:29:17 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
1 # $Id: IO.pm,v 1.8 2002/10/22 07:45:11 lapp Exp $
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
2 #
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
3 # BioPerl module for Bio::Biblio::IO
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
4 #
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
5 # Cared for by Martin Senger <senger@ebi.ac.uk>
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
6 # For copyright and disclaimer see below.
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
7
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
8 # POD documentation - main docs before the code
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
9
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
10 =head1 NAME
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
11
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
12 Bio::Biblio::IO - Handling the bibliographic references
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
13
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
14 =head1 SYNOPSIS
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
15
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
16 use Bio::Biblio::IO;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
17
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
18 # getting citations from a file
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
19 $in = Bio::Biblio::IO->new ('-file' => 'myfile.xml' ,
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
20 '-format' => 'medlinexml');
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
21 --- OR ---
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
22
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
23 # getting citations from a string
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
24 $in = Bio::Biblio::IO->new ('-data' => '<MedlineCitation>...</MedlineCitation>' ,
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
25 '-format' => 'medlinexml');
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
26 --- OR ---
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
27
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
28 # getting citations from a string if IO::String is installed
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
29 use IO::String;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
30 $in = Bio::Biblio::IO->new ('-fh' => IO::String->new ($citation),
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
31 '-format' => 'medlinexml');
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
32
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
33 $in = Bio::Biblio::IO->new(-fh => $io_handle , '-format' => 'medlinexml');
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
34
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
35 --- OR ---
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
36
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
37 # getting citations from any IO handler
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
38 $in = Bio::Biblio::IO->new('-fh' => $io_handle ,
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
39 '-format' => 'medlinexml');
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
40
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
41
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
42 # now, having $in, we can read all citations
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
43 while ( my $citation = $in->next_bibref() ) {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
44 &do_something_with_citation ($citation);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
45 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
46
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
47 --- OR ---
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
48
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
49 # again reading all citations but now a callback defined in your
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
50 # code is used (note that the reading starts already when new()
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
51 # is called)
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
52 $io = new Bio::Biblio::IO ('-format' => 'medlinexml',
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
53 '-file' => $testfile,
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
54 '-callback' => \&callback);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
55 sub callback {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
56 my $citation = shift;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
57 print $citation->{'_identifier'} . "\n";
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
58 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
59
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
60 Now, to actually get a citation in an XML format,
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
61 use I<Bio::Biblio> module which returns an XML string:
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
62
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
63 use Bio::Biblio;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
64 my $xml = new Bio::Biblio->get_by_id ('94033980');
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
65 my $reader = Bio::Biblio::IO->new ('-data' => $xml,
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
66 '-format' => 'medlinexml');
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
67
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
68 while (my $citation = $reader->next_bibref()) {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
69 ... do something here with $citation
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
70 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
71
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
72 And, finally, the resulting citation can be received in different
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
73 output formats:
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
74
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
75 $io = new Bio::Biblio::IO ('-format' => 'medlinexml',
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
76 '-result' => 'raw');
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
77 --- OR ---
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
78
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
79 $io = new Bio::Biblio::IO ('-format' => 'medlinexml',
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
80 '-result' => 'medline2ref');
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
81
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
82 --- OR ---
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
83
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
84 $io = new Bio::Biblio::IO ('-format' => 'pubmedxml',
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
85 '-result' => 'pubmed2ref');
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
86
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
87 =head1 DESCRIPTION
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
88
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
89 Bio::Biblio::IO is a handler module for accessing bibliographic
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
90 citations. The citations can be in different formats - assuming that
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
91 there is a corresponding module knowing that format in Bio::Biblio::IO
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
92 directory (e.g. Bio::Biblio::IO::medlinexml). The format (and the
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
93 module name) is given by the argument I<-format>.
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
94
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
95 Once an instance of C<Bio::Biblio::IO> class is available, the
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
96 citations can be read by calling repeatedly method I<next_bibref>:
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
97
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
98 while (my $citation = $reader->next_bibref()) {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
99 ... do something here with $citation
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
100 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
101
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
102 However, this may imply that all citations were already read into the
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
103 memory. If you expect a huge amount of citations to be read, you may
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
104 choose a I<callback> option. Your subroutine is specified in the
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
105 C<new()> method and is called every time a new citation is available
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
106 (see an example above in SYNOPSIS).
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
107
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
108 The citations returned by I<next_bibref> or given to your callback
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
109 routine can be of different formats depending on the argument
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
110 I<-result>. One result type is I<raw> and it is represented by a
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
111 simple, not blessed hash table:
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
112
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
113 $io = new Bio::Biblio::IO ('-result' => 'raw');
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
114
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
115 What other result formats are available depends on the module that
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
116 reads the citations in the first place. At the moment, the following
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
117 ones are available:
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
118
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
119 $io = new Bio::Biblio::IO ('-result' => 'medline2ref');
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
120
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
121 This is a default result format for reading citations by the
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
122 I<medlinexml> module. The C<medlinexml> module is again the default
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
123 one. Which means that you can almost omit arguments (you still need to
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
124 say where the citations come from):
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
125
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
126 $io = new Bio::Biblio::IO ('-file' => 'data/medline_data.xml');
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
127
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
128 Another result format available is for PUBMED citations (which is a
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
129 super-set of the MEDLINE citations having a few more tags):
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
130
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
131 $io = new Bio::Biblio::IO ('-format' => 'pubmedxml',
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
132 '-result' => 'pubmed2ref',
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
133 '-data' => $citation);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
134
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
135 Or, because C<pubmed2ref> is a default one for PUBMED citations, you can say just:
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
136
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
137 $io = new Bio::Biblio::IO ('-format' => 'pubmedxml',
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
138 '-data' => $citation);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
139
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
140 Both C<medline2ref> and C<pubmed2ref> results are objects defined in
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
141 the directory C<Bio::Biblio>.
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
142
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
143 =head1 SEE ALSO
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
144
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
145 =over
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
146
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
147 =item *
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
148
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
149 An example script I<examples/biblio.pl>. It has many options and its
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
150 own help. The relevant options to this IO module are I<-f>
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
151 (specifying what file to read) and I<-O> (specifying what result
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
152 format to achieve).
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
153
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
154 =item *
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
155
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
156 OpenBQS home page: http://industry.ebi.ac.uk/openBQS
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
157
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
158 =item *
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
159
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
160 Comments to the Perl client: http://industry.ebi.ac.uk/openBQS/Client_perl.html
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
161
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
162 =back
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
163
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
164 =head1 FEEDBACK
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
165
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
166 =head2 Mailing Lists
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
167
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
168 User feedback is an integral part of the evolution of this
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
169 and other Bioperl modules. Send your comments and suggestions preferably
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
170 to one of the Bioperl mailing lists.
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
171 Your participation is much appreciated.
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
172
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
173 bioperl-l@bioperl.org - General discussion
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
174 http://bioperl.org/MailList.shtml - About the mailing lists
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
175
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
176 =head2 Reporting Bugs
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
177
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
178 Report bugs to the Bioperl bug tracking system to help us keep track
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
179 of the bugs and their resolution.
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
180 Bug reports can be submitted via email or the web:
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
181
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
182 bioperl-bugs@bioperl.org
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
183 http://bugzilla.bioperl.org/
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
184
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
185 =head1 AUTHOR
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
186
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
187 Martin Senger (senger@ebi.ac.uk)
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
188
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
189 =head1 COPYRIGHT
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
190
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
191 Copyright (c) 2002 European Bioinformatics Institute. All Rights Reserved.
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
192
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
193 This module is free software; you can redistribute it and/or modify
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
194 it under the same terms as Perl itself.
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
195
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
196 =head1 DISCLAIMER
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
197
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
198 This software is provided "as is" without warranty of any kind.
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
199
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
200 =head1 APPENDIX
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
201
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
202 The rest of the documentation details each of the object
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
203 methods. Internal methods are preceded with a _
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
204
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
205 =cut
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
206
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
207
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
208 # Let the code begin...
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
209
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
210 package Bio::Biblio::IO;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
211
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
212 use strict;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
213 use vars qw(@ISA);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
214
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
215 use Bio::Root::Root;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
216 use Bio::Root::IO;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
217 use Symbol();
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
218
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
219 @ISA = qw(Bio::Root::Root Bio::Root::IO);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
220
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
221 my $entry = 0;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
222
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
223 sub new {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
224 my ($caller, @args) = @_;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
225 my $class = ref ($caller) || $caller;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
226
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
227 # if $caller is an object, or if it is an underlying
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
228 # 'real-work-doing' class (e.g. Bio::Biblio::IO::medlinexml) then
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
229 # we want to call SUPER to create and bless an object
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
230 if( $class =~ /Bio::Biblio::IO::(\S+)/ ) {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
231 my ($self) = $class->SUPER::new (@args);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
232 $self->_initialize (@args);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
233 return $self;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
234
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
235 # this is called only the first time when somebody calls: 'new
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
236 # Bio::Biblio::IO (...)', and it actually loads a 'real-work-doing'
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
237 # module and calls this new() method again (unless the loaded
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
238 # module has its own new() method)
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
239 } else {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
240 my %param = @args;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
241 @param{ map { lc $_ } keys %param } = values %param; # lowercase keys
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
242 my $format = $param{'-format'} ||
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
243 $class->_guess_format( $param{-file} || $ARGV[0] ) ||
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
244 'medlinexml';
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
245 $format = "\L$format"; # normalize capitalization to lower case
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
246
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
247 # load module with the real implementation - as defined in $format
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
248 return undef unless (&_load_format_module ($format));
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
249
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
250 # this will call this same method new() - but rather its
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
251 # upper (object) branch
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
252 return "Bio::Biblio::IO::$format"->new(@args);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
253 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
254 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
255
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
256 sub newFh {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
257 my $class = shift;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
258 return unless my $self = $class->new(@_);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
259 return $self->fh;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
260 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
261
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
262
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
263 sub fh {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
264 my $self = shift;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
265 my $class = ref($self) || $self;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
266 my $s = Symbol::gensym;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
267 tie $$s,$class,$self;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
268 return $s;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
269 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
270
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
271 # _initialize is chained for all Bio::Biblio::IO classes
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
272
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
273 sub _initialize {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
274 my ($self, @args) = @_;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
275 # initialize the IO part
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
276 $self->_initialize_io (@args);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
277 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
278
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
279 =head2 next_bibref
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
280
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
281 Usage : $citation = $stream->next_bibref
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
282 Function: Reads the next citation object from the stream and returns it.
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
283 Returns : a Bio::Biblio::Ref citation object, or something else
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
284 (depending on the '-result' argument given in the 'new()'
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
285 method).
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
286 Args : none
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
287
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
288 =cut
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
289
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
290 sub next_bibref {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
291 my ($self) = shift;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
292 $self->throw ("Sorry, you cannot read from a generic Bio::Biblio::IO object.");
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
293 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
294
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
295 # -----------------------------------------------------------------------------
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
296
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
297 =head2 _load_format_module
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
298
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
299 Usage : $class->_load_format_module ($format)
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
300 Returns : 1 on success, undef on failure
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
301 Args : 'format' should contain the last part of the
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
302 name of a module that does the real implementation
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
303
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
304 It does (in run-time) a similar thing as
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
305
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
306 require Bio::Biblio::IO::$format
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
307
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
308 It throws an exception if it fails to find and load the module
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
309 (for example, because of the compilation errors in the module).
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
310
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
311 =cut
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
312
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
313 sub _load_format_module {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
314 my ($format) = @_;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
315 my ($module, $load, $m);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
316
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
317 $module = "_<Bio/Biblio/IO/$format.pm";
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
318 $load = "Bio/Biblio/IO/$format.pm";
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
319
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
320 return 1 if $main::{$module};
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
321 eval {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
322 require $load;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
323 };
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
324 if ( $@ ) {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
325 Bio::Root::Root->throw (<<END);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
326 $load: $format cannot be found or loaded
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
327 Exception $@
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
328 For more information about the Biblio system please see the Bio::Biblio::IO docs.
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
329 END
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
330 ;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
331 return;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
332 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
333 return 1;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
334 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
335
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
336 =head2 _guess_format
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
337
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
338 Usage : $class->_guess_format ($filename)
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
339 Returns : string with a guessed format of the input data (e.g. 'medlinexml')
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
340 Args : a file name whose extension can help to guess its format
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
341
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
342 It makes an expert guess what kind of data are in the given file
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
343 (but be prepared that $filename may be empty).
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
344
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
345 =cut
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
346
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
347 sub _guess_format {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
348 my $class = shift;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
349 return unless $_ = shift;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
350 return 'medlinexml' if (/\.(xml|medlinexml)$/i);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
351 return;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
352 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
353
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
354 sub DESTROY {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
355 my $self = shift;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
356
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
357 $self->close();
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
358 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
359
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
360 sub TIEHANDLE {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
361 my ($class,$val) = @_;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
362 return bless {'biblio' => $val}, $class;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
363 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
364
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
365 sub READLINE {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
366 my $self = shift;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
367 return $self->{'biblio'}->next_bibref() unless wantarray;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
368 my (@list, $obj);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
369 push @list, $obj while $obj = $self->{'biblio'}->next_bibref();
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
370 return @list;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
371 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
372
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
373 1;