annotate variant_effect_predictor/Bio/Biblio/IO.pm @ 1:d6778b5d8382 draft default tip

Deleted selected files
author willmclaren
date Fri, 03 Aug 2012 10:05:43 -0400
parents 21066c0abaf5
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
1 # $Id: IO.pm,v 1.8 2002/10/22 07:45:11 lapp Exp $
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
2 #
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
3 # BioPerl module for Bio::Biblio::IO
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
4 #
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
5 # Cared for by Martin Senger <senger@ebi.ac.uk>
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
6 # For copyright and disclaimer see below.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
7
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
8 # POD documentation - main docs before the code
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
9
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
10 =head1 NAME
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
11
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
12 Bio::Biblio::IO - Handling the bibliographic references
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
13
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
14 =head1 SYNOPSIS
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
15
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
16 use Bio::Biblio::IO;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
17
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
18 # getting citations from a file
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
19 $in = Bio::Biblio::IO->new ('-file' => 'myfile.xml' ,
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
20 '-format' => 'medlinexml');
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
21 --- OR ---
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
22
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
23 # getting citations from a string
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
24 $in = Bio::Biblio::IO->new ('-data' => '<MedlineCitation>...</MedlineCitation>' ,
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
25 '-format' => 'medlinexml');
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
26 --- OR ---
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
27
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
28 # getting citations from a string if IO::String is installed
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
29 use IO::String;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
30 $in = Bio::Biblio::IO->new ('-fh' => IO::String->new ($citation),
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
31 '-format' => 'medlinexml');
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
32
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
33 $in = Bio::Biblio::IO->new(-fh => $io_handle , '-format' => 'medlinexml');
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
34
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
35 --- OR ---
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
36
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
37 # getting citations from any IO handler
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
38 $in = Bio::Biblio::IO->new('-fh' => $io_handle ,
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
39 '-format' => 'medlinexml');
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
40
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
41
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
42 # now, having $in, we can read all citations
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
43 while ( my $citation = $in->next_bibref() ) {
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
44 &do_something_with_citation ($citation);
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
45 }
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
46
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
47 --- OR ---
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
48
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
49 # again reading all citation but now a callback defined in your
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
50 # code is used (note that the reading starts already when new()
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
51 # is called)
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
52 $io = new Bio::Biblio::IO ('-format' => 'medlinexml',
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
53 '-file' => $testfile,
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
54 '-callback' => \&callback);
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
55 sub callback {
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
56 my $citation = shift;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
57 print $citation->{'_identifier'} . "\n";
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
58 }
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
59
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
60 Now, to actually get a citation in an XML format,
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
61 use I<Bio::Biblio> module which returns an XML string:
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
62
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
63 use Bio::Biblio;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
64 my $xml = new Bio::Biblio->get_by_id ('94033980');
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
65 my $reader = Bio::Biblio::IO->new ('-data' => $xml,
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
66 '-format' => 'medlinexml');
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
67
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
68 while (my $citation = $reader->next_bibref()) {
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
69 ... do something here with $citation
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
70 }
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
71
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
72 And, finally, the resulting citation can be received in different
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
73 output formats:
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
74
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
75 $io = new Bio::Biblio::IO ('-format' => 'medlinexml',
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
76 '-result' => 'raw');
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
77 --- OR ---
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
78
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
79 $io = new Bio::Biblio::IO ('-format' => 'medlinexml',
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
80 '-result' => 'medline2ref');
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
81
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
82 --- OR ---
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
83
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
84 $io = new Bio::Biblio::IO ('-format' => 'pubmedxml',
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
85 '-result' => 'pubmed2ref');
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
86
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
87 =head1 DESCRIPTION
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
88
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
89 Bio::Biblio::IO is a handler module for accessing bibliographic
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
90 citations. The citations can be in different formats - assuming that
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
91 there is a corresponding module knowing that format in Bio::Biblio::IO
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
92 directory (e.g. Bio::Biblio::IO::medlinexml). The format (and the
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
93 module name) is given by the argument I<-format>.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
94
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
95 Once an instance of C<Bio::Biblio::IO> class is available, the
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
96 citations can be read by calling repeatedly method I<next_bibref>:
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
97
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
98 while (my $citation = $reader->next_bibref()) {
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
99 ... do something here with $citation
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
100 }
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
101
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
102 However, this may imply that all citations were already read into the
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
103 memory. If you expect a huge amount of citations to be read, you may
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
104 choose a I<callback> option. Your subroutine is specified in the
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
105 C<new()> method and is called everytime a new citation is available
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
106 (see an example above in SYNOPSIS).
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
107
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
108 The citations returned by I<next_bibref> or given to your callback
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
109 routine can be of different formats depending on the argument
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
110 I<-result>. One result type is I<raw> and it is represented by a
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
111 simple, not blessed hash table:
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
112
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
113 $io = new Bio::Biblio::IO ('-result' => 'raw');
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
114
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
115 What other result formats are available depends on the module who
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
116 reads the citations in the first place. At the moment, the following
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
117 ones are available:
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
118
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
119 $io = new Bio::Biblio::IO ('-result' => 'medline2ref');
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
120
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
121 This is a default result format for reading citations by the
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
122 I<medlinexml> module. The C<medlinexml> module is again the default
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
123 one. Which means that you can almost omit arguments (you still need to
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
124 say where the citations come from):
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
125
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
126 $io = new Bio::Biblio::IO ('-file' => 'data/medline_data.xml');
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
127
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
128 Another result format available is for PUBMED citations (which is a
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
129 super-set of the MEDLINE citations having few more tags):
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
130
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
131 $io = new Bio::Biblio::IO ('-format' => 'pubmedxml',
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
132 '-result' => 'pubmed2ref',
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
133 '-data' => $citation);
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
134
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
135 Or, because C<pubmed2ref> is a default one for PUBMED citations, you can say just:
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
136
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
137 $io = new Bio::Biblio::IO ('-format' => 'pubmedxml',
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
138 '-data' => $citation);
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
139
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
140 Both C<medline2ref> and C<pubmed2ref> results are objects defined in
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
141 the directory C<Bio::Biblio>.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
142
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
143 =head1 SEE ALSO
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
144
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
145 =over
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
146
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
147 =item *
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
148
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
149 An example script I<examples/biblio.pl>. It has many options and its
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
150 own help. The relevant options to this IO module are I<-f>
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
151 (specifying what file to read) and I<-O> (specifying what result
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
152 format to achieve).
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
153
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
154 =item *
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
155
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
156 OpenBQS home page: http://industry.ebi.ac.uk/openBQS
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
157
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
158 =item *
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
159
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
160 Comments to the Perl client: http://industry.ebi.ac.uk/openBQS/Client_perl.html
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
161
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
162 =back
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
163
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
164 =head1 FEEDBACK
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
165
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
166 =head2 Mailing Lists
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
167
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
168 User feedback is an integral part of the evolution of this
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
169 and other Bioperl modules. Send your comments and suggestions preferably
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
170 to one of the Bioperl mailing lists.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
171 Your participation is much appreciated.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
172
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
173 bioperl-l@bioperl.org - General discussion
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
174 http://bioperl.org/MailList.shtml - About the mailing lists
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
175
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
176 =head2 Reporting Bugs
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
177
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
178 Report bugs to the Bioperl bug tracking system to help us keep track
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
179 the bugs and their resolution.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
180 Bug reports can be submitted via email or the web:
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
181
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
182 bioperl-bugs@bioperl.org
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
183 http://bugzilla.bioperl.org/
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
184
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
185 =head1 AUTHOR
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
186
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
187 Martin Senger (senger@ebi.ac.uk)
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
188
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
189 =head1 COPYRIGHT
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
190
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
191 Copyright (c) 2002 European Bioinformatics Institute. All Rights Reserved.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
192
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
193 This module is free software; you can redistribute it and/or modify
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
194 it under the same terms as Perl itself.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
195
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
196 =head1 DISCLAIMER
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
197
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
198 This software is provided "as is" without warranty of any kind.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
199
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
200 =head1 APPENDIX
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
201
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
202 The rest of the documentation details each of the object
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
203 methods. Internal methods are preceded with a _
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
204
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
205 =cut
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
206
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
207
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
208 # Let the code begin...
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
209
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
210 package Bio::Biblio::IO;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
211
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
212 use strict;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
213 use vars qw(@ISA);
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
214
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
215 use Bio::Root::Root;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
216 use Bio::Root::IO;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
217 use Symbol();
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
218
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
219 @ISA = qw(Bio::Root::Root Bio::Root::IO);
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
220
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
221 my $entry = 0;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
222
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
223 sub new {
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
224 my ($caller, @args) = @_;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
225 my $class = ref ($caller) || $caller;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
226
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
227 # if $caller is an object, or if it is an underlying
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
228 # 'real-work-doing' class (e.g. Bio::Biblio::IO::medlinexml) then
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
229 # we want to call SUPER to create and bless an object
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
230 if( $class =~ /Bio::Biblio::IO::(\S+)/ ) {
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
231 my ($self) = $class->SUPER::new (@args);
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
232 $self->_initialize (@args);
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
233 return $self;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
234
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
235 # this is called only the first time when somebody calls: 'new
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
236 # Bio::Biblio::IO (...)', and it actually loads a 'real-work-doing'
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
237 # module and call this new() method again (unless the loaded
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
238 # module has its own new() method)
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
239 } else {
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
240 my %param = @args;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
241 @param{ map { lc $_ } keys %param } = values %param; # lowercase keys
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
242 my $format = $param{'-format'} ||
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
243 $class->_guess_format( $param{-file} || $ARGV[0] ) ||
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
244 'medlinexml';
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
245 $format = "\L$format"; # normalize capitalization to lower case
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
246
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
247 # load module with the real implementation - as defined in $format
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
248 return undef unless (&_load_format_module ($format));
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
249
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
250 # this will call this same method new() - but rather its
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
251 # upper (object) branche
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
252 return "Bio::Biblio::IO::$format"->new(@args);
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
253 }
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
254 }
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
255
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
256 sub newFh {
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
257 my $class = shift;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
258 return unless my $self = $class->new(@_);
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
259 return $self->fh;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
260 }
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
261
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
262
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
263 sub fh {
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
264 my $self = shift;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
265 my $class = ref($self) || $self;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
266 my $s = Symbol::gensym;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
267 tie $$s,$class,$self;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
268 return $s;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
269 }
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
270
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
271 # _initialize is chained for all Bio::Biblio::IO classes
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
272
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
273 sub _initialize {
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
274 my ($self, @args) = @_;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
275 # initialize the IO part
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
276 $self->_initialize_io (@args);
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
277 }
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
278
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
279 =head2 next_bibref
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
280
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
281 Usage : $citation = stream->next_bibref
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
282 Function: Reads the next citation object from the stream and returns it.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
283 Returns : a Bio::Biblio::Ref citation object, or something else
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
284 (depending on the '-result' argument given in the 'new()'
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
285 method).
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
286 Args : none
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
287
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
288 =cut
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
289
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
290 sub next_bibref {
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
291 my ($self) = shift;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
292 $self->throw ("Sorry, you cannot read from a generic Bio::Biblio::IO object.");
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
293 }
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
294
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
295 # -----------------------------------------------------------------------------
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
296
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
297 =head2 _load_format_module
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
298
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
299 Usage : $class->_load_format_module ($format)
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
300 Returns : 1 on success, undef on failure
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
301 Args : 'format' should contain the last part of the
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
302 name of a module who does the real implementation
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
303
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
304 It does (in run-time) a similar thing as
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
305
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
306 require Bio::Biblio::IO::$format
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
307
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
308 It throws an exception if it fails to find and load the module
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
309 (for example, because of the compilation errors in the module).
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
310
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
311 =cut
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
312
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
313 sub _load_format_module {
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
314 my ($format) = @_;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
315 my ($module, $load, $m);
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
316
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
317 $module = "_<Bio/Biblio/IO/$format.pm";
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
318 $load = "Bio/Biblio/IO/$format.pm";
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
319
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
320 return 1 if $main::{$module};
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
321 eval {
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
322 require $load;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
323 };
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
324 if ( $@ ) {
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
325 Bio::Root::Root->throw (<<END);
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
326 $load: $format cannot be found or loaded
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
327 Exception $@
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
328 For more information about the Biblio system please see the Bio::Biblio::IO docs.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
329 END
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
330 ;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
331 return;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
332 }
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
333 return 1;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
334 }
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
335
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
336 =head2 _guess_format
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
337
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
338 Usage : $class->_guess_format ($filename)
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
339 Returns : string with a guessed format of the input data (e.g. 'medlinexml')
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
340 Args : a file name whose extension can help to guess its format
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
341
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
342 It makes an expert guess what kind of data are in the given file
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
343 (but be prepare that $filename may be empty).
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
344
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
345 =cut
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
346
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
347 sub _guess_format {
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
348 my $class = shift;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
349 return unless $_ = shift;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
350 return 'medlinexml' if (/\.(xml|medlinexml)$/i);
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
351 return;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
352 }
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
353
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
354 sub DESTROY {
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
355 my $self = shift;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
356
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
357 $self->close();
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
358 }
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
359
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
360 sub TIEHANDLE {
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
361 my ($class,$val) = @_;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
362 return bless {'biblio' => $val}, $class;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
363 }
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
364
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
365 sub READLINE {
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
366 my $self = shift;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
367 return $self->{'biblio'}->next_bibref() unless wantarray;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
368 my (@list, $obj);
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
369 push @list, $obj while $obj = $self->{'biblio'}->next_bibref();
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
370 return @list;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
371 }
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
372
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
373 1;