annotate variant_effect_predictor/Bio/Biblio/IO.pm @ 0:1f6dce3d34e0

Uploaded
author mahtabm
date Thu, 11 Apr 2013 02:01:53 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
1 # $Id: IO.pm,v 1.8 2002/10/22 07:45:11 lapp Exp $
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
2 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
3 # BioPerl module for Bio::Biblio::IO
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
4 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
5 # Cared for by Martin Senger <senger@ebi.ac.uk>
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
6 # For copyright and disclaimer see below.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
7
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
8 # POD documentation - main docs before the code
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
9
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
10 =head1 NAME
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
11
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
12 Bio::Biblio::IO - Handling the bibliographic references
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
13
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
14 =head1 SYNOPSIS
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
15
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
16 use Bio::Biblio::IO;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
17
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
18 # getting citations from a file
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
19 $in = Bio::Biblio::IO->new ('-file' => 'myfile.xml' ,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
20 '-format' => 'medlinexml');
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
21 --- OR ---
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
22
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
23 # getting citations from a string
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
24 $in = Bio::Biblio::IO->new ('-data' => '<MedlineCitation>...</MedlineCitation>' ,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
25 '-format' => 'medlinexml');
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
26 --- OR ---
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
27
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
28 # getting citations from a string if IO::String is installed
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
29 use IO::String;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
30 $in = Bio::Biblio::IO->new ('-fh' => IO::String->new ($citation),
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
31 '-format' => 'medlinexml');
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
32
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
33 $in = Bio::Biblio::IO->new(-fh => $io_handle , '-format' => 'medlinexml');
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
34
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
35 --- OR ---
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
36
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
37 # getting citations from any IO handler
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
38 $in = Bio::Biblio::IO->new('-fh' => $io_handle ,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
39 '-format' => 'medlinexml');
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
40
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
41
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
42 # now, having $in, we can read all citations
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
43 while ( my $citation = $in->next_bibref() ) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
44 &do_something_with_citation ($citation);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
45 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
46
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
47 --- OR ---
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
48
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
49 # again reading all citations, but now a callback defined in your
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
50 # code is used (note that the reading starts already when new()
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
51 # is called)
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
52 $io = new Bio::Biblio::IO ('-format' => 'medlinexml',
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
53 '-file' => $testfile,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
54 '-callback' => \&callback);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
55 sub callback {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
56 my $citation = shift;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
57 print $citation->{'_identifier'} . "\n";
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
58 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
59
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
60 Now, to actually get a citation in an XML format,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
61 use I<Bio::Biblio> module which returns an XML string:
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
62
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
63 use Bio::Biblio;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
64 my $xml = new Bio::Biblio->get_by_id ('94033980');
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
65 my $reader = Bio::Biblio::IO->new ('-data' => $xml,
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
66 '-format' => 'medlinexml');
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
67
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
68 while (my $citation = $reader->next_bibref()) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
69 ... do something here with $citation
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
70 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
71
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
72 And, finally, the resulting citation can be received in different
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
73 output formats:
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
74
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
75 $io = new Bio::Biblio::IO ('-format' => 'medlinexml',
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
76 '-result' => 'raw');
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
77 --- OR ---
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
78
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
79 $io = new Bio::Biblio::IO ('-format' => 'medlinexml',
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
80 '-result' => 'medline2ref');
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
81
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
82 --- OR ---
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
83
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
84 $io = new Bio::Biblio::IO ('-format' => 'pubmedxml',
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
85 '-result' => 'pubmed2ref');
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
86
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
87 =head1 DESCRIPTION
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
88
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
89 Bio::Biblio::IO is a handler module for accessing bibliographic
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
90 citations. The citations can be in different formats - assuming that
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
91 there is a corresponding module knowing that format in Bio::Biblio::IO
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
92 directory (e.g. Bio::Biblio::IO::medlinexml). The format (and the
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
93 module name) is given by the argument I<-format>.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
94
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
95 Once an instance of C<Bio::Biblio::IO> class is available, the
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
96 citations can be read by calling repeatedly method I<next_bibref>:
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
97
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
98 while (my $citation = $reader->next_bibref()) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
99 ... do something here with $citation
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
100 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
101
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
102 However, this may imply that all citations were already read into the
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
103 memory. If you expect a huge amount of citations to be read, you may
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
104 choose a I<callback> option. Your subroutine is specified in the
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
105 C<new()> method and is called every time a new citation is available
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
106 (see an example above in SYNOPSIS).
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
107
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
108 The citations returned by I<next_bibref> or given to your callback
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
109 routine can be of different formats depending on the argument
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
110 I<-result>. One result type is I<raw> and it is represented by a
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
111 simple, not blessed hash table:
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
112
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
113 $io = new Bio::Biblio::IO ('-result' => 'raw');
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
114
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
115 What other result formats are available depends on the module that
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
116 reads the citations in the first place. At the moment, the following
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
117 ones are available:
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
118
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
119 $io = new Bio::Biblio::IO ('-result' => 'medline2ref');
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
120
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
121 This is a default result format for reading citations by the
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
122 I<medlinexml> module. The C<medlinexml> module is again the default
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
123 one. Which means that you can almost omit arguments (you still need to
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
124 say where the citations come from):
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
125
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
126 $io = new Bio::Biblio::IO ('-file' => 'data/medline_data.xml');
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
127
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
128 Another result format available is for PUBMED citations (which is a
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
129 super-set of the MEDLINE citations having few more tags):
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
130
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
131 $io = new Bio::Biblio::IO ('-format' => 'pubmedxml',
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
132 '-result' => 'pubmed2ref',
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
133 '-data' => $citation);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
134
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
135 Or, because C<pubmed2ref> is a default one for PUBMED citations, you can say just:
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
136
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
137 $io = new Bio::Biblio::IO ('-format' => 'pubmedxml',
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
138 '-data' => $citation);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
139
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
140 Both C<medline2ref> and C<pubmed2ref> results are objects defined in
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
141 the directory C<Bio::Biblio>.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
142
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
143 =head1 SEE ALSO
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
144
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
145 =over
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
146
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
147 =item *
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
148
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
149 An example script I<examples/biblio.pl>. It has many options and its
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
150 own help. The relevant options to this IO module are I<-f>
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
151 (specifying what file to read) and I<-O> (specifying what result
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
152 format to achieve).
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
153
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
154 =item *
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
155
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
156 OpenBQS home page: http://industry.ebi.ac.uk/openBQS
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
157
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
158 =item *
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
159
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
160 Comments to the Perl client: http://industry.ebi.ac.uk/openBQS/Client_perl.html
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
161
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
162 =back
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
163
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
164 =head1 FEEDBACK
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
165
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
166 =head2 Mailing Lists
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
167
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
168 User feedback is an integral part of the evolution of this
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
169 and other Bioperl modules. Send your comments and suggestions preferably
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
170 to one of the Bioperl mailing lists.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
171 Your participation is much appreciated.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
172
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
173 bioperl-l@bioperl.org - General discussion
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
174 http://bioperl.org/MailList.shtml - About the mailing lists
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
175
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
176 =head2 Reporting Bugs
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
177
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
178 Report bugs to the Bioperl bug tracking system to help us keep track
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
179 of the bugs and their resolution.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
180 Bug reports can be submitted via email or the web:
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
181
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
182 bioperl-bugs@bioperl.org
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
183 http://bugzilla.bioperl.org/
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
184
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
185 =head1 AUTHOR
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
186
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
187 Martin Senger (senger@ebi.ac.uk)
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
188
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
189 =head1 COPYRIGHT
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
190
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
191 Copyright (c) 2002 European Bioinformatics Institute. All Rights Reserved.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
192
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
193 This module is free software; you can redistribute it and/or modify
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
194 it under the same terms as Perl itself.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
195
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
196 =head1 DISCLAIMER
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
197
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
198 This software is provided "as is" without warranty of any kind.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
199
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
200 =head1 APPENDIX
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
201
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
202 The rest of the documentation details each of the object
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
203 methods. Internal methods are preceded with a _
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
204
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
205 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
206
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
207
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
208 # Let the code begin...
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
209
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
210 package Bio::Biblio::IO;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
211
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
212 use strict;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
213 use vars qw(@ISA);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
214
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
215 use Bio::Root::Root;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
216 use Bio::Root::IO;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
217 use Symbol();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
218
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
219 @ISA = qw(Bio::Root::Root Bio::Root::IO);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
220
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
221 my $entry = 0;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
222
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
# Constructor and factory in one.
#
# Called on Bio::Biblio::IO itself, it determines the input format (the
# '-format' argument, else a guess from the extension of '-file' or of
# $ARGV[0], else 'medlinexml'), loads Bio::Biblio::IO::<format> and
# delegates to that class's new().  Called on a class below the
# Bio::Biblio::IO:: namespace (or on an instance of one), it builds the
# object through the parent constructor and runs _initialize() on it.
#
# Args    : the named arguments shown in the SYNOPSIS ('-format', '-file', ...);
#           argument names are matched case-insensitively
# Returns : a reader object, or nothing if the format module was not loaded
sub new {
    my ($caller, @args) = @_;
    my $class = ref($caller) || $caller;

    # A 'real-work-doing' class (e.g. Bio::Biblio::IO::medlinexml), or an
    # instance of one: create and initialise the object right here.
    if ($class =~ /Bio::Biblio::IO::\S+/) {
        my ($self) = $class->SUPER::new(@args);
        $self->_initialize(@args);
        return $self;
    }

    # Generic entry point ('Bio::Biblio::IO->new (...)'): find out which
    # implementation is wanted, load it, and let it construct the object.
    my %param = @args;
    @param{ map { lc $_ } keys %param } = values %param;    # lowercase keys

    my $format = $param{'-format'}
        || $class->_guess_format($param{'-file'} || $ARGV[0])
        || 'medlinexml';
    $format = lc $format;    # normalize capitalization to lower case

    # _load_format_module() throws on failure, so this guard only matters
    # if it is ever changed to report failure by return value.  A bare
    # return yields undef in scalar context and an empty list in list
    # context.
    _load_format_module($format) or return;

    # This ends up in this same new() again (unless the loaded module has
    # its own new() method), this time taking the upper branch.
    return "Bio::Biblio::IO::$format"->new(@args);
}
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
255
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
# Convenience constructor: builds a reader with new() and hands back the
# tied filehandle produced by its fh() method instead of the reader itself.
#
# Args    : same as new()
# Returns : the value of fh() on the new reader, or nothing if new()
#           returned a false value
sub newFh {
    my ($class, @args) = @_;

    my $stream = $class->new(@args);
    return unless $stream;

    return $stream->fh;
}
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
261
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
262
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
# Creates a fresh anonymous glob and ties it to this object's class, passing
# the object itself to TIEHANDLE, so that reading from the returned handle
# is routed through READLINE.
#
# Args    : none
# Returns : a reference to the tied glob
sub fh {
    my ($self) = @_;
    my $class  = ref($self) || $self;

    my $handle = Symbol::gensym();
    tie *{$handle}, $class, $self;

    return $handle;
}
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
270
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
271 # _initialize is chained for all Bio::Biblio::IO classes
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
272
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
# Object initialisation hook invoked from new(): forwards all constructor
# arguments to _initialize_io() to set up the IO part of the object.
#
# Args    : the arguments given to new()
# Returns : whatever _initialize_io() returns
sub _initialize {
    my $self = shift;

    return $self->_initialize_io(@_);
}
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
278
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
279 =head2 next_bibref
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
280
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
281 Usage : $citation = $stream->next_bibref
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
282 Function: Reads the next citation object from the stream and returns it.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
283 Returns : a Bio::Biblio::Ref citation object, or something else
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
284 (depending on the '-result' argument given in the 'new()'
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
285 method).
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
286 Args : none
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
287
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
288 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
289
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
# Placeholder for the reading method: this generic version always throws.
# Format-specific classes are expected to supply the real implementation.
sub next_bibref {
    my ($stream) = @_;

    return $stream->throw('Sorry, you cannot read from a generic Bio::Biblio::IO object.');
}
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
294
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
295 # -----------------------------------------------------------------------------
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
296
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
297 =head2 _load_format_module
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
298
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
299 Usage : _load_format_module ($format)
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
300 Returns : 1 on success, undef on failure
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
301 Args : 'format' should contain the last part of the
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
302 name of a module that does the real implementation
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
303
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
304 It does (in run-time) a similar thing as
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
305
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
306 require Bio::Biblio::IO::$format
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
307
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
308 It throws an exception if it fails to find and load the module
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
309 (for example, because of the compilation errors in the module).
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
310
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
311 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
312
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
# Loads, at run time, the module implementing the given format, i.e. does
# the equivalent of:  require Bio::Biblio::IO::$format
#
# This is a plain function, not a method: the format is its only argument.
#
# Args    : the last component of the implementing module's name
# Returns : 1 on success
# Throws  : via Bio::Root::Root->throw if the name is not a plain
#           identifier, or if the module cannot be found or compiled
sub _load_format_module {
    my ($format) = @_;

    # The name is spliced into a file path handed to require(), so anything
    # other than identifier characters (path separators, '..') is refused.
    unless (defined $format && $format =~ /\A[A-Za-z0-9_]+\z/) {
        my $shown = defined $format ? $format : '';
        Bio::Root::Root->throw(
            "Invalid format name '$shown': only letters, digits and underscores are allowed");
    }

    my $load = "Bio/Biblio/IO/$format.pm";

    # require() consults %INC itself, so a module that is already loaded is
    # not compiled a second time; no separate "already loaded" test is needed.
    eval { require $load; };
    if (my $error = $@) {    # copy $@ at once, before anything can reset it
        Bio::Root::Root->throw(<<END);
$load: $format cannot be found or loaded
Exception $error
For more information about the Biblio system please see the Bio::Biblio::IO docs.
END
    }

    return 1;
}
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
335
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
336 =head2 _guess_format
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
337
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
338 Usage : $class->_guess_format ($filename)
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
339 Returns : string with a guessed format of the input data (e.g. 'medlinexml')
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
340 Args : a file name whose extension can help to guess its format
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
341
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
342 It makes an expert guess what kind of data are in the given file
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
343 (but be prepared that $filename may be empty).
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
344
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
345 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
346
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
# Guesses the format of the input data from a file name extension.
#
# Args    : a file name; may be undefined or empty
# Returns : 'medlinexml' for names ending in .xml or .medlinexml (matched
#           case-insensitively); nothing when no file name is given or the
#           extension is not recognised
sub _guess_format {
    my ($class, $filename) = @_;

    # Work on a lexical copy: assigning the name to the global $_ would
    # overwrite the caller's $_ (and whatever variable it is aliased to).
    return unless $filename;

    return 'medlinexml' if $filename =~ /\.(?:xml|medlinexml)$/i;
    return;
}
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
353
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
# Destructor: calls close() on the object when it goes out of scope.
sub DESTROY {
    my ($self) = @_;
    $self->close();
}
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
359
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
# tie() hook for filehandles: wraps the given reader in a new hash-based
# object of the requested class, stored under the 'biblio' key, where
# READLINE looks it up.
#
# Args    : class name, the reader object to read from
# Returns : the blessed tie object
sub TIEHANDLE {
    my $class  = shift;
    my $reader = shift;

    my %state = ('biblio' => $reader);
    return bless \%state, $class;
}
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
364
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
# tie() hook behind <$fh>: in scalar context returns the next citation from
# the wrapped reader; in list context keeps calling next_bibref() until it
# returns a false value and returns everything collected.
sub READLINE {
    my ($tied) = @_;
    my $reader = $tied->{'biblio'};

    if (!wantarray) {
        return $reader->next_bibref();
    }

    my @citations;
    while (my $citation = $reader->next_bibref()) {
        push @citations, $citation;
    }
    return @citations;
}
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
372
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
373 1;