annotate variant_effect_predictor/Bio/SearchIO/Writer/HitTableWriter.pm @ 0:21066c0abaf5 draft

Uploaded
author willmclaren
date Fri, 03 Aug 2012 10:04:48 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
1 # $Id: HitTableWriter.pm,v 1.14 2002/12/24 15:46:47 jason Exp $
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
2
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
3 =head1 NAME
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
4
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
5 Bio::SearchIO::Writer::HitTableWriter - Tab-delimited data for Bio::Search::Hit::HitI objects
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
6
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
7 =head1 SYNOPSIS
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
8
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
9 =head2 Example 1: Using the default columns
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
10
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
11 use Bio::SearchIO;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
12 use Bio::SearchIO::Writer::HitTableWriter;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
13
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
14 my $in = Bio::SearchIO->new();
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
15
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
16 my $writer = Bio::SearchIO::Writer::HitTableWriter->new();
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
17
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
18 my $out = Bio::SearchIO->new( -writer => $writer );
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
19
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
20 while ( my $result = $in->next_result() ) {
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
21 $out->write_result($result, ($in->report_count - 1 ? 0 : 1) );
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
22 }
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
23
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
24 =head2 Example 2: Specifying a subset of columns
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
25
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
26 use Bio::SearchIO;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
27 use Bio::SearchIO::Writer::HitTableWriter;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
28
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
29 my $in = Bio::SearchIO->new();
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
30
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
31 my $writer = Bio::SearchIO::Writer::HitTableWriter->new(
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
32 -columns => [qw(
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
33 query_name
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
34 query_length
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
35 hit_name
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
36 hit_length
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
37 frac_identical_query
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
38 expect
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
39 )] );
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
40
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
41 my $out = Bio::SearchIO->new( -writer => $writer,
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
42 -file => ">searchio.out" );
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
43
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
44 while ( my $result = $in->next_result() ) {
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
45 $out->write_result($result, ($in->report_count - 1 ? 0 : 1) );
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
46 }
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
47
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
48 =head2 Custom Labels
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
49
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
50 You can also specify different column labels if you don't want to use
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
51 the defaults. Do this by specifying a C<-labels> hash reference
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
52 parameter when creating the HitTableWriter object. The keys of the
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
53 hash should be the column number (left-most column = 1) for the label(s)
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
54 you want to specify. Here's an example:
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
55
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
56 my $writer = Bio::SearchIO::Writer::HitTableWriter->new(
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
57 -columns => [qw( query_name
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
58 query_length
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
59 hit_name
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
60 hit_length )],
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
61 -labels => { 1 => 'QUERY_GI',
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
62 3 => 'HIT_IDENTIFIER' } );
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
63
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
64
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
65 =head1 DESCRIPTION
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
66
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
67 Bio::SearchIO::Writer::HitTableWriter outputs summary data
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
68 for each Hit within a search result. Output is in tab-delimited format,
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
69 one row per Hit.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
70
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
71 The reason why this is considered summary data is that if a hit
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
72 contains multiple HSPs, the HSPs will be tiled and
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
73 the data represents a summary across all HSPs.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
74 See below for which columns are affected.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
75 See the docs in L<Bio::Search::Hit::BlastHit|Bio::Search::Hit::BlastHit>
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
76 for more details on HSP tiling.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
77
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
78 =head2 Available Columns
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
79
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
80 Here are the columns that can be specified in the C<-columns>
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
81 parameter when creating a HitTableWriter object. If a C<-columns> parameter
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
82 is not specified, this list, in this order, will be used as the default.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
83
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
84 query_name # Sequence identifier of the query.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
85 query_length # Full length of the query sequence
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
86 hit_name # Sequence identifier of the hit
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
87 hit_length # Full length of the hit sequence
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
88 round # Round number for hit (PSI-BLAST)
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
89 expect # Expect value for the alignment
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
90 score # Score for the alignment (e.g., BLAST score)
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
91 bits # Bit score for the alignment
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
92 num_hsps # Number of HSPs (not the "N" value)
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
93 frac_identical_query* # fraction of identical substitutions in query
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
94 frac_identical_hit* # fraction of identical substitutions in hit
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
95 frac_conserved_query* # fraction of conserved substitutions in query
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
96 frac_conserved_hit* # fraction of conserved substitutions in hit
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
97 frac_aligned_query* # fraction of the query sequence that is aligned
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
98 frac_aligned_hit* # fraction of the hit sequence that is aligned
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
99 length_aln_query* # Length of the aligned portion of the query sequence
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
100 length_aln_hit* # Length of the aligned portion of the hit sequence
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
101 gaps_query* # Number of gaps in the aligned query sequence
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
102 gaps_hit* # Number of gaps in the aligned hit sequence
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
103 gaps_total* # Number of gaps in the aligned query and hit sequences
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
104 start_query* # Starting coordinate of the aligned portion of the query sequence
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
105 end_query* # Ending coordinate of the aligned portion of the query sequence
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
106 start_hit* # Starting coordinate of the aligned portion of the hit sequence
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
107 end_hit* # Ending coordinate of the aligned portion of the hit sequence
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
108 strand_query # Strand of the aligned query sequence
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
109 strand_hit # Strand of the aligned hit sequence
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
110 frame # Frame of the alignment (0,1,2)
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
111 ambiguous_aln # Ambiguous alignment indicator ('qs', 'q', 's')
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
112 hit_description # Full description of the hit sequence
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
113 query_description # Full description of the query sequence
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
114
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
115 Items marked with a C<*> report data summed across all HSPs
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
116 after tiling them to avoid counting data from overlapping regions
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
117 multiple times.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
118
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
119 For more details about these columns, see the documentation for the
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
120 corresponding method in Bio::Search::Hit::BlastHit.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
121
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
122 =head1 TODO
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
123
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
124 Figure out the best way to incorporate algorithm-specific score columns.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
125 The best route is probably to have algorithm-specific subclasses
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
126 (e.g., BlastHitTableWriter, FastaHitTableWriter).
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
127
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
128 =head1 FEEDBACK
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
129
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
130 =head2 Mailing Lists
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
131
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
132 User feedback is an integral part of the evolution of this and other
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
133 Bioperl modules. Send your comments and suggestions preferably to one
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
134 of the Bioperl mailing lists. Your participation is much appreciated.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
135
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
136 bioperl-l@bioperl.org - General discussion
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
137 http://bioperl.org/MailList.html - About the mailing lists
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
138
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
139 =head2 Reporting Bugs
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
140
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
141 Report bugs to the Bioperl bug tracking system to help us keep track
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
142 of the bugs and their resolution. Bug reports can be submitted via email
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
143 or the web:
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
144
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
145 bioperl-bugs@bio.perl.org
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
146 http://bugzilla.bioperl.org/
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
147
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
148 =head1 AUTHOR
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
149
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
150 Steve Chervitz E<lt>sac@bioperl.orgE<gt>
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
151
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
152 See L<the FEEDBACK section | FEEDBACK> for where to send bug reports
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
153 and comments.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
154
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
155 =head1 COPYRIGHT
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
156
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
157 Copyright (c) 2001, 2002 Steve Chervitz. All Rights Reserved.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
158
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
159 This library is free software; you can redistribute it and/or modify
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
160 it under the same terms as Perl itself.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
161
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
162 =head1 DISCLAIMER
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
163
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
164 This software is provided "as is" without warranty of any kind.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
165
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
166 =head1 SEE ALSO
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
167
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
168 L<Bio::SearchIO::Writer::HitTableWriter>,
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
169 L<Bio::SearchIO::Writer::ResultTableWriter>
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
170
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
171 =head1 METHODS
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
172
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
173 =cut
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
174
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
175 package Bio::SearchIO::Writer::HitTableWriter;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
176
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
177 use strict;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
178 use Bio::SearchIO::Writer::ResultTableWriter;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
179
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
180 use vars qw( @ISA );
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
181 @ISA = qw( Bio::SearchIO::Writer::ResultTableWriter );
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
182
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
183
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
184 # Array fields: column, object, method[/argument], printf format,
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
185 # column label. Methods for result object are defined in
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
186 # Bio::Search::Result::ResultI. Methods for hit object are defined in
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
187 # Bio::Search::Hit::HitI. Tech note: If a bogus method is supplied,
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
188 # it will result in all values being zero. Don't know why this is.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
189
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
190 # TODO (maybe): Allow specification of separate mantissa/exponent for
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
191 # significance data.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
192
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
193 my %column_map = (
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
194 'query_name' => ['1', 'result', 'query_name', 's', 'QUERY' ],
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
195 'query_length' => ['2', 'result', 'query_length', 'd', 'LEN_Q'],
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
196 'hit_name' => ['3', 'hit', 'name', 's', 'HIT'],
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
197 'hit_length' => ['4', 'hit', 'length', 'd', 'LEN_H'],
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
198 'round' => ['5', 'hit', 'iteration', 'd', 'ROUND'],
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
199 'expect' => ['6', 'hit', 'significance', '.1e', 'EXPCT'],
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
200 'score' => ['7', 'hit', 'raw_score', 'd', 'SCORE'],
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
201 'bits' => ['8', 'hit', 'bits', 'd', 'BITS'],
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
202 'num_hsps' => ['9', 'hit', 'num_hsps', 'd', 'HSPS'],
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
203 'frac_identical_query' => ['10', 'hit', 'frac_identical/query', '.2f', 'FR_IDQ'],
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
204 'frac_identical_hit' => ['11', 'hit', 'frac_identical/hit', '.2f', 'FR_IDH'],
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
205 'frac_conserved_query' => ['12', 'hit', 'frac_conserved/query', '.2f', 'FR_CNQ'],
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
206 'frac_conserved_hit' => ['13', 'hit', 'frac_conserved/hit', '.2f', 'FR_CNH'],
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
207 'frac_aligned_query' => ['14', 'hit', 'frac_aligned_query', '.2f', 'FR_ALQ'],
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
208 'frac_aligned_hit' => ['15', 'hit', 'frac_aligned_hit', '.2f', 'FR_ALH'],
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
209 'length_aln_query' => ['16', 'hit', 'length_aln/query', 'd', 'LN_ALQ'],
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
210 'length_aln_hit' => ['17', 'hit', 'length_aln/hit', 'd', 'LN_ALH'],
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
211 'gaps_query' => ['18', 'hit', 'gaps/query', 'd', 'GAPS_Q'],
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
212 'gaps_hit' => ['19', 'hit', 'gaps/hit', 'd', 'GAPS_H'],
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
213 'gaps_total' => ['20', 'hit', 'gaps/total', 'd', 'GAPS_QH'],
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
214 'start_query' => ['21', 'hit', 'start/query', 'd', 'START_Q'],
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
215 'end_query' => ['22', 'hit', 'end/query', 'd', 'END_Q'],
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
216 'start_hit' => ['23', 'hit', 'start/hit', 'd', 'START_H'],
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
217 'end_hit' => ['24', 'hit', 'end/hit', 'd', 'END_H'],
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
218 'strand_query' => ['25', 'hit', 'strand/query', 's', 'STRND_Q'],
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
219 'strand_hit' => ['26', 'hit', 'strand/hit', 's', 'STRND_H'],
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
220 'frame' => ['27', 'hit', 'frame', 'd', 'FRAME'],
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
221 'ambiguous_aln' => ['28', 'hit', 'ambiguous_aln', 's', 'AMBIG'],
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
222 'hit_description' => ['29', 'hit', 'description', 's', 'DESC_H'],
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
223 'query_description' => ['30', 'result', 'query_description', 's', 'DESC_Q'],
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
224 );
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
225
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
226 sub column_map { return %column_map }
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
227
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
228
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
229 =head2 to_string()
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
230
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
231 Note: this method is not intended for direct use. The
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
232 SearchIO::write_result() method calls it automatically if the writer
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
233 is hooked up to a SearchIO object as illustrated in
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
234 L<the SYNOPSIS section | SYNOPSIS>.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
235
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
236 Title : to_string()
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
237 :
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
238 Usage : print $writer->to_string( $result_obj, [$include_labels] );
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
239 :
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
240 Argument : $result_obj = A Bio::Search::Result::BlastResult object
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
241 : $include_labels = boolean, if true column labels are included (default: false)
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
242 :
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
243 Returns : String containing tab-delimited set of data for each hit
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
244 : in a BlastResult object. Some data is summed across multiple HSPs.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
245 :
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
246 Throws : n/a
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
247
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
248 =cut
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
249
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
250 #----------------
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
251 sub to_string {
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
252 #----------------
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
253 my ($self, $result, $include_labels) = @_;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
254
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
255 my $str = $include_labels ? $self->column_labels() : '';
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
256 my $func_ref = $self->row_data_func;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
257 my $printf_fmt = $self->printf_fmt;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
258
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
259 my ($resultfilter,$hitfilter) = ( $self->filter('RESULT'),
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
260 $self->filter('HIT') );
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
261 if( ! defined $resultfilter ||
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
262 &{$resultfilter}($result) ) {
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
263 $result->can('rewind') &&
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
264 $result->rewind(); # insure we're at the beginning
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
265 foreach my $hit($result->hits) {
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
266 next if( defined $hitfilter && ! &{$hitfilter}($hit));
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
267 my @row_data = map { defined $_ ? $_ : 0 } &{$func_ref}($result, $hit);
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
268 $str .= sprintf "$printf_fmt\n", @row_data;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
269 }
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
270 }
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
271 $str =~ s/\t\n/\n/gs;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
272 return $str;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
273 }
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
274
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
275 =head2 end_report
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
276
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
277 Title : end_report
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
278 Usage : $self->end_report()
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
279 Function: The method to call when ending a report, this is
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
280 mostly for cleanup for formats which require you to
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
281 have something at the end of the document. Nothing for
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
282 a text message.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
283 Returns : string
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
284 Args : none
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
285
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
286 =cut
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
287
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
288 sub end_report {
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
289 return '';
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
290 }
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
291
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
292
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
293 =head2 filter
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
294
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
295 Title : filter
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
296 Usage : $writer->filter('hsp', \&hsp_filter);
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
297 Function: Filter out either at HSP,Hit,or Result level
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
298 Returns : none
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
299 Args : string => data type,
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
300 CODE reference
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
301
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
302
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
303 =cut
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
304
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
305 1;