annotate variant_effect_predictor/Bio/AlignIO/bl2seq.pm @ 2:a5976b2dce6f

changing default values for ensembl database
author mahtabm
date Thu, 11 Apr 2013 17:15:42 +1000
parents 1f6dce3d34e0
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
1 # $Id: bl2seq.pm,v 1.13.2.1 2003/06/18 12:19:52 jason Exp $
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
2 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
3 # BioPerl module for Bio::AlignIO::bl2seq
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
4
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
5 # based on the Bio::SeqIO modules
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
6 # by Ewan Birney <birney@sanger.ac.uk>
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
7 # and Lincoln Stein <lstein@cshl.org>
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
8 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
9 # the Bio::Tools::BPlite modules by
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
10 # Ian Korf (ikorf@sapiens.wustl.edu, http://sapiens.wustl.edu/~ikorf),
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
11 # Lorenz Pollak (lorenz@ist.org, bioperl port)
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
12 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
13 # and the SimpleAlign.pm module of Ewan Birney
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
14 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
15 # Copyright Peter Schattner
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
16 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
17 # You may distribute this module under the same terms as perl itself
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
18 # _history
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
19 # September 5, 2000
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
20 # POD documentation - main docs before the code
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
21
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
22 =head1 NAME
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
23
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
24 Bio::AlignIO::bl2seq - bl2seq sequence input/output stream
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
25
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
26 =head1 SYNOPSIS
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
27
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
28 Do not use this module directly. Use it via the L<Bio::AlignIO> class, as in:
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
29
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
30 use Bio::AlignIO;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
31
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
32 $in = Bio::AlignIO->new(-file => "inputfilename" , '-format' => 'bl2seq');
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
33 $aln = $in->next_aln();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
34
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
35
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
36 =head1 DESCRIPTION
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
37
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
38 This object can create L<Bio::SimpleAlign> sequence alignment objects (of
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
39 2 sequences) from bl2seq BLAST reports.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
40
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
41 A nice feature of this module is that - in combination with
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
42 StandAloneBlast.pm or remote blasting - it can be used to align 2
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
43 sequences and make a SimpleAlign object from them which can then be
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
44 manipulated using any SimpleAlign.pm methods, eg:
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
45
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
46 #Get 2 sequences
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
47 $str = Bio::SeqIO->new(-file=>'t/amino.fa' , '-format' => 'Fasta', );
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
48 my $seq3 = $str->next_seq();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
49 my $seq4 = $str->next_seq();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
50
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
51 # Run bl2seq on them
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
52 $factory = Bio::Tools::StandAloneBlast->new('program' => 'blastp',
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
53 'outfile' => 'bl2seq.out');
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
54 my $bl2seq_report = $factory->bl2seq($seq3, $seq4);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
55
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
56 # Use AlignIO.pm to create a SimpleAlign object from the bl2seq report
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
57 $str = Bio::AlignIO->new(-file=> 'bl2seq.out','-format' => 'bl2seq');
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
58 $aln = $str->next_aln();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
59
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
60 Pass in -report_type flag when initializing the object to have this
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
61 pass through to the Bio::Tools::BPbl2seq object. See that object.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
62
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
63 =head1 FEEDBACK
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
64
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
65 =head2 Mailing Lists
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
66
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
67 User feedback is an integral part of the evolution of this and other
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
68 Bioperl modules. Send your comments and suggestions preferably to one
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
69 of the Bioperl mailing lists. Your participation is much appreciated.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
70
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
71 bioperl-l@bioperl.org - General discussion
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
72 http://bio.perl.org/MailList.html - About the mailing lists
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
73
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
74 =head2 Reporting Bugs
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
75
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
76 Report bugs to the Bioperl bug tracking system to help us keep track
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
77 of the bugs and their resolution.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
78 Bug reports can be submitted via email or the web:
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
79
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
80 bioperl-bugs@bio.perl.org
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
81 http://bugzilla.bioperl.org/
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
82
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
83 =head1 AUTHOR - Peter Schattner
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
84
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
85 Email: schattner@alum.mit.edu
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
86
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
87
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
88 =head1 APPENDIX
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
89
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
90 The rest of the documentation details each of the object
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
91 methods. Internal methods are usually preceded with a _
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
92
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
93 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
94
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
95 # Let the code begin...
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
96
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
97 package Bio::AlignIO::bl2seq;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
98 use vars qw(@ISA);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
99 use strict;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
100 # Object preamble - inherits from Bio::AlignIO
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
101
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
102 use Bio::AlignIO;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
103 use Bio::Tools::BPbl2seq;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
104
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
105 @ISA = qw(Bio::AlignIO);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
106
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
107
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
108
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
# Constructor hook: runs the parent class initialisation with the same
# arguments, then records the optional REPORT_TYPE argument on the object
# so next_aln() can hand it to the bl2seq report parser.
#
# Args    : the argument list given to the constructor
# Returns : 1
sub _initialize {
    my $self   = shift;
    my @params = @_;

    $self->SUPER::_initialize(@params);

    # _rearrange returns the requested values in the order asked for; only
    # the first one is kept (undef when the argument was not supplied).
    my ($report_type) = $self->_rearrange( ['REPORT_TYPE'], @params );
    $self->{'report_type'} = $report_type;

    return 1;
}
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
116
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
117 =head2 next_aln
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
118
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
119 Title : next_aln
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
120 Usage : $aln = $stream->next_aln()
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
121 Function: returns the next alignment in the stream.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
122 Returns : L<Bio::Align::AlignI> object - returns 0 on end of file
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
123 or on error
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
124 Args : NONE
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
125
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
126 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
127
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
# Builds a two-sequence alignment (query + subject) from the next feature
# (HSP) delivered by the bl2seq report parser.
#
# Args    : none
# Returns : a Bio::SimpleAlign object holding the query and subject
#           sequences, or 0 when the parser has no further feature or a
#           required field (sequence string, start, end, subject name) is
#           missing or false.
sub next_aln {
    my $self = shift;

    # Create the report parser on first use and cache it on the object, so
    # every later call pulls its feature from the same parser instance.
    $self->{'bl2seqobj'} ||= Bio::Tools::BPbl2seq->new(
        -fh          => $self->_fh,
        -report_type => $self->{'report_type'},
    );
    my $bl2seqobj = $self->{'bl2seqobj'};

    # Without this guard an exhausted parser would make the method calls
    # below die on an undefined value instead of returning 0.
    my $hsp = $bl2seqobj->next_feature;
    return 0 unless $hsp;

    # Query side. The id is a fixed placeholder because the query name is
    # not present in a bl2seq report, so it is not part of the validity
    # check either.
    my $query_string = $hsp->querySeq;
    my $query_start  = $hsp->query->start;
    my $query_end    = $hsp->query->end;
    return 0 unless $query_string && $query_start && $query_end;

    # Subject side, named after the subject recorded by the parser.
    my $sbjct_string = $hsp->sbjctSeq;
    my $sbjct_start  = $hsp->hit->start;
    my $sbjct_end    = $hsp->hit->end;
    my $sbjct_name   = $bl2seqobj->sbjctName;
    return 0
        unless $sbjct_string && $sbjct_start && $sbjct_end && $sbjct_name;

    # Only build the alignment once both halves are known to be usable.
    my $aln = Bio::SimpleAlign->new( -source => 'bl2seq' );

    $aln->add_seq(
        Bio::LocatableSeq->new(
            '-seq'   => $query_string,
            '-id'    => 'Query-sequence',
            '-start' => $query_start,
            '-end'   => $query_end,
        )
    );

    $aln->add_seq(
        Bio::LocatableSeq->new(
            '-seq'   => $sbjct_string,
            '-id'    => $sbjct_name,
            '-start' => $sbjct_start,
            '-end'   => $sbjct_end,
        )
    );

    return $aln;
}
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
171
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
172
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
173 =head2 write_aln
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
174
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
175 Title : write_aln
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
176 Usage : $stream->write_aln(@aln)
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
177 Function: writes the $aln object into the stream in bl2seq format
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
178 Returns : 1 for success and 0 for error
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
179 Args : L<Bio::Align::AlignI> object
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
180
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
181
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
182 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
183
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
# Writing alignments in bl2seq format is not supported; this method always
# raises an error through the object's throw() method.
#
# Args    : alignment object(s) (ignored)
# Returns : nothing is returned here; throw() is invoked unconditionally
sub write_aln {
    my ($self, @aln) = @_;

    # The message previously ended in the literal characters "/n", a typo
    # for the newline escape.
    $self->throw("Sorry: writing bl2seq output is not available!\n");
}
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
189
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
190 1;