annotate variant_effect_predictor/Bio/Tools/Seg.pm @ 0:2bc9b66ada89 draft default tip

Uploaded
author mahtabm
date Thu, 11 Apr 2013 06:29:17 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
1 # $Id: Seg.pm,v 1.6 2002/10/22 07:45:22 lapp Exp $
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
2 #
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
3 # BioPerl module for Bio::Tools::Seg
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
4 #
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
5 # Copyright Balamurugan Kumarasamy
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
6 #
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
7 # You may distribute this module under the same terms as perl itself
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
8 #
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
9 # POD documentation - main docs before the code
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
10 #
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
11 # Copyright
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
12 #
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
13 # You may distribute this module under the same terms as perl itself
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
14 # POD documentation - main docs before the code
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
15
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
16 =head1 NAME
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
17
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
18 Bio::Tools::Seg - parse Seg output (filter low complexity protein sequence)
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
19
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
20 =head1 SYNOPSIS
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
21
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
22 use Bio::Tools::Seg;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
23 my $parser = Bio::Tools::Seg->new(-fh => $filehandle);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
24 while( my $seg_feat = $parser->next_result ) {
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
25 #do something
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
26 #eg
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
27 push @seg_feat, $seg_feat;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
28 }
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
29
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
30 =head1 DESCRIPTION
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
31
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
32 Parser for Seg output
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
33
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
34 =head1 FEEDBACK
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
35
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
36 =head2 Mailing Lists
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
37
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
38 User feedback is an integral part of the evolution of this and other
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
39 Bioperl modules. Send your comments and suggestions preferably to
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
40 the Bioperl mailing list. Your participation is much appreciated.
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
41
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
42 bioperl-l@bioperl.org - General discussion
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
43 http://bioperl.org/MailList.shtml - About the mailing lists
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
44
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
45 =head2 Reporting Bugs
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
46
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
47 Report bugs to the Bioperl bug tracking system to help us keep track
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
48 of the bugs and their resolution. Bug reports can be submitted via
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
49 email or the web:
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
50
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
51 bioperl-bugs@bioperl.org
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
52 http://bugzilla.bioperl.org/
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
53
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
54 =head1 AUTHOR - Bala
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
55
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
56 Email savikalpa@fugu-sg.org
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
57
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
58
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
59 =head1 CONTRIBUTORS
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
60
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
61 Additional contributors names and emails here
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
62
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
63 =head1 APPENDIX
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
64
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
65 The rest of the documentation details each of the object methods.
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
66 Internal methods are usually preceded with a _
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
67
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
68 =cut
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
69
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
70 package Bio::Tools::Seg;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
71 use vars qw(@ISA);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
72 use strict;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
73
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
74 use Bio::Root::Root;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
75 use Bio::SeqFeature::FeaturePair;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
76 use Bio::Root::IO;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
77 use Bio::SeqFeature::Generic;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
78 @ISA = qw(Bio::Root::Root Bio::Root::IO);
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
79
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
80
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
81
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
82
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
83
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
84 =head2 new
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
85
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
86 Title : new
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
87 Usage : my $obj = new Bio::Tools::Seg();
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
88 Function: Builds a new Bio::Tools::Seg object
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
89 Returns : Bio::Tools::Seg
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
90 Args : -fh/-file => $val, # for initing input, see Bio::Root::IO
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
91
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
92
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
93 =cut
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
94
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
95
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
# Constructor. Object creation is delegated to the parent class; the same
# argument list (e.g. -fh / -file) is then handed to _initialize_io() so the
# input source is set up before the object is returned.
sub new {
    my $class  = shift;
    my @params = @_;

    my $self = $class->SUPER::new(@params);
    $self->_initialize_io(@params);

    return $self;
}
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
104
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
105 =head2 next_result
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
106
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
107 Title : next_result
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
108 Usage : my $feat = $seg->next_result
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
109 Function: Get the next result set from parser data
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
110 Returns : Bio::SeqFeature::Generic
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
111 Args : none
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
112
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
113
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
114 =cut
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
115
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
# Read forward through the Seg output until the next header line, e.g.
#   >test_prot(214-226) complexity=2.26 (12/2.20/2.50)
# and turn it into a feature via create_feature().
#
# Args    : none
# Returns : whatever create_feature() returns for the next parsable header
#           line, or nothing (undef in scalar context) once _readline()
#           has no more input.
#
# Lines starting with ">" that do not follow the expected layout are skipped,
# so a feature is never built from undefined capture values.
sub next_result {
    my ($self) = @_;

    # A lexical is used so the caller's $_ is left untouched, and the loop
    # tests definedness (not truth) so a final line consisting only of "0"
    # does not end the loop prematurely.
    LINE:
    while ( defined( my $line = $self->_readline() ) ) {
        chomp $line;

        # Only header lines carry coordinates; blank lines and sequence
        # text are ignored.
        next LINE unless $line =~ /^\>/;

        # For the example header above: id is test_prot, start is 214,
        # end is 226 and score is 2.26.
        my ( $id, $start, $end, $score ) =
            $line =~ /^\>\s*(\S+)\s*\((\d+)\-(\d+)\)\s*complexity=(\S+)/;

        # The list assignment yields nothing when the pattern fails.
        next LINE unless defined $id;

        my %feature = (
            name       => $id,
            score      => $score,
            start      => $start,
            end        => $end,
            source     => "Seg",
            primary    => 'low_complexity',
            program    => "Seg",
            logic_name => 'low_complexity',
        );

        return $self->create_feature( \%feature );
    }

    # Input exhausted without finding another header line.
    return;
}
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
153
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
154
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
155 =head2 create_feature
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
156
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
157 Title : create_feature
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
158 Usage : obj->create_feature(\%feature)
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
159 Function: Internal(not to be used directly)
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
160 Returns : Bio::SeqFeature::Generic
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
161 Args : hash reference with the keys name, start, end, score, source, primary and logic_name
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
162
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
163
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
164 =cut
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
165
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
# Build a Bio::SeqFeature::Generic from a hash reference of parsed values.
#
# Args    : $feat - hash reference; the keys read here are name, start, end,
#           score, source, primary and logic_name.
# Returns : the object returned by Bio::SeqFeature::Generic->new.
sub create_feature {
    my $self = shift;
    my $feat = shift;

    # Constructor arguments, kept in a list so they are passed in a fixed
    # order; each one is copied straight from the parsed values.
    my @ctor_args = (
        -seq_id     => $feat->{name},
        -start      => $feat->{start},
        -end        => $feat->{end},
        -score      => $feat->{score},
        -source     => $feat->{source},
        -primary    => $feat->{primary},
        -logic_name => $feat->{logic_name},
    );

    my $generic = Bio::SeqFeature::Generic->new(@ctor_args);

    return $generic;
}
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
183
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
184 1;
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
185
2bc9b66ada89 Uploaded
mahtabm
parents:
diff changeset
186