annotate variant_effect_predictor/Bio/Tools/Seg.pm @ 3:d30fa12e4cc5 default tip

Merge heads 2:a5976b2dce6f and 1:09613ce8151e which were created as a result of a recently fixed bug.
author devteam <devteam@galaxyproject.org>
date Mon, 13 Jan 2014 10:38:30 -0500
parents 1f6dce3d34e0
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
1 # $Id: Seg.pm,v 1.6 2002/10/22 07:45:22 lapp Exp $
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
2 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
3 # BioPerl module for Bio::Tools::Seg
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
4 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
5 # Copyright Balamurugan Kumarasamy
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
6 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
7 # You may distribute this module under the same terms as perl itself
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
8 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
9 # POD documentation - main docs before the code
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
10 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
11 # Copyright
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
12 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
13 # You may distribute this module under the same terms as perl itself
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
14 # POD documentation - main docs before the code
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
15
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
16 =head1 NAME
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
17
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
18 Bio::Tools::Seg - parse Seg output (filter low complexity protein sequence)
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
19
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
20 =head1 SYNOPSIS
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
21
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
22 use Bio::Tools::Seg;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
23 my $parser = Bio::Tools::Seg->new(-fh => $filehandle);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
24 while( my $seg_feat = $parser->next_result ) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
25 #do something
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
26 #eg
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
27 push @seg_feat, $seg_feat;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
28 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
29
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
30 =head1 DESCRIPTION
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
31
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
32 Parser for Seg output
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
33
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
34 =head1 FEEDBACK
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
35
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
36 =head2 Mailing Lists
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
37
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
38 User feedback is an integral part of the evolution of this and other
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
39 Bioperl modules. Send your comments and suggestions preferably to
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
40 the Bioperl mailing list. Your participation is much appreciated.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
41
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
42 bioperl-l@bioperl.org - General discussion
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
43 http://bioperl.org/MailList.shtml - About the mailing lists
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
44
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
45 =head2 Reporting Bugs
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
46
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
47 Report bugs to the Bioperl bug tracking system to help us keep track
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
48 of the bugs and their resolution. Bug reports can be submitted via
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
49 email or the web:
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
50
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
51 bioperl-bugs@bioperl.org
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
52 http://bugzilla.bioperl.org/
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
53
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
54 =head1 AUTHOR - Bala
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
55
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
56 Email savikalpa@fugu-sg.org
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
57
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
58
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
59 =head1 CONTRIBUTORS
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
60
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
61 Additional contributors names and emails here
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
62
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
63 =head1 APPENDIX
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
64
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
65 The rest of the documentation details each of the object methods.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
66 Internal methods are usually preceded with a _
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
67
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
68 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
69
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
70 package Bio::Tools::Seg;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
71 use vars qw(@ISA);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
72 use strict;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
73
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
74 use Bio::Root::Root;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
75 use Bio::SeqFeature::FeaturePair;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
76 use Bio::Root::IO;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
77 use Bio::SeqFeature::Generic;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
78 @ISA = qw(Bio::Root::Root Bio::Root::IO);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
79
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
80
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
81
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
82
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
83
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
84 =head2 new
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
85
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
86 Title : new
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
87 Usage : my $obj = Bio::Tools::Seg->new();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
88 Function: Builds a new Bio::Tools::Seg object
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
89 Returns : Bio::Tools::Seg
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
90 Args : -fh/-file => $val, # for initing input, see Bio::Root::IO
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
91
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
92
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
93 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
94
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
95
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
# Constructor: builds the object through the parent class constructor and
# then hands the same argument list (e.g. -fh / -file) to _initialize_io
# so the input stream is set up.
#
# Returns : the newly constructed object
# Args    : the constructor arguments, passed through unchanged to both
#           SUPER::new and _initialize_io
sub new {
    my $class   = shift;
    my @io_args = @_;

    my $self = $class->SUPER::new(@io_args);

    # The same arguments configure the I/O layer.
    $self->_initialize_io(@io_args);

    return $self;
}
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
104
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
105 =head2 next_result
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
106
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
107 Title : next_result
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
108 Usage : my $feat = $seg->next_result
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
109 Function: Get the next result set from parser data
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
110 Returns : Bio::SeqFeature::Generic
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
111 Args : none
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
112
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
113
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
114 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
115
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
# Scan forward through the Seg output for the next low-complexity segment
# header and turn it into a feature.
#
# A segment header looks like
#   >test_prot(214-226) complexity=2.26 (12/2.20/2.50)
# which yields the sequence id (test_prot), start (214), end (226) and
# the complexity score (2.26).  Every other line -- blank lines, sequence
# text, and ">" lines that lack the "(start-end) complexity=" part -- is
# skipped.
#
# Returns : the value of $self->create_feature for the next segment
#           header; undef (empty list in list context) when the input
#           is exhausted
# Args    : none
sub next_result {
    my ($self) = @_;

    # Test definedness rather than truth so that a line consisting of
    # just "0" does not end parsing early, and read into a lexical so the
    # caller's $_ is left untouched.
    while ( defined( my $line = $self->_readline() ) ) {
        chomp $line;
        next if $line eq '';

        # Build a feature only when the header really matches; without
        # this check the capture variables would be undefined and a
        # feature with no id/coordinates would be returned.
        next
          unless $line =~ /^\>\s*(\S+)\s*\((\d+)\-(\d+)\)\s*complexity=(\S+)/;
        my ( $id, $start, $end, $score ) = ( $1, $2, $3, $4 );

        my %feature = (
            name       => $id,
            score      => $score,
            start      => $start,
            end        => $end,
            source     => "Seg",
            primary    => 'low_complexity',
            program    => "Seg",
            logic_name => 'low_complexity',
        );

        my $new_feat = $self->create_feature( \%feature );
        return $new_feat;
    }

    # No further segment headers in the input.
    return;
}
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
153
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
154
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
155 =head2 create_feature
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
156
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
157 Title : create_feature
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
158 Usage : obj->create_feature(\%feature)
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
159 Function: Internal (not to be used directly)
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
160 Returns : Bio::SeqFeature::Generic
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
161 Args : reference to a hash with the keys name, start, end, score, source, primary and logic_name
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
162
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
163
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
164 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
165
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
# Internal helper: turns a hash of parsed segment fields into a
# Bio::SeqFeature::Generic object.
#
# Returns : the object produced by Bio::SeqFeature::Generic->new
# Args    : reference to a hash; the keys name, start, end, score,
#           source, primary and logic_name are read from it
sub create_feature {
    my ( $self, $feat ) = @_;

    # Constructor arguments, in the order the feature class is given them.
    my @ctor_args = (
        -seq_id     => $feat->{name},
        -start      => $feat->{start},
        -end        => $feat->{end},
        -score      => $feat->{score},
        -source     => $feat->{source},
        -primary    => $feat->{primary},
        -logic_name => $feat->{logic_name},
    );

    my $generic = Bio::SeqFeature::Generic->new(@ctor_args);
    return $generic;
}
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
183
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
184 1;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
185
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
186