annotate variant_effect_predictor/Bio/Tools/Tmhmm.pm @ 0:21066c0abaf5 draft

Uploaded
author willmclaren
date Fri, 03 Aug 2012 10:04:48 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
1 # $Id: Tmhmm.pm,v 1.6 2002/10/22 07:45:22 lapp Exp $
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
2 #
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
3 # BioPerl module for Bio::Tools::Tmhmm
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
4 #
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
5 # Copyright Balamurugan Kumarasamy
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
6 #
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
7 # You may distribute this module under the same terms as perl itself
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
8 #
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
9 # POD documentation - main docs before the code
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
10 #
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
11 # Copyright
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
12 #
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
13 # You may distribute this module under the same terms as perl itself
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
14
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
15 =head1 NAME
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
16
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
17 Bio::Tools::Tmhmm - parse TmHMM output (transmembrane HMM)
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
18
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
19 =head1 SYNOPSIS
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
20
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
21 use Bio::Tools::Tmhmm;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
22 my $parser = new Bio::Tools::Tmhmm(-fh =>$filehandle );
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
23 while( my $tmhmm_feat = $parser->next_result ) {
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
24 #do something
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
25 #eg
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
26 push @tmhmm_feat, $tmhmm_feat;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
27 }
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
28
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
29 =head1 DESCRIPTION
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
30
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
31 Parser for Tmhmm output
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
32
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
33 =head1 FEEDBACK
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
34
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
35 =head2 Mailing Lists
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
36
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
37 User feedback is an integral part of the evolution of this and other
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
38 Bioperl modules. Send your comments and suggestions preferably to
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
39 the Bioperl mailing list. Your participation is much appreciated.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
40
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
41 bioperl-l@bioperl.org - General discussion
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
42 http://bioperl.org/MailList.shtml - About the mailing lists
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
43
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
44 =head2 Reporting Bugs
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
45
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
46 Report bugs to the Bioperl bug tracking system to help us keep track
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
47 of the bugs and their resolution. Bug reports can be submitted via
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
48 email or the web:
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
49
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
50 bioperl-bugs@bioperl.org
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
51 http://bugzilla.bioperl.org/
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
52
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
53 =head1 AUTHOR - Bala
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
54
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
55 Email savikalpa@fugu-sg.org
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
56
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
57
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
58 =head1 APPENDIX
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
59
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
60 The rest of the documentation details each of the object methods.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
61 Internal methods are usually preceded with a _
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
62
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
63 =cut
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
64
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
65 package Bio::Tools::Tmhmm;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
66 use vars qw(@ISA);
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
67 use strict;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
68
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
69 use Bio::Tools::AnalysisResult;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
70 use Bio::Root::Root;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
71 use Bio::SeqFeature::FeaturePair;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
72 use Bio::Root::IO;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
73 use Bio::SeqFeature::Generic;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
74 @ISA = qw(Bio::Root::Root Bio::Root::IO Bio::Tools::AnalysisResult);
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
75
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
76
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
77
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
78 =head2 new
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
79
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
80 Title : new
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
81 Usage : my $obj = new Bio::Tools::Tmhmm();
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
82 Function: Builds a new Bio::Tools::Tmhmm object
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
83 Returns : Bio::Tools::Tmhmm
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
84 Args : -fh/-file => $val, # for initializing input, see Bio::Root::IO
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
85
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
86
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
87 =cut
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
88
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
# Constructor.
#
# Hands the complete argument list to the parent class constructor and then
# to _initialize_io() on the resulting object, and returns that object.
#
# Args    : the constructor arguments, passed through unchanged
#           (the module's POD lists -fh / -file).
# Returns : the object produced by the parent constructor.
sub new {
    my $class = shift;

    # @_ now holds only the caller's arguments; both calls see the same list.
    my $self = $class->SUPER::new(@_);
    $self->_initialize_io(@_);

    return $self;
}
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
97
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
98
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
99 =head2 next_result
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
100
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
101 Title : next_result
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
102 Usage : my $feat = $Tmhmm->next_result
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
103 Function: Get the next result set from parser data
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
104 Returns : Bio::SeqFeature::Generic
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
105 Args : none
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
106
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
107
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
108 =cut
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
109
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
# Return the next transmembrane-helix feature found in the TMHMM output.
#
# Lines are pulled one at a time through $self->_readline():
#   * blank lines are skipped;
#   * a header line such as "# 13 Length: 522" stores its first token (13)
#     through $self->_seqname();
#   * a data line such as "13 TMHMM2.0 inside 1 120" is inspected, and only
#     lines whose third column is "TMhelix" (compared case-insensitively)
#     produce a feature; every other line is ignored.
#
# Args    : none
# Returns : the value of $self->create_feature() for the next helix, or
#           nothing (undef in scalar context, the empty list in list context)
#           once _readline() stops returning lines.
sub next_result {
    my ($self) = @_;

    # A lexical line variable leaves the caller's $_ untouched, and the
    # explicit defined() keeps a line consisting of just "0" from being
    # mistaken for end of input.
    LINE:
    while ( defined( my $line = $self->_readline() ) ) {
        chomp $line;
        next LINE if $line eq '';

        # Header line: remember the sequence id for the data lines below it.
        if ( $line =~ /^#\s+(\S+)/ ) {
            $self->_seqname($1);
            next LINE;
        }

        # Data line: <id> <program> <region> <start> <end>
        next LINE
            unless $line =~ /^(\S+)\s+(\S+)\s+(\w+)\s+(\d+)\s+(\d+)/;
        my ( $line_id, $region, $start, $end ) = ( $1, $3, $4, $5 );

        next LINE unless uc($region) eq 'TMHELIX';

        # Prefer the id announced by the header; when the output carried no
        # header line, fall back to the id in the first column of this line.
        my $name = $self->_seqname;
        $name = $line_id unless defined $name;

        my %feature = (
            name       => $name,
            start      => $start,
            end        => $end,
            source     => 'tmhmm',
            primary    => 'transmembrane',
            program    => 'tmhmm',
            logic_name => 'TMHelix',
        );
        return $self->create_feature( \%feature );
    }

    # Input exhausted: signal "no more results" explicitly.
    return;
}
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
161
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
162 =head2 create_feature
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
163
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
164 Title : create_feature
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
165 Usage : obj->create_feature(\%feature)
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
166 Function: Internal(not to be used directly)
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
167 Returns : A Bio::SeqFeature::Generic object
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
168 Args : Reference to a hash with the keys name, start, end, score, source, primary and logic_name
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
169
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
170 =cut
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
171
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
# Build a Bio::SeqFeature::Generic object from a plain hash of attributes.
#
# Args    : $feat - hash reference; the keys read here are name, start, end,
#                   score, source, primary and logic_name.
# Returns : the object returned by Bio::SeqFeature::Generic->new().
sub create_feature {
    my $self = shift;
    my $feat = shift;

    # The hash key 'name' is passed on as -seq_id; every other key is
    # forwarded under its own name.
    my $generic = Bio::SeqFeature::Generic->new(
        -seq_id     => $feat->{name},
        -start      => $feat->{start},
        -end        => $feat->{end},
        -score      => $feat->{score},
        -source     => $feat->{source},
        -primary    => $feat->{primary},
        -logic_name => $feat->{logic_name},
    );

    return $generic;
}
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
187
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
188 =head2 _seqname
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
189
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
190 Title : _seqname
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
191 Usage : obj->_seqname($seqname)
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
192 Function: Internal(not to be used directly)
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
193 Returns : The sequence name currently stored in the object
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
194 Args : seqname
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
195
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
196 =cut
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
197
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
# Combined getter/setter for the value kept under the object's 'seqname' key.
#
# Args    : $seqname (optional) - when defined, replaces the stored value.
# Returns : the stored value after any update.
sub _seqname {
    my $self    = shift;
    my $seqname = shift;

    # An undefined argument means "read only": the stored value is kept.
    $self->{'seqname'} = $seqname if defined $seqname;

    return $self->{'seqname'};
}
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
209
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
210
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
211 1;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
212
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
213