diff variant_effect_predictor/Bio/Tools/Signalp.pm @ 0:2bc9b66ada89 draft default tip

Uploaded
author mahtabm
date Thu, 11 Apr 2013 06:29:17 -0400
parents
children
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/variant_effect_predictor/Bio/Tools/Signalp.pm	Thu Apr 11 06:29:17 2013 -0400
@@ -0,0 +1,251 @@
+# Parser module for SignalP Bio::Tools::Signalp
+#
+# Based on the EnsEMBL module Bio::EnsEMBL::Pipeline::Runnable::Protein::Signalp
+# originally written by Marc Sohrmann (ms2@sanger.ac.uk)
+# Written in BioPipe by Balamurugan Kumarasamy <savikalpa@fugu-sg.org>
+# Cared for by the Fugu Informatics team (fuguteam@fugu-sg.org)
+
+# You may distribute this module under the same terms as perl itself
+#
+# POD documentation - main docs before the code
+
+=head1 NAME
+
+Bio::Tools::SignalP
+
+=head1 SYNOPSIS
+
+ use Bio::Tools::SignalP;
+ my $parser = new Bio::Tools::SignalP(-fh =>$filehandle );
+ while( my $sp_feat = $parser->next_result ) {
+       #do something
+       #eg
+       push @sp_feat, $sp_feat;
+ }
+
+=head1 DESCRIPTION
+
+ Parser for SignalP output
+
+=head1 FEEDBACK
+
+=head2 Mailing Lists
+
+ User feedback is an integral part of the evolution of this and other
+ Bioperl modules. Send your comments and suggestions preferably to
+ the Bioperl mailing list.  Your participation is much appreciated.
+
+ bioperl-l@bioperl.org              - General discussion
+ http://bioperl.org/MailList.shtml  - About the mailing lists
+
+=head2 Reporting Bugs
+
+ Report bugs to the Bioperl bug tracking system to help us keep track
+ of the bugs and their resolution. Bug reports can be submitted via
+ email or the web:
+
+ bioperl-bugs@bio.perl.org
+ http://bugzilla.bioperl.org/
+
+=head1 AUTHOR
+
+ Based on the EnsEMBL module Bio::EnsEMBL::Pipeline::Runnable::Protein::Signalp
+ originally written by Marc Sohrmann (ms2@sanger.ac.uk)
+ Written in BioPipe by Balamurugan Kumarasamy <savikalpa@fugu-sg.org>
+ Cared for by the Fugu Informatics team (fuguteam@fugu-sg.org)
+
+=head1 APPENDIX
+
+ The rest of the documentation details each of the object methods.
+ Internal methods are usually preceded with a _
+
+
+=cut
+
+package Bio::Tools::Signalp;
+use vars qw(@ISA);
+use strict;
+
+use Bio::Root::Root;
+use Bio::SeqFeature::FeaturePair;
+use Bio::Root::IO;
+use Bio::SeqFeature::Generic;
+@ISA = qw(Bio::Root::Root Bio::Root::IO );
+
+
+
+=head2 new
+
+ Title   : new
+ Usage   : my $obj = new Bio::Tools::SignalP();
+ Function: Builds a new Bio::Tools::SignalP object
+ Returns : Bio::Tools::SignalP
+ Args    : -fh/-file => $val, # for initing input, see Bio::Root::IO
+
+
+=cut
+
+sub new {
+      my($class,@args) = @_;
+
+      my $self = $class->SUPER::new(@args);
+      $self->_initialize_io(@args);
+
+      return $self;
+}
+
+=head2 next_result
+
+ Title   : next_result
+ Usage   : my $feat = $signalp->next_result
+ Function: Get the next result set from parser data
+ Returns : Bio::SeqFeature::Generic
+ Args    : none
+
+
+=cut
+
+sub next_result {
+        my ($self) = @_;
+        
+        my $line;
+        # parse
+        my $id;
+        my ( $fact1, $fact2, $end);
+        while ($_=$self->_readline()) {
+           $line = $_;
+           chomp $line;
+           
+           if ($line=~/^\>(\S+)/) {
+              $id = $1;
+              $self->seqname($id);
+              next;
+           }
+           elsif ($line=~/max\.\s+Y\s+(\S+)\s+\S+\s+\S+\s+(\S+)/) {
+              $fact1 = $2;
+              $self->fact1($fact1);
+              next;
+           }
+           elsif ($line=~/mean\s+S\s+(\S+)\s+\S+\s+\S+\s+(\S+)/) {
+              $fact2 = $2;
+                 $fact1 = $self->fact1;
+                 $id = $self->seqname;
+              
+              if ($fact1 eq "YES" && $fact2 eq "YES") {
+                  
+                  my $line = $self->_readline();
+              
+                  if ($line =~ /Most likely cleavage site between pos\.\s+(\d+)/) {
+                      $end = $1;
+                  }
+                  else {
+                      $self->throw ("parsing problem in signalp");
+                  }
+                  my (%feature);
+                  $feature{name} = $id;
+                  $feature{start} = 1;
+                  $feature{end} = $end;
+                  $feature{source} = 'Signalp';
+                  $feature{primary}= 'signal_peptide';
+                  $feature{program} = 'Signalp';
+                  $feature{logic_name} = 'signal_peptide';
+                  
+                  my $new_feat = $self->create_feature (\%feature);
+                  return $new_feat;
+                  
+              }
+               next;
+               
+           }
+        
+           next;
+        
+        }
+        
+}
+
+=head2 create_feature
+
+ Title   : create_feature
+ Usage   : obj->create_feature(\%feature)
+ Function: Internal(not to be used directly)
+ Returns :
+ Args    :
+
+
+=cut
+
+sub create_feature {
+       my ($self, $feat) = @_;
+
+
+       # create feature object
+       my $feature = Bio::SeqFeature::Generic->new(
+                                                 -seq_id=>$feat->{name},
+                                                 -start       => $feat->{start},
+                                                 -end         => $feat->{end},
+                                                 -score       => $feat->{score},
+                                                 -source      => $feat->{source},
+                                                 -primary     => $feat->{primary},
+                                                 -logic_name  => $feat->{logic_name}, 
+                                               );
+           
+
+          $feature->add_tag_value('evalue',0);
+          $feature->add_tag_value('percent_id','NULL');
+          $feature->add_tag_value("hid",$feat->{primary});
+          
+          return $feature; 
+
+}
+=head2 seqname
+
+ Title   : seqname
+ Usage   : obj->seqname($name)
+ Function: Internal(not to be used directly)
+ Returns :
+ Args    :
+
+
+=cut
+
+sub seqname{
+    my ($self,$seqname)=@_;
+
+    if (defined$seqname){
+
+        $self->{'seqname'}=$seqname;
+    }
+
+    return $self->{'seqname'};
+
+}
+
+=head2 fact1
+
+ Title   : fact1
+ Usage   : obj->fact1($fact1)
+ Function: Internal(not to be used directly)
+ Returns :
+ Args    :
+
+
+=cut
+
+sub fact1{
+    my ($self,$fact1)=@_;
+
+    if (defined$fact1){
+
+       $self->{'fact1'}=$fact1;
+    }
+
+    return $self->{'fact1'};
+
+}
+
+
+
+1;
+
+