Mercurial > repos > mahtabm > ensembl
diff variant_effect_predictor/Bio/Tools/EPCR.pm @ 0:1f6dce3d34e0
Uploaded
author | mahtabm |
---|---|
date | Thu, 11 Apr 2013 02:01:53 -0400 |
parents | |
children |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/variant_effect_predictor/Bio/Tools/EPCR.pm Thu Apr 11 02:01:53 2013 -0400 @@ -0,0 +1,152 @@ +# $Id: EPCR.pm,v 1.8 2002/12/01 00:05:21 jason Exp $ +# +# BioPerl module for Bio::Tools::EPCR +# +# Cared for by Jason Stajich <jason@bioperl.org> +# +# Copyright Jason Stajich +# +# You may distribute this module under the same terms as perl itself + +# POD documentation - main docs before the code + +=head1 NAME + +Bio::Tools::EPCR - Parse ePCR output and make features + +=head1 SYNOPSIS + + # A simple annotation pipeline wrapper for ePCR data + # assuming ePCR data is already generated in file seq1.epcr + # and sequence data is in fasta format in file called seq1.fa + + use Bio::Tools::EPCR; + use Bio::SeqIO; + my $parser = new Bio::Tools::EPCR(-file => 'seq1.epcr'); + my $seqio = new Bio::SeqIO(-format => 'fasta', -file => 'seq1.fa'); + my $seq = $seqio->next_seq || die("cannot get a seq object from SeqIO"); + + while( my $feat = $parser->next_feature ) { + # add EPCR annotation to a sequence + $seq->add_SeqFeature($feat); + } + my $seqout = new Bio::SeqIO(-format => 'embl'); + $seqout->write_seq($seq); + + +=head1 DESCRIPTION + +This object serves as a parser for ePCR data, creating a +Bio::SeqFeatureI for each ePCR hit. These can be processed or added +as annotation to an existing Bio::SeqI object for the purposes of +automated annotation. + +=head1 FEEDBACK + +=head2 Mailing Lists + +User feedback is an integral part of the evolution of this and other +Bioperl modules. Send your comments and suggestions preferably to +the Bioperl mailing list. Your participation is much appreciated. + + bioperl-l@bioperl.org - General discussion +http://bioperl.org/MailList.shtml - About the mailing lists + +=head2 Reporting Bugs + +Report bugs to the Bioperl bug tracking system to help us keep track +of the bugs and their resolution. Bug reports can be submitted via +email or the web: + + bioperl-bugs@bioperl.org + http://bugzilla.bioperl.org/ + +=head1 AUTHOR - Jason Stajich + +Email jason@bioperl.org + +Describe contact details here + +=head1 APPENDIX + +The rest of the documentation details each of the object methods. +Internal methods are usually preceded with a _ + +=cut + + +# Let the code begin... + + +package Bio::Tools::EPCR; +use vars qw(@ISA); +use strict; + +use Bio::Root::Root; +use Bio::SeqAnalysisParserI; +use Bio::SeqFeature::FeaturePair; +use Bio::SeqFeature::Generic; + +@ISA = qw(Bio::Root::Root Bio::SeqAnalysisParserI Bio::Root::IO ); + +=head2 new + + Title : new + Usage : my $epcr = new Bio::Tools::EPCR(-file => $file); + Function: Initializes a new EPCR parser + Returns : Bio::Tools::EPCR + Args : -fh => filehandle + OR + -file => filename + +=cut + +sub new { + my($class,@args) = @_; + + my $self = $class->SUPER::new(@args); + $self->_initialize_io(@args); + + return $self; +} + +=head2 next_feature + + Title : next_feature + Usage : $seqfeature = $obj->next_feature(); + Function: Returns the next feature available in the analysis result, or + undef if there are no more features. + Example : + Returns : A Bio::SeqFeatureI implementing object, or undef if there are no + more features. + Args : none + +=cut + +sub next_feature { + my ($self) = @_; + my $line = $self->_readline; + return undef unless defined($line); + chomp($line); + my($seqname,$location,$mkrname, $rest) = split(/\s+/,$line,4); + + my ($start,$end) = ($location =~ /(\S+)\.\.(\S+)/); + + # If we require that e-PCR is run with D=1 we can detect a strand + # for now hardcoded to 0 + + my $strand = 0; + my $markerfeature = new Bio::SeqFeature::Generic ( '-start' => $start, + '-end' => $end, + '-strand' => $strand, + '-source' => 'e-PCR', + '-primary' => 'sts', + '-seq_id' => $seqname, + '-tag' => { + 'name'=> $mkrname, + 'note'=> $rest, + }); + return $markerfeature; +} + +1;