Mercurial > repos > mahtabm > ensemb_rep_gvl
diff variant_effect_predictor/Bio/AlignIO/pfam.pm @ 0:2bc9b66ada89 draft default tip
Uploaded
author | mahtabm |
---|---|
date | Thu, 11 Apr 2013 06:29:17 -0400 |
parents | |
children |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/variant_effect_predictor/Bio/AlignIO/pfam.pm Thu Apr 11 06:29:17 2013 -0400 @@ -0,0 +1,154 @@ +# $Id: pfam.pm,v 1.10 2002/10/22 07:38:26 lapp Exp $ +# +# BioPerl module for Bio::AlignIO::pfam + +# based on the Bio::SeqIO:: modules +# by Ewan Birney <birney@sanger.ac.uk> +# and Lincoln Stein <lstein@cshl.org> +# +# and the SimpleAlign.pm module of Ewan Birney +# +# Copyright Peter Schattner +# +# You may distribute this module under the same terms as perl itself +# _history +# September 5, 2000 +# POD documentation - main docs before the code + +=head1 NAME + +Bio::AlignIO::pfam - pfam sequence input/output stream + +=head1 SYNOPSIS + +Do not use this module directly. Use it via the L<Bio::AlignIO> class. + +=head1 DESCRIPTION + +This object can transform Bio::SimpleAlign objects to and from pfam flat +file databases. + +=head1 FEEDBACK + +=head2 Reporting Bugs + +Report bugs to the Bioperl bug tracking system to help us keep track + the bugs and their resolution. + Bug reports can be submitted via email or the web: + + bioperl-bugs@bio.perl.org + http://bugzilla.bioperl.org/ + +=head1 AUTHORS - Peter Schattner + +Email: schattner@alum.mit.edu + + +=head1 APPENDIX + +The rest of the documentation details each of the object +methods. Internal methods are usually preceded with a _ + +=cut + +# Let the code begin... + +package Bio::AlignIO::pfam; +use vars qw(@ISA); +use strict; + +use Bio::AlignIO; +use Bio::SimpleAlign; +@ISA = qw(Bio::AlignIO); + +=head2 next_aln + + Title : next_aln + Usage : $aln = $stream->next_aln() + Function: returns the next alignment in the stream + Returns : L<Bio::Align::AlignI> object + Args : NONE + +=cut + +sub next_aln { + my $self = shift; + my $entry; + my $name; + my $start; + my $end; + my $seq; + my $add; + my $acc; + my %names; + + my $aln = Bio::SimpleAlign->new(-source => 'pfam'); + + while( $entry = $self->_readline) { + chomp $entry; + $entry =~ /^\/\// && last; + if($entry !~ /^(\S+)\/(\d+)-(\d+)\s+(\S+)\s*/ ) { + $self->throw("Found a bad line [$_] in the pfam format alignment"); + next; + } + + $name = $1; + $start = $2; + $end = $3; + $seq = $4; + + + $add = new Bio::LocatableSeq('-seq'=>$seq, + '-id'=>$name, + '-start'=>$start, + '-end'=>$end, + ); + + $aln->add_seq($add); + + } + +# If $end <= 0, we have either reached the end of +# file in <> or we have encountered some other error +# + if ($end <= 0) { undef $aln;} + + return $aln; +} + + + +=head2 write_aln + + Title : write_aln + Usage : $stream->write_aln(@aln) + Function: writes the $aln object into the stream + Returns : 1 for success and 0 for error + Args : L<Bio::Align::AlignI> object + + +=cut + +sub write_aln { + my ($self,@aln) = @_; + if( @aln > 1 ) { $self->warn("Only the 1st pfam alignment will be output since the format does not support multiple alignments in the same file"); } + my $aln = shift @aln; + if( ! $aln || ! $aln->isa('Bio::Align::AlignI') ) { + $self->warn("Must provide a Bio::Align::AlignI object when calling write_aln"); + next; + } + my ($namestr,$seq,$add); + my ($maxn); + $maxn = $aln->maxdisplayname_length(); + + foreach $seq ( $aln->each_seq() ) { + $namestr = $aln->displayname($seq->get_nse()); + $add = $maxn - length($namestr) + 2; + $namestr .= " " x $add; + $self->_print (sprintf("%s %s\n",$namestr,$seq->seq())) or return; + } + $self->flush() if $self->_flush_on_write && defined $self->_fh; + return 1; +} + +1;