annotate variant_effect_predictor/Bio/Tools/EPCR.pm @ 1:d6778b5d8382 draft default tip

Deleted selected files
author willmclaren
date Fri, 03 Aug 2012 10:05:43 -0400
parents 21066c0abaf5
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
1 # $Id: EPCR.pm,v 1.8 2002/12/01 00:05:21 jason Exp $
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
2 #
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
3 # BioPerl module for Bio::Tools::EPCR
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
4 #
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
5 # Cared for by Jason Stajich <jason@bioperl.org>
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
6 #
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
7 # Copyright Jason Stajich
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
8 #
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
9 # You may distribute this module under the same terms as perl itself
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
10
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
11 # POD documentation - main docs before the code
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
12
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
13 =head1 NAME
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
14
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
15 Bio::Tools::EPCR - Parse ePCR output and make features
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
16
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
17 =head1 SYNOPSIS
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
18
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
19 # A simple annotation pipeline wrapper for ePCR data
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
20 # assuming ePCR data is already generated in file seq1.epcr
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
21 # and sequence data is in fasta format in file called seq1.fa
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
22
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
23 use Bio::Tools::EPCR;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
24 use Bio::SeqIO;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
25 my $parser = new Bio::Tools::EPCR(-file => 'seq1.epcr');
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
26 my $seqio = new Bio::SeqIO(-format => 'fasta', -file => 'seq1.fa');
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
27 my $seq = $seqio->next_seq || die("cannot get a seq object from SeqIO");
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
28
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
29 while( my $feat = $parser->next_feature ) {
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
30 # add EPCR annotation to a sequence
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
31 $seq->add_SeqFeature($feat);
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
32 }
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
33 my $seqout = new Bio::SeqIO(-format => 'embl');
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
34 $seqout->write_seq($seq);
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
35
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
36
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
37 =head1 DESCRIPTION
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
38
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
39 This object serves as a parser for ePCR data, creating a
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
40 Bio::SeqFeatureI for each ePCR hit. These can be processed or added
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
41 as annotation to an existing Bio::SeqI object for the purposes of
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
42 automated annotation.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
43
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
44 =head1 FEEDBACK
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
45
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
46 =head2 Mailing Lists
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
47
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
48 User feedback is an integral part of the evolution of this and other
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
49 Bioperl modules. Send your comments and suggestions preferably to
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
50 the Bioperl mailing list. Your participation is much appreciated.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
51
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
52 bioperl-l@bioperl.org - General discussion
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
53 http://bioperl.org/MailList.shtml - About the mailing lists
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
54
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
55 =head2 Reporting Bugs
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
56
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
57 Report bugs to the Bioperl bug tracking system to help us keep track
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
58 of the bugs and their resolution. Bug reports can be submitted via
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
59 email or the web:
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
60
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
61 bioperl-bugs@bioperl.org
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
62 http://bugzilla.bioperl.org/
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
63
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
64 =head1 AUTHOR - Jason Stajich
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
65
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
66 Email jason@bioperl.org
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
67
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
68 Describe contact details here
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
69
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
70 =head1 APPENDIX
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
71
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
72 The rest of the documentation details each of the object methods.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
73 Internal methods are usually preceded with a _
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
74
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
75 =cut
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
76
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
77
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
78 # Let the code begin...
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
79
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
80
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
81 package Bio::Tools::EPCR;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
82 use vars qw(@ISA);
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
83 use strict;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
84
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
85 use Bio::Root::Root;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
86 use Bio::SeqAnalysisParserI;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
87 use Bio::SeqFeature::FeaturePair;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
88 use Bio::SeqFeature::Generic;
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
89
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
90 @ISA = qw(Bio::Root::Root Bio::SeqAnalysisParserI Bio::Root::IO );
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
91
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
92 =head2 new
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
93
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
94 Title : new
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
95 Usage : my $epcr = new Bio::Tools::EPCR(-file => $file);
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
96 Function: Initializes a new EPCR parser
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
97 Returns : Bio::Tools::EPCR
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
98 Args : -fh => filehandle
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
99 OR
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
100 -file => filename
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
101
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
102 =cut
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
103
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
# Constructor for the ePCR parser.
#
# All arguments are handed unchanged first to the parent class constructor
# and then to _initialize_io(), which sets up the input stream (the POD for
# this method lists -fh => filehandle or -file => filename as the accepted
# arguments).
#
# Returns the newly built parser object.
sub new {
    my $class     = shift;
    my @ctor_args = @_;

    # Build the object through the inheritance chain, then attach the input.
    my $parser = $class->SUPER::new(@ctor_args);
    $parser->_initialize_io(@ctor_args);

    return $parser;
}
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
112
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
113 =head2 next_feature
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
114
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
115 Title : next_feature
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
116 Usage : $seqfeature = $obj->next_feature();
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
117 Function: Returns the next feature available in the analysis result, or
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
118 undef if there are no more features.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
119 Example :
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
120 Returns : A Bio::SeqFeatureI implementing object, or undef if there are no
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
121 more features.
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
122 Args : none
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
123
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
124 =cut
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
125
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
# Reads the next ePCR hit from the input stream and returns it as a
# Bio::SeqFeature::Generic object.
#
# Each input line is split on whitespace into at most four fields:
#   1. sequence name          -> -seq_id
#   2. location "start..end"  -> -start / -end
#   3. marker name            -> tag 'name'
#   4. remainder of the line  -> tag 'note'
#
# Blank lines are skipped silently. Lines whose second field does not
# contain a "start..end" location are skipped with a warning, instead of
# being turned into a feature with undefined coordinates.
#
# Args    : none
# Returns : a Bio::SeqFeature::Generic object, or undef when the input is
#           exhausted.
sub next_feature {
    my ($self) = @_;

    while ( defined( my $line = $self->_readline ) ) {
        chomp($line);

        # Nothing to parse on an empty or whitespace-only line.
        next if $line !~ /\S/;

        my ( $seqname, $location, $mkrname, $rest ) =
            split( /\s+/, $line, 4 );

        # The location field must look like "start..end"; anything else
        # would leave the coordinates undefined.
        my ( $start, $end ) =
            defined $location ? ( $location =~ /(\S+)\.\.(\S+)/ ) : ();
        unless ( defined $start && defined $end ) {
            $self->warn("Skipping unparseable ePCR line: $line");
            next;
        }

        # If we require that e-PCR is run with D=1 we can detect a strand;
        # for now it is hardcoded to 0.
        my $strand = 0;

        return Bio::SeqFeature::Generic->new(
            '-start'   => $start,
            '-end'     => $end,
            '-strand'  => $strand,
            '-source'  => 'e-PCR',
            '-primary' => 'sts',
            '-seq_id'  => $seqname,
            '-tag'     => {
                'name' => $mkrname,
                'note' => $rest,
            },
        );
    }

    # End of input. An explicit undef is kept (rather than a bare return)
    # so callers in list context see the same value as before.
    return undef;
}
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
151
21066c0abaf5 Uploaded
willmclaren
parents:
diff changeset
152 1;