annotate variant_effect_predictor/Bio/Tools/EPCR.pm @ 3:d30fa12e4cc5 default tip

Merge heads 2:a5976b2dce6f and 1:09613ce8151e which were created as a result of a recently fixed bug.
author devteam <devteam@galaxyproject.org>
date Mon, 13 Jan 2014 10:38:30 -0500
parents 1f6dce3d34e0
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
1 # $Id: EPCR.pm,v 1.8 2002/12/01 00:05:21 jason Exp $
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
2 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
3 # BioPerl module for Bio::Tools::EPCR
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
4 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
5 # Cared for by Jason Stajich <jason@bioperl.org>
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
6 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
7 # Copyright Jason Stajich
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
8 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
9 # You may distribute this module under the same terms as perl itself
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
10
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
11 # POD documentation - main docs before the code
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
12
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
13 =head1 NAME
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
14
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
15 Bio::Tools::EPCR - Parse ePCR output and make features
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
16
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
17 =head1 SYNOPSIS
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
18
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
19 # A simple annotation pipeline wrapper for ePCR data
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
20 # assuming ePCR data is already generated in file seq1.epcr
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
21 # and sequence data is in fasta format in file called seq1.fa
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
22
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
23 use Bio::Tools::EPCR;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
24 use Bio::SeqIO;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
25 my $parser = new Bio::Tools::EPCR(-file => 'seq1.epcr');
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
26 my $seqio = new Bio::SeqIO(-format => 'fasta', -file => 'seq1.fa');
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
27 my $seq = $seqio->next_seq || die("cannot get a seq object from SeqIO");
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
28
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
29 while( my $feat = $parser->next_feature ) {
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
30 # add EPCR annotation to a sequence
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
31 $seq->add_SeqFeature($feat);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
32 }
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
33 my $seqout = new Bio::SeqIO(-format => 'embl');
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
34 $seqout->write_seq($seq);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
35
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
36
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
37 =head1 DESCRIPTION
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
38
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
39 This object serves as a parser for ePCR data, creating a
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
40 Bio::SeqFeatureI for each ePCR hit. These can be processed or added
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
41 as annotation to an existing Bio::SeqI object for the purposes of
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
42 automated annotation.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
43
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
44 =head1 FEEDBACK
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
45
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
46 =head2 Mailing Lists
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
47
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
48 User feedback is an integral part of the evolution of this and other
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
49 Bioperl modules. Send your comments and suggestions preferably to
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
50 the Bioperl mailing list. Your participation is much appreciated.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
51
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
52 bioperl-l@bioperl.org - General discussion
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
53 http://bioperl.org/MailList.shtml - About the mailing lists
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
54
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
55 =head2 Reporting Bugs
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
56
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
57 Report bugs to the Bioperl bug tracking system to help us keep track
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
58 of the bugs and their resolution. Bug reports can be submitted via
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
59 email or the web:
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
60
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
61 bioperl-bugs@bioperl.org
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
62 http://bugzilla.bioperl.org/
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
63
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
64 =head1 AUTHOR - Jason Stajich
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
65
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
66 Email jason@bioperl.org
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
67
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
68 Describe contact details here
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
69
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
70 =head1 APPENDIX
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
71
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
72 The rest of the documentation details each of the object methods.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
73 Internal methods are usually preceded with an underscore (_).
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
74
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
75 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
76
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
77
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
78 # Let the code begin...
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
79
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
80
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
81 package Bio::Tools::EPCR;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
82 use vars qw(@ISA);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
83 use strict;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
84
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
85 use Bio::Root::Root;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
86 use Bio::SeqAnalysisParserI;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
87 use Bio::SeqFeature::FeaturePair;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
88 use Bio::SeqFeature::Generic;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
89
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
90 @ISA = qw(Bio::Root::Root Bio::SeqAnalysisParserI Bio::Root::IO );
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
91
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
92 =head2 new
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
93
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
94 Title : new
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
95 Usage : my $epcr = new Bio::Tools::EPCR(-file => $file);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
96 Function: Initializes a new EPCR parser
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
97 Returns : Bio::Tools::EPCR
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
98 Args : -fh => filehandle
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
99 OR
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
100 -file => filename
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
101
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
102 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
103
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
# new
#
# Constructor. Builds the object through the parent class constructor and
# then hands the very same argument list to _initialize_io so that the
# -file / -fh style arguments are processed for reading.
#
# Args    : the constructor arguments, passed through unchanged
# Returns : the newly created object
sub new {
    my $class = shift;
    my @args  = @_;

    # Let the superclass create the instance first ...
    my $self = $class->SUPER::new(@args);

    # ... then set up the input stream from the same arguments.
    $self->_initialize_io(@args);

    return $self;
}
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
112
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
113 =head2 next_feature
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
114
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
115 Title : next_feature
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
116 Usage : $seqfeature = $obj->next_feature();
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
117 Function: Returns the next feature available in the analysis result, or
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
118 undef if there are no more features.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
119 Example :
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
120 Returns : A Bio::SeqFeatureI implementing object, or undef if there are no
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
121 more features.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
122 Args : none
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
123
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
124 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
125
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
# next_feature
#
# Reads lines from the underlying stream (via _readline) until one can be
# turned into a feature, and returns that feature.
#
# A hit line is split on whitespace into at most four fields:
#   sequence name, location ("start..end"), marker name, rest of the line.
#
# Lines containing only whitespace are skipped silently. Lines whose second
# field does not contain a "start..end" location are skipped with a warning
# instead of being turned into a feature with undefined coordinates.
#
# Args    : none
# Returns : a Bio::SeqFeature::Generic with source 'e-PCR', primary tag
#           'sts', seq_id set to the sequence name and the tags 'name'
#           (marker name) and 'note' (rest of the line); or nothing
#           (undef in scalar context, empty list in list context) once
#           _readline returns undef.
sub next_feature {
    my ($self) = @_;

    while ( defined( my $line = $self->_readline ) ) {
        chomp($line);

        # A blank line carries no hit; do not build a feature out of it.
        next if $line !~ /\S/;

        my ( $seqname, $location, $mkrname, $rest ) =
          split( /\s+/, $line, 4 );

        # $location is undef when the line has a single field only, so
        # guard the match to avoid matching against an undefined value.
        my ( $start, $end ) =
          defined $location ? ( $location =~ /(\S+)\.\.(\S+)/ ) : ();

        unless ( defined $start && defined $end ) {
            $self->warn("Skipping unparsable e-PCR line: $line");
            next;
        }

        # If we require that e-PCR is run with D=1 we can detect a strand;
        # for now it is hardcoded to 0.
        my $strand = 0;

        return Bio::SeqFeature::Generic->new(
            '-start'   => $start,
            '-end'     => $end,
            '-strand'  => $strand,
            '-source'  => 'e-PCR',
            '-primary' => 'sts',
            '-seq_id'  => $seqname,
            '-tag'     => {
                'name' => $mkrname,
                'note' => $rest,
            },
        );
    }

    # Input exhausted. A bare return gives undef in scalar context and an
    # empty list in list context.
    return;
}
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
151
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
152 1;