annotate variant_effect_predictor/Bio/SeqIO/fastq.pm @ 0:1f6dce3d34e0

Uploaded
author mahtabm
date Thu, 11 Apr 2013 02:01:53 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
1 # BioPerl module for Bio::SeqIO::fastq
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
2 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
3 # Cared for by Tony Cox <avc@sanger.ac.uk>
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
4 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
5 # Copyright Tony Cox
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
6 #
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
7 # You may distribute this module under the same terms as perl itself
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
8 # _history
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
9 # October 29, 2001 incept date
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
10
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
11 # POD documentation - main docs before the code
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
12
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
13 =head1 NAME
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
14
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
15 Bio::SeqIO::fastq - fastq sequence input/output stream
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
16
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
17 =head1 SYNOPSIS
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
18
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
19 Do not use this module directly. Use it via the Bio::SeqIO class.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
20
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
21 =head1 DESCRIPTION
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
22
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
23 This object can transform Bio::Seq and Bio::Seq::SeqWithQuality
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
24 objects to and from fastq flat file databases.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
25
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
26 Fastq is a file format used frequently at the Sanger Centre to bundle
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
27 a fasta sequence and its quality data. A typical fastq entry takes
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
28 the form:
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
29
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
30 @HCDPQ1D0501
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
31 GATTTGGGGTTCAAAGCAGTATCGATCAAATAGTAAATCCATTTGTTCAACTCACAGTTT.....
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
32 +HCDPQ1D0501
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
33 !''*((((***+))%%%++)(%%%%).1***-+*''))**55CCF>>>>>>CCCCCCC65.....
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
34
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
35 Fastq files have sequence and quality data on a single line and the
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
36 quality values are single-byte encoded. To retrieve the decimal values
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
37 for qualities you need to subtract 33 (or Octal 41) from each byte and
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
38 then convert to a '2 digit + 1 space' integer. You can check if 33 is
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
39 the right number because the first byte which is always '!'
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
40 corresponds to a quality value of 0.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
41
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
42 =head1 FEEDBACK
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
43
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
44 =head2 Mailing Lists
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
45
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
46 User feedback is an integral part of the evolution of this and other
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
47 Bioperl modules. Send your comments and suggestions preferably to one
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
48 of the Bioperl mailing lists. Your participation is much appreciated.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
49
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
50 bioperl-l@bioperl.org - General discussion
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
51 http://bioperl.org/MailList.shtml - About the mailing lists
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
52
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
53 =head2 Reporting Bugs
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
54
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
55 Report bugs to the Bioperl bug tracking system to help us keep track
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
56 of the bugs and their resolution.
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
57 Bug reports can be submitted via email or the web:
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
58
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
59 bioperl-bugs@bio.perl.org
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
60 http://bugzilla.bioperl.org/
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
61
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
62 =head1 AUTHORS - Tony Cox
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
63
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
64 Email: avc@sanger.ac.uk
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
65
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
66
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
67 =head1 APPENDIX
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
68
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
69 The rest of the documentation details each of the object
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
70 methods. Internal methods are usually preceded with a _
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
71
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
72 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
73
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
74 # Let the code begin...
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
75
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
76 package Bio::SeqIO::fastq;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
77 use vars qw(@ISA);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
78 use strict;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
79 # Object preamble - inherits from Bio::SeqIO
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
80
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
81 use Bio::SeqIO;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
82 use Bio::Seq::SeqFactory;
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
83
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
84 @ISA = qw(Bio::SeqIO);
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
85
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
# Initialise the stream through the parent class and make sure a sequence
# factory is available.
#
# Args   : @args - passed through unchanged to SUPER::_initialize
# Effect : if no sequence factory is defined once the parent initialiser has
#          run, installs a Bio::Seq::SeqFactory of type
#          'Bio::Seq::SeqWithQuality' using this stream's verbosity.
sub _initialize {
    my ($self, @args) = @_;
    $self->SUPER::_initialize(@args);

    if (!defined $self->sequence_factory) {
        # Direct class-method call rather than the indirect-object form
        # "new Bio::Seq::SeqFactory(...)", whose parse depends on which
        # names happen to be in scope at compile time.
        $self->sequence_factory(
            Bio::Seq::SeqFactory->new(
                -verbose => $self->verbose(),
                -type    => 'Bio::Seq::SeqWithQuality',
            )
        );
    }
}
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
93
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
94
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
95 =head2 next_seq
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
96
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
97 Title : next_seq
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
98 Usage : $seq = $stream->next_seq()
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
99 Function: returns the next sequence in the stream
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
100 Returns : Bio::Seq::SeqWithQuality object
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
101 Args : NONE
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
102
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
103 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
104
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
# Read the next record from the stream and build a sequence object from it.
#
# Records are read with the input record separator set to "\n@", so each
# read ends at a newline that is immediately followed by '@'.
# NOTE(review): '@' is also a possible quality character (value 31 with the
# offset of 33 used below), so a quality line that starts with '@' would be
# cut into a bogus record by this separator - confirm inputs cannot contain
# such lines.
#
# Args    : none
# Returns : the object built by $self->sequence_factory->create, or nothing
#           when _readline yields no more data
# Throws  : through $self->throw when the record or its header line does
#           not match the expected layout
# Warns   : through $self->warn when the sequence and quality strings differ
#           in length (the record is still returned)
sub next_seq {
    my ($self) = @_;
    local $/ = "\n\@";

    my $entry = $self->_readline;
    return unless $entry;

    if ($entry eq '@') {    # very first one
        $entry = $self->_readline;
        return unless $entry;
    }

    # Layout: header line, sequence (anything up to the '+' line, must not
    # contain '@'), '+' line, then the quality text up to the last newline.
    # The text of the '+' line is matched but not needed afterwards.
    my ($top, $sequence, undef, $qualsequence) = $entry =~ /^
        \@?(.+?)\n
        ([^\@]*?)\n
        \+?(.+?)\n
        (.*)\n
    /xs
        or $self->throw("Can't parse fastq entry");

    # (\S+) always captures at least one character, so $id is never empty
    # once this match has succeeded.
    my ($id, $fulldesc) = $top =~ /^\s*(\S+)\s*(.*)/
        or $self->throw("Can't parse fastq header");

    $sequence     =~ s/\s//g;    # Remove whitespace
    $qualsequence =~ s/\s//g;

    if (length($sequence) != length($qualsequence)) {
        $self->warn("Fastq sequence/quality data length mismatch error\n");
        # Built as ONE string so that no part of the message depends on how
        # warn() treats additional arguments.
        $self->warn(
                "Sequence: $top, seq length: "
              . length($sequence)
              . " Qual length: "
              . length($qualsequence)
              . " \n"
        );
        $self->warn("$sequence\n");
        $self->warn("$qualsequence\n");
        $self->warn("FROM ENTRY: \n\n$entry\n");
    }

    # Decode every quality byte (byte value minus 33) into a decimal number
    # followed by a single space. Stays undef when there is no quality text.
    my $qual;
    for my $char (split //, $qualsequence) {
        $qual .= (unpack('C', $char) - 33) . ' ';
    }

    # For empty sequences we need to know the molecule type; otherwise the
    # alphabet is deliberately left undefined when creating the object.
    my $alphabet = $self->alphabet();
    if (length($sequence) == 0) {
        $alphabet = 'dna' unless defined $alphabet;    # default to dna
    }
    else {
        $alphabet = undef;
    }

    # create the SeqWithQuality object
    my $seq = $self->sequence_factory->create(
        -qual       => $qual,
        -seq        => $sequence,
        -id         => $id,
        -primary_id => $id,
        -desc       => $fulldesc,
        -alphabet   => $alphabet,
    );

    # if there wasn't one before, set the guessed type
    $self->alphabet($seq->alphabet());

    return $seq;
}
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
171
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
172 =head2 write_seq
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
173
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
174 Title : write_seq
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
175 Usage : $stream->write_seq(@seq)
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
176 Function: writes the $seq object into the stream
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
177 Returns : 1 for success and 0 for error
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
178 Args : Bio::Seq::SeqWithQuality or Bio::Seq object
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
179
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
180
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
181 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
182
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
# Write the sequence part of each object to the stream: a ">" header line
# (display id, plus the description with newlines removed when there is
# one) followed by the sequence broken into lines of at most 60 characters.
# An empty sequence is written as a single empty line.
#
# Args    : @seq - objects providing display_id() and seq(), optionally
#           desc()
# Returns : 1 when every record was printed; returns early with nothing as
#           soon as $self->_print reports failure
sub write_seq {
    my ($self, @seq) = @_;

    for my $record (@seq) {
        my $residues = $record->seq;
        my $header   = $record->display_id();

        if ($record->can('desc')) {
            my $desc = $record->desc();
            if ($desc) {
                $desc =~ s/\n//g;
                $header .= " $desc";
            }
        }

        if (length($residues) > 0) {
            # Terminate every run of up to 60 characters with a newline.
            $residues =~ s/(.{1,60})/$1\n/g;
        }
        else {
            $residues = "\n";
        }

        return unless $self->_print(">", $header, "\n", $residues);
    }

    if ($self->_flush_on_write && defined $self->_fh) {
        $self->flush;
    }
    return 1;
}
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
204
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
205 =head2 write_qual
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
206
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
207 Title : write_qual
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
208 Usage : $stream->write_qual(@seq)
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
209 Function: writes the $seq object into the stream
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
210 Returns : 1 for success and 0 for error
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
211 Args : Bio::Seq::SeqWithQuality object
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
212
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
213
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
214 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
215
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
# Write the quality values of each object to the stream: a ">" header line
# (display id, plus the description with newlines removed when there is
# one) followed by the values separated by single spaces. A newline is
# inserted each time the accumulated text grows past the next multiple of
# 60 characters.
#
# Args    : @seq - objects to write; any object that is not a
#           Bio::Seq::SeqWithQuality is skipped with a warning
# Returns : 1 when all records were processed; returns early with nothing
#           as soon as $self->_print reports failure
sub write_qual {
    my ($self, @seq) = @_;

    foreach my $seq (@seq) {
        unless ($seq->isa("Bio::Seq::SeqWithQuality")) {
            # The message used to read "You can write ...", which stated the
            # opposite of what is meant.
            warn("You can't write FASTQ without supplying a Bio::Seq::SeqWithQuality object! ", ref($seq), "\n");
            next;
        }

        my @qual = @{ $seq->qual };
        my $top  = $seq->display_id();
        if ($seq->can('desc') and my $desc = $seq->desc()) {
            $desc =~ s/\n//g;
            $top .= " $desc";
        }

        my $qual = "";
        if (@qual) {
            # $max is a threshold on the length of the whole accumulated
            # string (including the newlines already added), not on the
            # length of the current line.
            my $max = 60;
            for my $score (@qual) {
                $qual .= $score . " ";
                if (length($qual) > $max) {
                    $qual .= "\n";
                    $max += 60;
                }
            }
        }
        else {
            $qual = "\n";
        }

        $self->_print(">", $top, "\n", $qual, "\n") or return;
    }

    # Same flush-on-write handling as write_seq.
    $self->flush if $self->_flush_on_write && defined $self->_fh;
    return 1;
}
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
247
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
248 =head2 write_fastq
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
249
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
250 Title : write_fastq
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
251 Usage : $stream->write_fastq(@seq)
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
252 Function: writes the $seq object into the stream
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
253 Returns : 1 for success and 0 for error
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
254 Args : Bio::Seq::SeqWithQuality object
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
255
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
256
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
257 =cut
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
258
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
# Write each object to the stream as a four-line record:
#
#   @<display id> [description]
#   <sequence>
#   +<display id> [description]
#   <quality string, one character chr(value + 33) per quality value>
#
# An empty (or undefined) sequence and an empty quality list are written as
# empty lines, so every record occupies exactly four lines.
#
# Args    : @seq - objects to write; any object that is not a
#           Bio::Seq::SeqWithQuality is skipped with a warning
# Returns : 1 when all records were processed; returns early with nothing
#           as soon as $self->_print reports failure
sub write_fastq {
    my ($self, @seq) = @_;

    foreach my $seq (@seq) {
        unless ($seq->isa("Bio::Seq::SeqWithQuality")) {
            # The message used to read "You can write ...", which stated the
            # opposite of what is meant.
            warn("You can't write FASTQ without supplying a Bio::Seq::SeqWithQuality object! ", ref($seq), "\n");
            next;
        }

        my $str = $seq->seq;
        $str = '' unless defined $str;

        my @qual = @{ $seq->qual };
        my $top  = $seq->display_id();
        if ($seq->can('desc') and my $desc = $seq->desc()) {
            $desc =~ s/\n//g;
            $top .= " $desc";
        }

        # One character per quality value, offset by 33.
        my $qual = join '', map { chr($_ + 33) } @qual;

        # The line terminators are added here only; empty data must not
        # carry a newline of its own or the record gains blank lines.
        $self->_print("\@", $top, "\n", $str,  "\n") or return;
        $self->_print("+",  $top, "\n", $qual, "\n") or return;
    }

    # Same flush-on-write handling as write_seq.
    $self->flush if $self->_flush_on_write && defined $self->_fh;
    return 1;
}
1f6dce3d34e0 Uploaded
mahtabm
parents:
diff changeset
290 1;