annotate genome_diversity.py @ 0:c3ba43704319 draft default tip

Uploaded
author rico
date Wed, 12 Sep 2012 14:35:13 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
c3ba43704319 Uploaded
rico
parents:
diff changeset
1 #!/usr/bin/env python
c3ba43704319 Uploaded
rico
parents:
diff changeset
2
c3ba43704319 Uploaded
rico
parents:
diff changeset
3 import sys
c3ba43704319 Uploaded
rico
parents:
diff changeset
4 import cdblib
c3ba43704319 Uploaded
rico
parents:
diff changeset
5
c3ba43704319 Uploaded
rico
parents:
diff changeset
def _openfile( filename=None, mode='r' ):
    """Open *filename* with *mode* and return the file object.

    Raises:
        RuntimeError: if open() fails with IOError; the message starts
            with "can't open file: " followed by the IOError text.
    """
    try:
        return open( filename, mode )
    except IOError as err:
        # "except ... as" is valid on Python 2.6+ and Python 3; the old
        # "except IOError, err" spelling is a SyntaxError on Python 3.
        raise RuntimeError( "can't open file: %s\n" % str( err ) )
c3ba43704319 Uploaded
rico
parents:
diff changeset
12
c3ba43704319 Uploaded
rico
parents:
diff changeset
def get_filename_from_loc( species=None, filename=None ):
    """Look up *species* in a tab-separated location file.

    Lines starting with '#' and lines with fewer than two tab-separated
    fields are ignored.  The second field of the first line whose first
    field equals *species* is returned.

    Raises:
        RuntimeError: if the file cannot be opened (from _openfile) or no
            line matches *species*.
    """
    fh = _openfile( filename )
    try:
        for line in fh:
            if line.startswith( '#' ):
                continue
            elems = line.rstrip( '\r\n' ).split( '\t' )
            if len( elems ) >= 2 and elems[0] == species:
                return elems[1]
    finally:
        # Close the handle on every exit path; it was previously leaked.
        fh.close()

    raise RuntimeError( "can't find '%s' in location file: %s\n" % ( species, filename ) )
c3ba43704319 Uploaded
rico
parents:
diff changeset
24
c3ba43704319 Uploaded
rico
parents:
diff changeset
25
c3ba43704319 Uploaded
rico
parents:
diff changeset
class SnpFile( object ):
    """Sequential reader for a tab-separated SNP file.

    The *_col arguments are 1-based column numbers; they are converted to
    0-based indexes when fields are looked up.  Lines starting with '#'
    are collected in ``self.comments`` instead of being returned as data.
    """

    def __init__( self, filename=None, seq_col=1, pos_col=2, ref_seq_col=7, ref_pos_col=8 ):
        """Open *filename* (via _openfile) and remember the column numbers."""
        self.filename = filename
        self.fh = _openfile( filename )
        self.seq_col = seq_col
        self.pos_col = pos_col
        self.ref_seq_col = ref_seq_col
        self.ref_pos_col = ref_pos_col
        self.elems = None       # fields of the current data line
        self.line = None        # current line without its line ending
        self.comments = []      # every '#' line seen so far

    def next( self ):
        """Advance to the next data line.

        Blank lines are skipped and '#' lines are appended to
        ``self.comments``.  Returns 1 once a data line has been split into
        ``self.elems``; returns None (and clears ``self.line`` and
        ``self.elems``) when the file is exhausted.

        NOTE: this is not the iterator protocol's next(); it returns a
        status flag, not the line.
        """
        while self.fh:
            try:
                # Built-in next() works on Python 2.6+ and Python 3;
                # the .next() method only exists on Python 2 file objects.
                raw = next( self.fh )
            except StopIteration:
                self.line = None
                self.elems = None
                return None
            self.line = raw.rstrip( '\r\n' )
            if not self.line:
                continue
            if self.line.startswith( '#' ):
                self.comments.append( self.line )
            else:
                self.elems = self.line.split( '\t' )
                return 1
        return None

    def get_seq_pos( self ):
        """Return (sequence, position) fields of the current line, or (None, None)."""
        if self.elems:
            return self.elems[ self.seq_col - 1 ], self.elems[ self.pos_col - 1 ]
        return None, None

    def get_ref_seq_pos( self ):
        """Return (ref sequence, ref position) fields of the current line, or (None, None)."""
        if self.elems:
            # Fixed: this used to read the non-existent attribute
            # self.ref_seq_seq and raised AttributeError on every call.
            return self.elems[ self.ref_seq_col - 1 ], self.elems[ self.ref_pos_col - 1 ]
        return None, None
c3ba43704319 Uploaded
rico
parents:
diff changeset
66
c3ba43704319 Uploaded
rico
parents:
diff changeset
67
c3ba43704319 Uploaded
rico
parents:
diff changeset
class IndexedFile( object ):
    """A data file paired with a cdb index that maps keys to offsets.

    The index value for a key is read as an integer and used as a seek
    offset into the data file.
    """

    def __init__( self, data_file=None, index_file=None ):
        """Open both files and load the whole index into a cdblib.Reader."""
        self.data_file = data_file
        self.index_file = index_file
        self.data_fh = _openfile( data_file )
        # The cdb index is binary data, so open it in binary mode; text
        # mode can corrupt it on platforms that translate line endings.
        self.index_fh = _openfile( index_file, 'rb' )
        # NOTE(review): the built-in hash() is passed as Reader's second
        # argument, presumably the hash function used when the index was
        # written -- confirm against the index builder.
        self._reader = cdblib.Reader( self.index_fh.read(), hash )

    def get_indexed_line( self, key=None ):
        """Return the data-file line stored at the offset indexed by *key*.

        Returns None when *key* is not in the index.  The data file is left
        positioned after the returned line.

        Raises:
            RuntimeError: if the indexed offset is at or past end of file.
        """
        if key not in self._reader:
            return None
        self.data_fh.seek( self._reader.getint( key ) )
        try:
            # Built-in next() works on Python 2.6+ and Python 3.
            return next( self.data_fh )
        except StopIteration:
            raise RuntimeError( 'index file out of sync for %s' % key )
c3ba43704319 Uploaded
rico
parents:
diff changeset
87
c3ba43704319 Uploaded
rico
parents:
diff changeset
class PrimersFile( IndexedFile ):
    """Indexed primers file whose entries start with a '>' header line.

    Entries are indexed by the key "<sequence> <position>"; the second and
    third whitespace-separated tokens of the header must match that key.
    """

    def get_primer_header( self, sequence=None, position=None ):
        """Return the validated header line for the entry, or None if not indexed.

        Raises:
            RuntimeError: if the indexed line is not a '>' header, has fewer
                than three tokens, or names a different sequence/position.
        """
        key = "%s %s" % ( str( sequence ), str( position ) )
        header = self.get_indexed_line( key )
        if header:
            if not header.startswith( '>' ):
                raise RuntimeError( 'primers index out of sync for %s' % key )
            elems = header.split()
            if len( elems ) < 3:
                raise RuntimeError( 'short primers header for %s' % key )
            # Compare str( sequence ) so the check agrees with how the key
            # was built; a non-string sequence used to mismatch here.
            if str( sequence ) != elems[1] or str( position ) != elems[2]:
                raise RuntimeError( 'primers index for %s finds %s %s' % ( key, elems[1], elems[2] ) )
        return header

    def get_entry( self, sequence=None, position=None ):
        """Return the header plus all following lines up to the next '>' line or EOF.

        Returns None (whatever get_primer_header returned) when the entry
        is not indexed.
        """
        entry = self.get_primer_header( sequence, position )
        if entry:
            parts = [ entry ]
            while self.data_fh:
                try:
                    line = next( self.data_fh )
                except StopIteration:
                    break
                if line.startswith( '>' ):
                    break
                parts.append( line )
            entry = ''.join( parts )
        return entry

    def get_enzymes( self, sequence=None, position=None ):
        """Return the comma-separated names on the line following the header.

        Names are stripped of surrounding whitespace and empty names are
        dropped.  Returns an empty list when the entry is not indexed.

        Raises:
            RuntimeError: if the header is the last line of the file or is
                immediately followed by another '>' header.
        """
        entry = self.get_primer_header( sequence, position )
        enzyme_list = []
        if entry:
            try:
                line = next( self.data_fh )
            except StopIteration:
                raise RuntimeError( 'primers entry for %s %s is truncated' % ( str( sequence ), str( position ) ) )
            if line.startswith( '>' ):
                raise RuntimeError( 'primers entry for %s %s is truncated' % ( str( sequence ), str( position ) ) )
            # Fixed: the rstrip() result used to be discarded.
            line = line.rstrip( '\r\n' )
            if line:
                enzyme_list = [ name.strip() for name in line.split( ',' ) if name.strip() ]
        return enzyme_list
c3ba43704319 Uploaded
rico
parents:
diff changeset
134
c3ba43704319 Uploaded
rico
parents:
diff changeset
class SnpcallsFile( IndexedFile ):
    """Indexed tab-separated SNP calls file.

    Lines are indexed by the key "<sequence> <position>"; the first two
    fields of the indexed line must match the key and the third field is
    the SNP sequence containing a bracketed allele pair.
    """

    def get_snp_seq( self, sequence=None, position=None ):
        """Return the third tab-separated field of the indexed line, or None.

        Raises:
            RuntimeError: if the line has fewer than three fields or its
                first two fields do not match the requested key.
        """
        key = "%s %s" % ( str( sequence ), str( position ) )
        line = self.get_indexed_line( key )
        if not line:
            return None
        # NOTE(review): the line ending is not stripped before splitting,
        # so with exactly three fields the returned value keeps its
        # newline -- confirm whether callers rely on that.
        elems = line.split( '\t' )
        if len( elems ) < 3:
            raise RuntimeError( 'short snpcalls line for %s' % key )
        # Compare str( sequence ) so the check agrees with how the key was built.
        if str( sequence ) != elems[0] or str( position ) != elems[1]:
            raise RuntimeError( 'snpcalls index for %s finds %s %s' % ( key, elems[0], elems[1] ) )
        return elems[2]

    def get_flanking_dna( self, sequence=None, position=None, format='fasta' ):
        """Return the flanking DNA of a SNP as a 'fasta' or 'primer3' record.

        The bracketed span of the SNP sequence is replaced by a single 'n'.
        The id line carries the sequence, position and the characters at
        offsets 1 and 3 after the '['.  For 'primer3' the record also gets
        SEQUENCE_TEMPLATE=, a SEQUENCE_TARGET line starting 5 before the
        bracket with length 11, and a terminating '=' line.

        Returns None when the SNP is not indexed.

        Raises:
            RuntimeError: for an unknown *format*, a missing '[' or ']', or
                a bracket too short to hold both allele characters.
        """
        if format not in ( 'fasta', 'primer3' ):
            raise RuntimeError( 'invalid format for flanking dna: %s' % str( format ) )

        seq = self.get_snp_seq( sequence, position )
        if not seq:
            return None

        p = seq.find( '[' )
        if p == -1:
            raise RuntimeError( 'snpcalls entry for %s %s missing left bracket: %s' % ( str( sequence ), str( position ), seq ) )
        q = seq.find( ']', p + 1 )
        if q == -1:
            raise RuntimeError( 'snpcalls entry for %s %s missing right bracket: %s' % ( str( sequence ), str( position ), seq ) )
        if q <= p + 3:
            # seq[p+3] would be the ']' itself or lie outside the bracket:
            # previously an IndexError or a silently wrong allele.
            raise RuntimeError( 'snpcalls entry for %s %s has malformed alleles: %s' % ( str( sequence ), str( position ), seq ) )
        q += 1  # first index after the closing bracket

        primer3 = ( format == 'primer3' )

        if primer3:
            flanking_seq = 'SEQUENCE_ID='
        else:
            flanking_seq = '> '
        flanking_seq += "%s %s %s %s\n" % ( str( sequence ), str( position ), seq[p+1], seq[p+3] )

        if primer3:
            flanking_seq += 'SEQUENCE_TEMPLATE='
        flanking_seq += "%sn%s\n" % ( seq[0:p], seq[q:] )

        if primer3:
            flanking_seq += "SEQUENCE_TARGET=%d,11\n=\n" % ( p - 5 )

        return flanking_seq
c3ba43704319 Uploaded
rico
parents:
diff changeset
180
c3ba43704319 Uploaded
rico
parents:
diff changeset
181
c3ba43704319 Uploaded
rico
parents:
diff changeset
182
c3ba43704319 Uploaded
rico
parents:
diff changeset
class LocationFile( object ):
    """In-memory key -> value map loaded from a tab-separated location file.

    Lines starting with '#' are ignored; every other line is split on its
    first tab and both halves are stripped.  Lines without a tab are
    skipped.  A later duplicate key overwrites an earlier one.
    """

    def __init__(self, filename):
        self.build_map(filename)

    def build_map(self, filename):
        """Read *filename* into ``self.map``; exits the process if it cannot be opened."""
        self.map = {}
        self.open_file(filename)
        try:
            for line in self.read_lines():
                elems = line.split('\t', 1)
                if len(elems) == 2:
                    self.map[ elems[0].strip() ] = elems[1].strip()
        finally:
            # Close the file even if reading raises.
            self.close_file()

    def read_lines(self):
        """Yield each non-comment line of the open file without its line ending."""
        for line in self.fh:
            if not line.startswith('#'):
                yield line.rstrip('\r\n')

    def open_file(self, filename):
        """Open *filename* for reading; on IOError report to stderr and exit with status 1."""
        self.filename = filename
        try:
            self.fh = open(filename, 'r')
        except IOError as err:
            # sys.stderr.write and "except ... as" run on both Python 2.6+
            # and Python 3, unlike "print >>" and "except IOError, err".
            sys.stderr.write("Error opening location file '%s': %s\n" % (filename, str(err)))
            sys.exit(1)

    def close_file(self):
        self.fh.close()

    def loc_file( self, key ):
        """Return the value mapped to *key*; report to stderr and exit with status 1 if absent."""
        if key in self.map:
            return self.map[key]
        sys.stderr.write("'%s' does not appear in location file '%s'\n" % (key, self.filename))
        sys.exit(1)
c3ba43704319 Uploaded
rico
parents:
diff changeset
219
c3ba43704319 Uploaded
rico
parents:
diff changeset
class ChrLens( object ):
    """Chromosome name -> integer length map loaded from a tab-separated file.

    Lines starting with '#' are ignored; every other line is split on its
    first tab and both halves are stripped.  Lines without a tab are
    skipped.  Iterating the object yields the chromosome names.
    """

    def __init__( self, chrlen_filename ):
        self.chrlen_filename = chrlen_filename
        self.build_map()

    def build_map(self):
        """Read the chromosome length file into ``self.map``.

        A line whose length field is not an integer is reported on stderr
        and skipped.
        """
        self.map = {}
        self.open_file(self.chrlen_filename)
        try:
            for line in self.read_lines():
                elems = line.split('\t', 1)
                if len(elems) != 2:
                    continue
                chrom = elems[0].strip()
                chrom_len_text = elems[1].strip()
                try:
                    chrom_len = int( chrom_len_text )
                except ValueError:
                    sys.stderr.write("Bad length '%s' for chromosome '%s' in '%s'\n" % (chrom_len_text, chrom, self.chrlen_filename))
                    # Fixed: execution used to fall through and store a
                    # stale length from an earlier line, or fail on an
                    # unbound name when the first line was bad.
                    continue
                self.map[ chrom ] = chrom_len
        finally:
            # Close the file even if reading raises.
            self.close_file()

    def read_lines(self):
        """Yield each non-comment line of the open file without its line ending."""
        for line in self.fh:
            if not line.startswith('#'):
                yield line.rstrip('\r\n')

    def open_file(self, filename):
        """Open *filename* for reading; on IOError report to stderr and exit with status 1."""
        self.filename = filename
        try:
            self.fh = open(filename, 'r')
        except IOError as err:
            # sys.stderr.write and "except ... as" run on both Python 2.6+
            # and Python 3, unlike "print >>" and "except IOError, err".
            sys.stderr.write("Error opening chromosome length file '%s': %s\n" % (filename, str(err)))
            sys.exit(1)

    def close_file(self):
        self.fh.close()

    def length( self, key ):
        """Return the length recorded for chromosome *key*, or None if unknown."""
        return self.map.get( key )

    def __iter__( self ):
        for chrom in self.map:
            yield chrom
c3ba43704319 Uploaded
rico
parents:
diff changeset
266