comparison data_manager/data_manager_snpEff_download.py @ 2:6ad9205c1307

Update to SnpEff version 3.3
author Jim Johnson <jj@umn.edu>
date Fri, 04 Oct 2013 09:09:29 -0500
parents e1d9f6a0ad53
children 8952990fcab9
comparison
equal deleted inserted replaced
1:bea875f081e8 2:6ad9205c1307
20 20
21 """ 21 """
22 # Download human database 'hg19' 22 # Download human database 'hg19'
23 java -jar snpEff.jar download -v hg19 23 java -jar snpEff.jar download -v hg19
24 24
25 <command>java -jar \$JAVA_JAR_PATH/snpEff.jar download -c \$JAVA_JAR_PATH/snpEff.config $genomeVersion > $logfile </command> 25 <command>java -jar \$SNPEFF_JAR_PATH/snpEff.jar download -c \$JAVA_JAR_PATH/snpEff.config $genomeVersion > $logfile </command>
26 26
27 snpEffectPredictor.bin 27 snpEffectPredictor.bin
28 regulation_HeLa-S3.bin 28 regulation_HeLa-S3.bin
29 regulation_pattern = 'regulation_(.+).bin' 29 regulation_pattern = 'regulation_(.+).bin'
30 30
63 return_code = proc.wait() 63 return_code = proc.wait()
64 if return_code: 64 if return_code:
65 sys.exit( return_code ) 65 sys.exit( return_code )
66 ## search data_dir/genome_version for files 66 ## search data_dir/genome_version for files
67 regulation_pattern = 'regulation_(.+).bin' 67 regulation_pattern = 'regulation_(.+).bin'
68 # annotation files that are included in snpEff by a flag
69 annotations_dict = {'nextProt.bin' : '-nextprot','motif.bin': '-motif'}
68 genome_path = os.path.join(data_dir,genome_version) 70 genome_path = os.path.join(data_dir,genome_version)
69 if os.path.isdir(genome_path): 71 if os.path.isdir(genome_path):
70 for root, dirs, files in os.walk(genome_path): 72 for root, dirs, files in os.walk(genome_path):
71 for fname in files: 73 for fname in files:
72 if fname.startswith('snpEffectPredictor'): 74 if fname.startswith('snpEffectPredictor'):
76 _add_data_table_entry( data_manager_dict, 'snpeff_genomedb', data_table_entry ) 78 _add_data_table_entry( data_manager_dict, 'snpeff_genomedb', data_table_entry )
77 else: 79 else:
78 m = re.match(regulation_pattern,fname) 80 m = re.match(regulation_pattern,fname)
79 if m: 81 if m:
80 name = m.groups()[0] 82 name = m.groups()[0]
81 data_table_entry = dict(value=genome_version, name=name) 83 data_table_entry = dict(genome=genome_version,value=name, name=name)
82 _add_data_table_entry( data_manager_dict, 'snpeff_regulationdb', data_table_entry ) 84 _add_data_table_entry( data_manager_dict, 'snpeff_regulationdb', data_table_entry )
85 elif fname in annotations_dict:
86 value = annotations_dict[fname]
87 name = value.lstrip('-')
88 data_table_entry = dict(genome=genome_version,value=value, name=name)
89 _add_data_table_entry( data_manager_dict, 'snpeff_annotations', data_table_entry )
83 return data_manager_dict 90 return data_manager_dict
84 91
85 def _add_data_table_entry( data_manager_dict, data_table, data_table_entry ): 92 def _add_data_table_entry( data_manager_dict, data_table, data_table_entry ):
86 data_manager_dict['data_tables'] = data_manager_dict.get( 'data_tables', {} ) 93 data_manager_dict['data_tables'] = data_manager_dict.get( 'data_tables', {} )
87 data_manager_dict['data_tables'][data_table] = data_manager_dict['data_tables'].get( data_table, [] ) 94 data_manager_dict['data_tables'][data_table] = data_manager_dict['data_tables'].get( data_table, [] )