Mercurial > repos > jjohnson > ensembl_variant_report
comparison ensembl_variant_report.py @ 8:fd612f8119a2 draft
planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/ensembl_variant_report commit f003aece24587f68b883449f278f1e601110e2ec-dirty
author | jjohnson |
---|---|
date | Tue, 17 Jul 2018 12:21:36 -0400 |
parents | d5cb252c68da |
children | 0ef485da6ba6 |
comparison
equal
deleted
inserted
replaced
7:d5cb252c68da | 8:fd612f8119a2 |
---|---|
94 ref = fields[ri] | 94 ref = fields[ri] |
95 alts = fields[ai] | 95 alts = fields[ai] |
96 dp = int(fields[di]) | 96 dp = int(fields[di]) |
97 dpr = [int(x) for x in fields[fi].split(',')] | 97 dpr = [int(x) for x in fields[fi].split(',')] |
98 for i,alt in enumerate(alts.split(',')): | 98 for i,alt in enumerate(alts.split(',')): |
99 freq = float(dpr[i+1])/float(sum(dpr)) if dpr else None | 99 freq = float(dpr[i+1])/float(dp) if dp and dpr else \ |
100 float(dpr[i+1])/float(sum(dpr)) if dpr else None | |
100 yield (transcript,pos,ref,alt,dp,freq) | 101 yield (transcript,pos,ref,alt,dp,freq) |
101 | 102 |
102 def parse_snpeff_vcf(): | 103 def parse_snpeff_vcf(): |
103 for linenum,line in enumerate(inputFile): | 104 for linenum,line in enumerate(inputFile): |
104 if line.startswith('##'): | 105 if line.startswith('##'): |
129 (alt,eff,impact,gene_name,gene_id,feature_type,transcript,biotype,exon,c_hgvs,p_hgvs,cdna,cds,aa,distance,info) = effect.split('|') | 130 (alt,eff,impact,gene_name,gene_id,feature_type,transcript,biotype,exon,c_hgvs,p_hgvs,cdna,cds,aa,distance,info) = effect.split('|') |
130 elif key == 'EFF': | 131 elif key == 'EFF': |
131 (eff, effs) = effect.rstrip(')').split('(') | 132 (eff, effs) = effect.rstrip(')').split('(') |
132 (impact, functional_class, codon_change, aa_change, aa_len, gene_name, biotype, coding, transcript, exon, alt) = effs.split('|')[0:11] | 133 (impact, functional_class, codon_change, aa_change, aa_len, gene_name, biotype, coding, transcript, exon, alt) = effs.split('|')[0:11] |
133 i = alt_list.index(alt) if alt in alt_list else 0 | 134 i = alt_list.index(alt) if alt in alt_list else 0 |
134 freq = float(dpr[i+1])/float(sum(dpr)) if dpr else None | 135 freq = float(dpr[i+1])/float(dp) if dp and dpr else \ |
136 float(dpr[i+1])/float(sum(dpr)) if dpr else None | |
135 yield (transcript,pos,ref,alt,dp,freq) | 137 yield (transcript,pos,ref,alt,dp,freq) |
136 | 138 |
137 | 139 |
138 #Process gene model | 140 #Process gene model |
139 ens_ref = None | 141 ens_ref = None |