Mercurial > repos > elixir-it > corgat_funct_annot
changeset 1:40b81942976a draft default tip
Uploaded
author | elixir-it |
---|---|
date | Tue, 16 Feb 2021 09:14:20 +0000 |
parents | 7e7168ebc150 |
children | |
files | FunAnn/annotate.pl |
diffstat | 1 files changed, 21 insertions(+), 10 deletions(-) [+] |
line wrap: on
line diff
```diff
--- a/FunAnn/annotate.pl Fri Oct 30 13:38:39 2020 +0000
+++ b/FunAnn/annotate.pl Tue Feb 16 09:14:20 2021 +0000
@@ -1,10 +1,10 @@
 $fss=13468;
-unless (-e "CorGAT")
-
+unless (-e "GCF_009858895.2_ASM985889v3_genomic.fna")
 {
- system("wget -i https://raw.githubusercontent.com/matteo14c/CorGAT_galaxy/dev/ann.txt");
- system("gzip -d GCF_009858895.2_ASM985889v3_genomic.fna.gz");
+
+ system("wget -i https://raw.githubusercontent.com/matteo14c/CorGAT_galaxy/master/ann.txt");
+ system("gzip -d GCF_009858895.2_ASM985889v3_genomic.fna.gz");
 }
 $gen_code="genetic_code";
@@ -16,7 +16,7 @@
 $code{$triplet}=$oneL;
 }
-$genome="GCF_009858895.2_ASM985889v3_genomic.fna";
+$genome="GCF_009858895.2_ASM985889v3_genomic.fna ";
 die("need reference genome file in the current folder\n") unless -e "GCF_009858895.2_ASM985889v3_genomic.fna";
 open(IN,$genome);
 while(<IN>)
@@ -58,10 +58,10 @@
 $res=$seq_res[$i];
 }
 }
-%AF_data=%{read_simple_table("af_data_new.csv")};
+%AF_data=%{read_simple_table("AF_current.csv")};
 %MFE_data=%{read_simple_table("MFE_annot.csv")};
 %epi_data=%{read_epitopes("epitopes_annot.csv")};
-%hyphy_data=%{read_hyphy("hyphy_novel.csv")};
+%hyphy_data=%{read_hyphy("hyphy_current.csv")};
@@ -172,7 +172,7 @@
 }elsif ($mod==0){
 $triplet=substr($seq,$pos-3,3);
 @Bs=split('',$triplet);
- die("3\n $triplet b:$Bs[2] r:$ref")unless ($Bs[2] eq $ref);
+ die("$_ 3\n $triplet b:$Bs[2] r:$ref")unless ($Bs[2] eq $ref);
 $Bs[2]=$alt;
 }
 #print "$pos_inG $relpos $mod @Bs\n";
@@ -280,11 +280,22 @@
 {
 $eff.="Ins";
 $Talt=(translate($Calt,\%code))[1];
+ if ($Cref=~/[ACTG]{1,}/)
+ {
+ $Cref=~s/\.//g;
+ $Tref=(translate($Cref,\%code))[1];
+ }
+
 }
 if ($alt=~/\./)
 {
 $eff.="Del";
 $Tref=(translate($Cref,\%code))[1];
+ if ($Calt=~/[ACTG]{1,}/)
+ {
+ $Calt=~s/\.//g;
+ $Talt=(translate($Calt,\%code))[1];
+ }
 }
 if ($eff=~/Del/)
 {
@@ -388,9 +399,9 @@
 ($gene,$pos,@annot)=(split(/\,/));
 foreach $a (@annot)
 {
+ $a=~s/{//g;
+ $a=~s/}//g;
 ($ref,$key)=(split(/\:/,$a));
- $ref=~s/{//g;
- $ref=~s/}//g;
 $ref=~s/"//g;
 $key=~s/"//g;
 #print "$gene $pos $ref $key\n";
```