changeset 5:84c6f3bcfd4a draft

Uploaded
author davidvanzessen
date Wed, 05 Aug 2015 10:22:10 -0400
parents 035600ab7d3c
children 752528a5934d
files OMT_coding.txt phenotype_gene_relations.r phenotype_gene_relations.sh
diffstat 3 files changed, 533 insertions(+), 4 deletions(-) [+]
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/OMT_coding.txt	Wed Aug 05 10:22:10 2015 -0400
@@ -0,0 +1,523 @@
+ID	OMT.name
+1	1. Malformation
+2	2. Deformation
+3	3. Dysplasia
+11	1A. Entire limb malformations
+12	1B. Handplate malformations
+21	Constriction ring sequence
+22	Trigger digits
+31	3A. Hypertrophy
+32	3B. Tumorous conditions
+110	1A. NOS entire limb malformation
+111	1A1. Proximal-distal axis (entire limb)
+112	1A2. Radio-ulnar axis (entire limb)
+113	1A4. Unspecified axis (entire limb)
+114	1A3. Dorso-ventral axis (entire limb)
+120	1B. NOS handplate malformation
+121	1B1. Proximal-distal axis (hand)
+122	1B2. Radio-ulnar axis (hand)
+123	1B3. Dorso-ventral axis (hand)
+124	1B4. Unspecified axis (hand)
+210	Constriction ring sequence
+220	Trigger digits
+311	3A1. Whole limb hypertrophy
+312	3A2. Partial Limb hypertrophy
+321	3B1. Vascular tumors
+324	3B4. Skeletal tumors
+1100	1A. NOS malformation (entire limb)
+1110	1A1. NOS prox-distal axis (entire limb)
+1111	1A1i. Brachymelia
+1112	1A1ii. Symbrachydactyly
+1113	1A1iii. Transverse deficiency
+1114	1A1iv. Intersegmental deficiency
+1115	1A1v. Limb duplication
+1120	1A2. NOS rad-uln axis (entire limb)
+1121	1A2i. Radial longitudinal deficiency
+1122	1A2ii. Ulnar longitudinal deficiency
+1124	1A2iv. Radioulnar synostosis
+1125	1A2v. Congenital radial head dislocation
+1126	1A2vi. Humeroradial synostosis
+1127	1A2vii. Madelung deformity
+1131	1A3i. Dorsal dimelia (palmar nail)
+1132	1A3ii. Ventral dimelia 
+1141	1A4i. Abberant shoulder (incl Sprengel deformity)
+1142	1A4ii. Arthrogryposis
+1200	1B. NOS malformation (hand)
+1211	1B1i. Brachydactyly
+1213	1B1iii. Transverse deficiency (no arm involvement)
+1220	1B2. NOS rad-uln axis malformation (hand)
+1221	1B2i. Radial deficiency of the hand
+1222	1B2ii. Ulnar deficiency of the hand
+1223	1B2iii. Radial polydactyly
+1224	1B2iv. Triphalangeal thumb
+1225	1B2v. Ulnar dimelia
+1226	1B2vi. Ulnar polydactyly
+1232	1B3ii. Ventral dimelia (incl hypoplastic/aplastic nail)
+1241	1B4i. Softi tissue malformations
+1242	1B4ii. Sekeltal deficiencies
+1243	1B4iii. Complex anomalies of unspecified axis (hand)
+2100	Constriction ring sequence
+2200	Trigger digits
+3111	3A1i. Hemihypertrophy
+3121	3A2i. Macrodactyly
+3211	3B1i. Hemangioma
+3212	3B1ii. Vascular malformation
+3241	3B4i. Osteochondromatosis
+3242	3B4ii. Echondromatosis
+3244	3B4iv. Epiphyseal abnormalities
+11000	1A. NOS entire limb malformation
+11100	1A1. NOS proximal-distal axis malformation
+11110	1A1i. Brachymelia
+11121	1A1iia. Poland Syndrome
+11130	1A1iii. Transverse deficiency
+11140	1A1iv. Intersegmental deficiency
+11150	1A1v. Limb duplication
+11200	1A2. NOS rad-uln axis (entire limb)
+11210	1A2i. Radial longitudinal deficiency
+11220	1A2ii. Ulnar longitudinal deficiency
+11240	1A2iv. Radioulnar synostosis
+11250	1A2v. Congenital radial head dislocation
+11260	1A2vi. Humeroradial synostosis
+11270	1A2vii. Madelung deformity
+11310	1A3i. Dorsal dimelia (palmar nail)
+11320	1A3ii. Ventral dimelia 
+11411	1A4ia. Sprengel deformity
+11412	1A4ib. Abnormal shoulder muscles
+11413	1A4ic. NOS shoulder malformation
+11420	1A4ii. Arthrogryposis
+12000	1B. NOS handplate malformation
+12110	1B1i. Brachydactyly
+12130	1B1iii. Transverse deficiency (no arm involvement)
+12200	1B2. NOS rad-uln axis malformation (hand)
+12210	1B2i. Radial deficiency of the hand
+12220	1B2ii. Ulnar deficiency of the hand
+12230	1B2iii. Radial polydactyly
+12240	1B2iv. Triphalangeal thumb
+12250	1B2v. Ulnar dimelia
+12260	1B2vi. Ulnar polydactyly
+12320	1B3ii. Ventral dimelia (incl hypoplastic/aplastic nail)
+12411	1B4ia. Syndactyly
+12412	1B4ib. Camptodactyly
+12413	1B4ic. Thumb in palm deformity
+12414	1B4id. Distal arthrogryposis
+12421	1B4iia. Clinodactyly
+12423	1B4iib. Synostosis/symphalangism
+12431	1B4iiia. Complex syndactyly
+12432	1B4iiib. Synpolydactyly
+12433	1B4iiic. Cleft Hand
+12434	1B4iiid. Apert Hand
+21000	Constriction ring sequence
+22000	Trigger digits
+31110	3A1i. Hemihypertrophy
+31210	3A2i. Macrodactyly
+32110	3B1i. Hemangioma
+32120	3B1ii. Vascular malformation
+32410	3B4i. Osteochondromatosis
+32420	3B4ii. Echondromatosis
+32440	3B4iv. Epiphyseal abnormalities
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
+	
--- a/phenotype_gene_relations.r	Fri Jul 24 07:04:56 2015 -0400
+++ b/phenotype_gene_relations.r	Wed Aug 05 10:22:10 2015 -0400
@@ -15,7 +15,8 @@
 phenotypic.groups.file = args[2]
 hpo.to.omt.file = args[3]
 inheritance.from.group.0.file = args[4]
-final.file = args[5]
+omt.coding.file = args[5]
+final.file = args[6]
 
 #get ALL_SOURCES_ALL_FREQUENCIES.TXT
 all.sources = read.table(all.sources.file, header=T, sep="\t", comment.char="#", quote = "")
@@ -67,8 +68,13 @@
 final = merge(final, subset.hand.filter.0[,c("gene.symbol", "diseaseId", "HPO.term.name")], by=c("gene.symbol", "diseaseId"), all.x=T, all.y=F)
 final$HPO.term.name.y = as.character(final$HPO.term.name.y)
 final$HPO.term.name.y[is.na(final$HPO.term.name.y)] = "No inheritance pattern available"
-final = final[,c("diseaseId", "gene.symbol", "gene.id.entrez.", "HPO.term.name.x", "variable", "GROUP.CODE", "value", "OMT.1", "OMT.2", "OMT.3", "OMT.4", "OMT.5", "HPO.term.name.y")]
-names(final) = c("diseaseId", "gene.symbol", "gene.id.entrez.", "HPO.term.name", "GROUP.CODE", "number", "ratio", "OMT.1", "OMT.2", "OMT.3", "OMT.4", "OMT.5", "inheritance")
+
+omt.coding = read.table(omt.coding.file, header=T, sep="\t", comment.char="#", quote = "", stringsAsFactors=F)
+omt.coding = rbind(omt.coding, c("0", "N/C"))
+final = merge(final, omt.coding, by.x="OMT.5", by.y="ID", all.x=T)
+
+final = final[,c("diseaseId", "gene.symbol", "gene.id.entrez.", "HPO.term.name.x", "variable", "value", "OMT.1", "OMT.2", "OMT.3", "OMT.4", "OMT.5", "HPO.term.name.y", "OMT.name")]
+names(final) = c("diseaseId", "gene.symbol", "gene.id.entrez.", "HPO.term.name", "GROUP.CODE", "ratio", "OMT.1", "OMT.2", "OMT.3", "OMT.4", "OMT.5", "inheritance", "OMT.name")
 write.table(final, file=final.file, quote=F, sep="\t", row.names=F, col.names=T)
 
 
--- a/phenotype_gene_relations.sh	Fri Jul 24 07:04:56 2015 -0400
+++ b/phenotype_gene_relations.sh	Wed Aug 05 10:22:10 2015 -0400
@@ -8,4 +8,4 @@
 inheritence_from_group_0=$4
 output=$5
 
-Rscript --verbose $dir/phenotype_gene_relations.r "$all_sources" "$phenotypic_groups" "$hpo_to_omt" "$inheritence_from_group_0" "$output" 2>&1
+Rscript --verbose $dir/phenotype_gene_relations.r "$all_sources" "$phenotypic_groups" "$hpo_to_omt" "$inheritence_from_group_0" "$dir/OMT_coding.txt" "$output" 2>&1