# ESAM

Data extracted from [Lecca M, et al. (2023) Bi-allelic variants in the ESAM tight-junction gene cause a neurodevelopmental disorder associated with fetal intracranial hemorrhage. Am J Hum Genet ;110(4):681-690.  PMID:36996813](https://pubmed.ncbi.nlm.nih.gov/36996813/)

In [1]:
import pandas as pd
pd.set_option('display.max_colwidth', None) # show entire column contents, important!
from IPython.display import display, HTML
from pyphetools.creation import *
from pyphetools.visualization import *
from pyphetools.validation import *
import pyphetools
print(f"Using pyphetools version {pyphetools.__version__}")

Using pyphetools version 0.9.15


In [2]:
PMID = "PMID:36996813"
title = "Bi-allelic variants in the ESAM tight-junction gene cause a neurodevelopmental disorder associated with fetal intracranial hemorrhage"
cite = Citation(pmid=PMID, title=title)
parser = HpoParser("../hp.json")
hpo_cr = parser.get_hpo_concept_recognizer()
hpo_version = parser.get_version()
hpo_ontology = parser.get_ontology()
metadata = MetaData(created_by="ORCID:0000-0002-5648-2155", citation=cite)
metadata.default_versions_with_hpo(version=hpo_version)
print(f"HPO version {hpo_version}")

HPO version 2023-10-09


In [3]:
df = pd.read_excel("input/esam_lecca_2023.xlsx");
#df.head()
dft = df.transpose()
dft.columns = dft.iloc[0]
dft.drop(dft.index[0], inplace=True)
dft.head()
dft.index  # first check the index
dft['individual_id'] = dft.index  # Set the new column 'patient_id' to be identical to the contents of the index
#dft.head() # c

In [4]:
generator = SimpleColumnMapperGenerator(df=dft, hpo_cr=hpo_cr, observed="+", excluded="-")
column_mapper_d = generator.try_mapping_columns()
display(HTML(generator.to_html()))

Result,Columns
Mapped,Microcephaly; Delayed speech and language development; Hypotonia; Spasticity; Epilepsy; Dilation of lateral ventricles; Thin corpus callosum; Abnormal myelination; Hydrocephalus
Unmapped,ESAM variant (NM_138961.3); NM_138961.3; Location; ACMG classification; ROH (GRCh38/hg38); Sequencing analysis; Chromosomal microarray analysis; Further familial segregation data ; Sex; Geographical origin; Consanguinity; Onset of symptoms; Current age; Gestational age at delivery; Mode of delivery; BirthWeight; BirthHeight; BirthOFC ; APGAR score; Age; Weight; Height; OFC; Dysmorphic features; Global developmental delay/unspecified intellectual disability; Intracranial; Retinal; Other_findings; individual_id


In [5]:
#res = OptionColumnMapper.autoformat(df=dft, concept_recognizer=hpo_cr, omit_columns=generator.get_mapped_columns())
#print(res)

In [6]:
birthweight_d = {
 '2150 g (<3rd percentile)': 'Small for gestational age',
}
birthweight_Mapper = OptionColumnMapper(concept_recognizer=hpo_cr, option_d=birthweight_d)
birthweight_Mapper.preview_column(dft['BirthWeight'])
column_mapper_d['BirthWeight'] = birthweight_Mapper

In [7]:
weight_d = {
 '12 kg (<3rd percentile)': 'Decreased body weight',
 '7.6 kg (<3rd percentile)': 'Decreased body weight',
 '8.07 kg (<3rd percentile)': 'Decreased body weight',
 '17 kg (<3rd percentile)': 'Decreased body weight',
 '7.9 kg (<3rd percentile)': 'Decreased body weight',
}
weight_Mapper = OptionColumnMapper(concept_recognizer=hpo_cr, option_d=weight_d)
weight_Mapper.preview_column(dft['Weight'])
column_mapper_d['Weight'] = weight_Mapper

In [8]:
height_d = {
 '78 cm (<3rd percentile)': 'Short stature',
 '97 cm (<3rd percentile)': 'Short stature',
 '73 cm (<3rd percentile)': 'Short stature',
}
heightMapper = OptionColumnMapper(concept_recognizer=hpo_cr, option_d=height_d)
heightMapper.preview_column(dft['Height'])
column_mapper_d['Height'] = heightMapper

In [9]:
# Microcephaly HP:0000252
microcephaly_Mapper = SimpleColumnMapper(hpo_id="HP:0000252", hpo_label="Microcephaly", observed="+", excluded="-")
microcephaly_Mapper.preview_column(dft['Microcephaly'])
column_mapper_d['Microcephaly'] = microcephaly_Mapper

In [10]:
dysmorphic_features_d = {'Bitemporal narrowing': 'Narrow forehead',
 'Highly arched eyebrow': 'Highly arched eyebrow',
 'Long eyelashes': 'Long eyelashes',
 'Bulbous nasal tip': 'Bulbous nose',
 'Fleshy and everted lower lip vermilion': 'Everted lower lip vermilion',
 'Upslanted palpebral fissure': 'Upslanted palpebral fissure',
 'Microretrognathia': 'Microretrognathia',
 'Synophrys': 'Synophrys',
 'Full cheeks': 'Full cheeks',
 'Hypertrichosis': 'Hypertrichosis',
 'Triangular face': 'Triangular face',
 'Smooth philtrum': 'Smooth philtrum',
 'Prominent chin': 'Mandibular prognathia',
 'High palate': 'High palate',
 'narrow palate': 'Narrow palate',
 'Tented upper lip vermilion': 'Tented upper lip vermilion',
 'Hammertoe': 'Hammertoe',
 'Telecanthus': 'Telecanthus',
 'Wide nasal bridge': 'Wide nasal bridge',
 'Finger joint hypermobility': 'Finger joint hypermobility',
 'Talipes equinovarus': 'Talipes equinovarus',
 'Amblyopia': 'Amblyopia',
 'Flat philtrum': 'Smooth philtrum',
 'Upslanted palpebral fissures': 'Upslanted palpebral fissure',
 'Broad forehead': 'Broad forehead',
 'Undescended testicle': 'Cryptorchidism',
 'Highly arched eyebrows': 'Highly arched eyebrow',
 'Low posteriorly rotated ears': 'Posteriorly rotated ears',
 'Anteverted nares': 'Anteverted nares',
}
dysmorphic_featuresMapper = OptionColumnMapper(concept_recognizer=hpo_cr, option_d=dysmorphic_features_d)
dysmorphic_featuresMapper.preview_column(dft['Dysmorphic features'])
column_mapper_d['Dysmorphic features'] = dysmorphic_featuresMapper

In [11]:
gdd_d = {'+ (severe)': 'Severe global developmental delay',
 'No walking': 'Inability to walk',
 'Poor head control': 'Poor head control',
 'No sitting': 'Delayed ability to sit',
 '[@[Individual 7]]No walking': 'Inability to walk',
 '(does not sit nor roll over)': 'Delayed ability to sit',
}
gddMapper = OptionColumnMapper(concept_recognizer=hpo_cr, option_d=gdd_d)
gddMapper.preview_column(dft['Global developmental delay/unspecified intellectual disability'])
column_mapper_d['Global developmental delay/unspecified intellectual disability'] = gddMapper

In [12]:
delayed_speech_and_language_development_d = {'+ (severe)': 'Delayed speech and language development',
                                             '+': 'Delayed speech and language development',
}
delayed_speech_and_language_developmentMapper = OptionColumnMapper(concept_recognizer=hpo_cr, option_d=delayed_speech_and_language_development_d)
delayed_speech_and_language_developmentMapper.preview_column(dft['Delayed speech and language development'])
column_mapper_d['Delayed speech and language development'] = delayed_speech_and_language_developmentMapper

In [13]:
hypotonia__d = {'+ (neonatal)': 'Hypotonia',
 'neonatal': 'Hypotonia',
 '+': 'Hypotonia',
 }
hypotonia_Mapper = OptionColumnMapper(concept_recognizer=hpo_cr, option_d=hypotonia__d)
hypotonia_Mapper.preview_column(dft['Hypotonia'])
column_mapper_d['Hypotonia'] = hypotonia_Mapper

In [14]:
spasticity__d = {'+ (spastic tetraparesis)': 'Spastic tetraparesis',
 '+ (spastic tetraparesis': 'Spastic tetraparesis',
 'hyperreflexia)': 'Hyperreflexia',
 '+  (spastic tetraparesis)': 'Spastic tetraparesis',
 '+ (dystonia)': 'Dystonia',
 '+ (limb hypertonia)': 'Limb hypertonia',
}
spasticity_Mapper = OptionColumnMapper(concept_recognizer=hpo_cr, option_d=spasticity__d)
spasticity_Mapper.preview_column(dft['Spasticity'])
column_mapper_d['Spasticity'] = spasticity_Mapper

In [15]:
epilepsy_d = {'+ (focal)': 'Focal-onset seizure',
 '+': 'Seizure',
 '+ (focal': 'Focal-onset seizure',
 'myoclonic) \nHypsarrhythmia': 'Hypsarrhythmia',
 'myoclonic) Hypsarrhythmia': 'Hypsarrhythmia',
 '+ (generalized tonic-clonic seizures)': 'Bilateral tonic-clonic seizure',
}
epilepsyMapper = OptionColumnMapper(concept_recognizer=hpo_cr, option_d=epilepsy_d)
epilepsyMapper.preview_column(dft['Epilepsy'])
column_mapper_d['Epilepsy'] = epilepsyMapper

In [16]:
dilation_of_lateral_ventricles__d = {'+': 'Dilated third ventricle',
 '+ (lateral and 3rd ventricles)': ["Dilated third ventricle", "Lateral ventricle dilatation"],
}
dilation_of_lateral_ventricles_Mapper = OptionColumnMapper(concept_recognizer=hpo_cr, option_d=dilation_of_lateral_ventricles__d)
dilation_of_lateral_ventricles_Mapper.preview_column(dft['Dilation of lateral ventricles'])
column_mapper_d['Dilation of lateral ventricles'] = dilation_of_lateral_ventricles_Mapper

In [17]:
thin_corpus_callosum_d = {'+ (atrophy)': ["Corpus callosum atrophy", 'Thin corpus callosum'],
 '+ (partial absence of the septum pellucidum)': ['Thin corpus callosum','Partial absence of the septum pellucidum'],
 '+': 'Thin corpus callosum',
}
excluded = {'-': 'Thin corpus callosum'}
thin_corpus_callosumMapper = OptionColumnMapper(concept_recognizer=hpo_cr, option_d=thin_corpus_callosum_d, excluded_d=excluded)
thin_corpus_callosumMapper.preview_column(dft['Thin corpus callosum'])
column_mapper_d['Thin corpus callosum'] = thin_corpus_callosumMapper

In [18]:
abnormal_myelination_d = {'+ (FWML)': 'Abnormal CNS myelination',
 '+ (FWML - frontoparietal)': 'Abnormal CNS myelination',
 '+ (FWML - periventricular)': 'Abnormal CNS myelination',
 '+ (dysgiria/polymicrogyria': 'Polymicrogyria',
 'white matter volume loss)': 'Reduced cerebral white matter volume',
}
abnormal_myelinationMapper = OptionColumnMapper(concept_recognizer=hpo_cr, option_d=abnormal_myelination_d)
abnormal_myelinationMapper.preview_column(dft['Abnormal myelination'])
column_mapper_d['Abnormal myelination'] = abnormal_myelinationMapper

In [19]:
hydrocephalus_d = {'+ (prenatal)': 'Hydrocephalus',
 '+ (colpocephaly)': 'Colpocephaly',
 '+ (hydranencephaly)': 'Hydranencephaly',
 '+': 'Hydrocephalus',
 '+ (congenital)': 'Hydrocephalus'}
hydrocephalusMapper = OptionColumnMapper(concept_recognizer=hpo_cr, option_d=hydrocephalus_d)
hydrocephalusMapper.preview_column(dft['Hydrocephalus'])
column_mapper_d['Hydrocephalus'] = hydrocephalusMapper

In [20]:
intracranial_d = {'Intracranial hemorrhage (prenatal)': 'Intracranial hemorrhage',
 'Porencephaly': 'Porencephalic cyst',

 'Intracranial hemorrhage': 'Intracranial hemorrhage',
 'Periventricular leukomalacia': 'Periventricular leukomalacia',
 'Cerebral calcification': 'Cerebral calcification',
 'Subependymal periventricular and lenticular nucleus calcifications': 'Intracerebral periventricular calcifications',
 'Bilateral periventricular calcifications': 'Intracerebral periventricular calcifications',
 'Severe cerebral edema': 'Cerebral edema',
 'Diffuse cerebral gliosis': 'Gliosis',
 'Multifocal cerebral white matter abnormalities': 'Multifocal cerebral white matter abnormalities',
 #'Karyorrhexis in the pontine nuclei and hippocampus (dentate gyrus)': 'PLACEHOLDER',
 'Intraparenchymal and periventricular hemorrhages': 'Cerebral hemorrhage',
 'Cerebral calcifications': 'Cerebral calcification',
 'Porencephaly and cerebral cysts': 'Porencephalic cyst',
 'Hemorrahgic ischemic lesions of white matter': 'Cerebral hemorrhage',
 'Cerebral gliosis': 'Gliosis',
 'Calcifications of basal ganglia and thalami': 'Basal ganglia calcification',
 'Periventricular cysts': 'Periventricular cysts',
}
intracranialMapper = OptionColumnMapper(concept_recognizer=hpo_cr, option_d=intracranial_d)
intracranialMapper.preview_column(dft['Intracranial'])
column_mapper_d['Intracranial'] = intracranialMapper

In [21]:
retinal_d = {
 'Arterial tortuosity': 'Arterial tortuosity',
 'Retinal hemorrhage (bilateral)': 'Retinal hemorrhage',
 'Bilateral retinal detachment': 'Retinal detachment',
 'Preretinal and vitreous hemorrhage': 'Vitreous hemorrhage',}
retinalMapper = OptionColumnMapper(concept_recognizer=hpo_cr, option_d=retinal_d)
retinalMapper.preview_column(dft['Retinal'])
column_mapper_d['Retinal'] = retinalMapper

In [22]:
other_findings_d = {'Feeding difficulties (PEG)': 'Feeding difficulties',
 'Pancreatitis': 'Pancreatitis',
 'Iris coloboma': 'Iris coloboma',
 'VSD / FPO': ['Ventricular septal defect',"Patent foramen ovale"],
 'Respiratory insufficiency': 'Respiratory insufficiency',
 'Tracheomalacia': 'Tracheomalacia',
 'Pectus excavatum': 'Pectus excavatum',
 'Gastrostomy': 'Feeding difficulties',
 'PFO': 'Patent foramen ovale',
 #'and hypertrophy of interventricular septum': 'PLACEHOLDER',
 'Nystagmus': 'Nystagmus',
 'Feeding difficulties': 'Feeding difficulties',
 'Severe hydrops fetalis': 'Hydrops fetalis',
 'Septate cystic hygroma': 'Cystic hygroma',
 'Cardiomegaly': 'Cardiomegaly',
 'Tricuspid regurgitation': 'Tricuspid regurgitation',
 'Pulmonary atresia': 'Pulmonary artery atresia',
 'Markedly hypoplastic lungs / atelectasis': 'Pulmonary hypoplasia',
 'Splenic cyst': 'Splenic cyst',
 #'Diffuse bullous skin lesions': 'PLACEHOLDER',
 #'Langerhans cell hyperplasia': 'PLACEHOLDER',
 'Hepatic sinusoidal dilatation / centrilobular congestion': 'Hepatic sinusoidal dilatation',
 }
other_findingsMapper = OptionColumnMapper(concept_recognizer=hpo_cr, option_d=other_findings_d)
other_findingsMapper.preview_column(dft['Other_findings'])
column_mapper_d['Other_findings'] = other_findingsMapper

In [23]:
dft.columns


Index(['ESAM variant (NM_138961.3)', 'NM_138961.3', 'Location',
       'ACMG classification', 'ROH\n(GRCh38/hg38)', 'Sequencing analysis',
       'Chromosomal microarray analysis', 'Further familial segregation data ',
       'Sex', 'Geographical origin', 'Consanguinity', 'Onset of symptoms',
       'Current age', 'Gestational age at delivery', 'Mode of delivery',
       'BirthWeight', 'BirthHeight', 'BirthOFC ', 'APGAR score', 'Age',
       'Weight', 'Height', 'OFC', 'Microcephaly', 'Dysmorphic features',
       'Global developmental delay/unspecified intellectual disability',
       'Delayed speech and language development', 'Hypotonia', 'Spasticity',
       'Epilepsy', 'Dilation of lateral ventricles', 'Thin corpus callosum',
       'Abnormal myelination', 'Hydrocephalus', 'Intracranial', 'Retinal',
       'Other_findings', 'individual_id'],
      dtype='object', name='Clinical features')

In [24]:
var_d = {}
esam_transcript='NM_138961.3' 
varValidator = VariantValidator(genome_build='hg38', transcript=esam_transcript)
for v in dft['NM_138961.3'].unique():
    var = varValidator.encode_hgvs(v)
    var.set_homozygous()
    var_d[v] = var

https://rest.variantvalidator.org/VariantValidator/variantvalidator/hg38/NM_138961.3%3Ac.115del/NM_138961.3?content-type=application%2Fjson
https://rest.variantvalidator.org/VariantValidator/variantvalidator/hg38/NM_138961.3%3Ac.287del/NM_138961.3?content-type=application%2Fjson
https://rest.variantvalidator.org/VariantValidator/variantvalidator/hg38/NM_138961.3%3Ac.35T>A/NM_138961.3?content-type=application%2Fjson
https://rest.variantvalidator.org/VariantValidator/variantvalidator/hg38/NM_138961.3%3Ac.451+1G>A/NM_138961.3?content-type=application%2Fjson
https://rest.variantvalidator.org/VariantValidator/variantvalidator/hg38/NM_138961.3%3Ac.605T>G/NM_138961.3?content-type=application%2Fjson


In [25]:
# TODO ageMapper = AgeColumnMapper(column_name="Current age", ageEncodingType="year")
sexMapper = SexColumnMapper(male_symbol="M", female_symbol="F", column_name="Sex")

In [26]:
varMapper = VariantColumnMapper(variant_d=var_d, variant_column_name='NM_138961.3', default_genotype="homozygous")

encoder = CohortEncoder(df=dft, 
                        hpo_cr=hpo_cr, 
                        column_mapper_d=column_mapper_d, 
                        individual_column_name="individual_id", 
                        agemapper=AgeColumnMapper.not_provided(), 
                        sexmapper=sexMapper,
                        variant_mapper=varMapper,
                        metadata=metadata)

NEDIHSS = Disease(disease_id='OMIM:620371', disease_label='Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity')
encoder.set_disease(NEDIHSS)


In [27]:
individuals = encoder.get_individuals()

Could not parse the following as sex descriptors: Unknown (n=1)


In [28]:
cvalidator = CohortValidator(cohort=individuals, ontology=hpo_ontology, min_hpo=1, allelic_requirement=AllelicRequirement.BI_ALLELIC)
qc = QcVisualizer(cohort_validator=cvalidator)
display(HTML(qc.to_html()))

ID,Level,Category,Message,HPO Term
PMID_36996813_Individual_2,WARNING,REDUNDANT,Decreased body weight is redundant because of Small for gestational age,Decreased body weight (HP:0004325)
PMID_36996813_Individual_1,WARNING,REDUNDANT,Hypertrichosis is redundant because of Synophrys,Hypertrichosis (HP:0000998)
PMID_36996813_Individual_11,WARNING,REDUNDANT,Intracranial hemorrhage is redundant because of Cerebral hemorrhage,Intracranial hemorrhage (HP:0002170)
PMID_36996813_Individual_12,WARNING,REDUNDANT,Intracranial hemorrhage is redundant because of Cerebral hemorrhage,Intracranial hemorrhage (HP:0002170)
PMID_36996813_Individual_4,WARNING,REDUNDANT,Thin corpus callosum is redundant because of Corpus callosum atrophy,Thin corpus callosum (HP:0033725)
PMID_36996813_Individual_12,INFORMATION,NOT_MEASURED,Microcephaly (HP:0000252) was listed as not measured and will be omitted,not measured: Microcephaly (HP:0000252)
PMID_36996813_Individual_13,INFORMATION,NOT_MEASURED,Microcephaly (HP:0000252) was listed as not measured and will be omitted,not measured: Microcephaly (HP:0000252)
PMID_36996813_Individual_KCHYD24-1,INFORMATION,NOT_MEASURED,Microcephaly (HP:0000252) was listed as not measured and will be omitted,not measured: Microcephaly (HP:0000252)


In [29]:
cohort = cvalidator.get_error_free_individual_list()
table = PhenopacketTable(individual_list=individuals, metadata=metadata)
display(HTML(table.to_html()))

Individual,Disease,Genotype,Phenotypic features
Individual 1 (FEMALE; ),"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity (OMIM:620371)",NM_138961.3:c.115del (homozygous),Microcephaly (HP:0000252); Delayed speech and language development (HP:0000750); Hypotonia (HP:0001252); Spastic tetraparesis (HP:0001285); Focal-onset seizure (HP:0007359); Dilated third ventricle (HP:0007082); Thin corpus callosum (HP:0033725); Abnormal CNS myelination (HP:0011400); Hydrocephalus (HP:0000238); Narrow forehead (HP:0000341); Highly arched eyebrow (HP:0002553); Long eyelashes (HP:0000527); Bulbous nose (HP:0000414); Everted lower lip vermilion (HP:0000232); Upslanted palpebral fissure (HP:0000582); Microretrognathia (HP:0000308); Synophrys (HP:0000664); Full cheeks (HP:0000293); Severe global developmental delay (HP:0011344); Inability to walk (HP:0002540); Intracranial hemorrhage (HP:0002170); Porencephalic cyst (HP:0002132); Arterial tortuosity (HP:0005116); Retinal hemorrhage (HP:0000573); Feeding difficulties (HP:0011968); Pancreatitis (HP:0001733)
Individual 2 (MALE; ),"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity (OMIM:620371)",NM_138961.3:c.115del (homozygous),Microcephaly (HP:0000252); Delayed speech and language development (HP:0000750); Hypotonia (HP:0001252); Spastic tetraparesis (HP:0001285); Hyperreflexia (HP:0001347); Seizure (HP:0001250); Dilated third ventricle (HP:0007082); Thin corpus callosum (HP:0033725); Hydrocephalus (HP:0000238); Small for gestational age (HP:0001518); Triangular face (HP:0000325); Smooth philtrum (HP:0000319); Mandibular prognathia (HP:0000303); Severe global developmental delay (HP:0011344); Intracranial hemorrhage (HP:0002170); Periventricular leukomalacia (HP:0006970); Retinal detachment (HP:0000541); Iris coloboma (HP:0000612)
Individual 3 (FEMALE; ),"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity (OMIM:620371)",NM_138961.3:c.115del (homozygous),Microcephaly (HP:0000252); Delayed speech and language development (HP:0000750); Hypotonia (HP:0001252); Seizure (HP:0001250); Dilated third ventricle (HP:0007082); Thin corpus callosum (HP:0033725); Hydrocephalus (HP:0000238); Decreased body weight (HP:0004325); Short stature (HP:0004322); Triangular face (HP:0000325); Smooth philtrum (HP:0000319); Mandibular prognathia (HP:0000303); Severe global developmental delay (HP:0011344); Intracranial hemorrhage (HP:0002170); Periventricular leukomalacia (HP:0006970); Arterial tortuosity (HP:0005116); Vitreous hemorrhage (HP:0007902)
Individual 4 (MALE; ),"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity (OMIM:620371)",NM_138961.3:c.287del (homozygous),Delayed speech and language development (HP:0000750); Hypotonia (HP:0001252); Focal-onset seizure (HP:0007359); Hypsarrhythmia (HP:0002521); Dilated third ventricle (HP:0007082); Corpus callosum atrophy (HP:0007371); Abnormal CNS myelination (HP:0011400); Colpocephaly (HP:0030048); Short stature (HP:0004322); Narrow forehead (HP:0000341); Highly arched eyebrow (HP:0002553); Long eyelashes (HP:0000527); Bulbous nose (HP:0000414); High palate (HP:0000218); Narrow palate (HP:0000189); Tented upper lip vermilion (HP:0010804); Hammertoe (HP:0001765); Telecanthus (HP:0000506); Wide nasal bridge (HP:0000431); Finger joint hypermobility (HP:0006094); Talipes equinovarus (HP:0001762); Amblyopia (HP:0000646); Severe global developmental delay (HP:0011344); Poor head control (HP:0002421); Delayed ability to sit (HP:0025336); Intracranial hemorrhage (HP:0002170); Cerebral calcification (HP:0002514); Respiratory insufficiency (HP:0002093); Tracheomalacia (HP:0002779); Pectus excavatum (HP:0000767); excluded: Microcephaly (HP:0000252)
Individual 5 (FEMALE; ),"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity (OMIM:620371)",NM_138961.3:c.287del (homozygous),Delayed speech and language development (HP:0000750); Hypotonia (HP:0001252); Focal-onset seizure (HP:0007359); Hypsarrhythmia (HP:0002521); Dilated third ventricle (HP:0007082); Thin corpus callosum (HP:0033725); Abnormal CNS myelination (HP:0011400); Hydrocephalus (HP:0000238); Narrow forehead (HP:0000341); Highly arched eyebrow (HP:0002553); Long eyelashes (HP:0000527); Bulbous nose (HP:0000414); High palate (HP:0000218); Narrow palate (HP:0000189); Tented upper lip vermilion (HP:0010804); Hammertoe (HP:0001765); Telecanthus (HP:0000506); Wide nasal bridge (HP:0000431); Finger joint hypermobility (HP:0006094); Talipes equinovarus (HP:0001762); Amblyopia (HP:0000646); Severe global developmental delay (HP:0011344); Poor head control (HP:0002421); Delayed ability to sit (HP:0025336); Intracranial hemorrhage (HP:0002170); Cerebral calcification (HP:0002514); Respiratory insufficiency (HP:0002093); Tracheomalacia (HP:0002779); Pectus excavatum (HP:0000767); excluded: Microcephaly (HP:0000252)
Individual 6 (MALE; ),"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity (OMIM:620371)",NM_138961.3:c.35T>A (homozygous),Delayed speech and language development (HP:0000750); Hypotonia (HP:0001252); Spastic tetraparesis (HP:0001285); Seizure (HP:0001250); Dilated third ventricle (HP:0007082); Thin corpus callosum (HP:0033725); Partial absence of the septum pellucidum (HP:0030283); Hydranencephaly (HP:0002324); Decreased body weight (HP:0004325); Severe global developmental delay (HP:0011344); Delayed ability to sit (HP:0025336); Inability to walk (HP:0002540); Intracranial hemorrhage (HP:0002170); Retinal hemorrhage (HP:0000573); excluded: Microcephaly (HP:0000252)
Individual 7 (MALE; ),"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity (OMIM:620371)",NM_138961.3:c.115del (homozygous),Delayed speech and language development (HP:0000750); Hypotonia (HP:0001252); Spastic tetraparesis (HP:0001285); Bilateral tonic-clonic seizure (HP:0002069); Dilated third ventricle (HP:0007082); Wide nasal bridge (HP:0000431); Smooth philtrum (HP:0000319); Upslanted palpebral fissure (HP:0000582); Broad forehead (HP:0000337); Narrow forehead (HP:0000341); Severe global developmental delay (HP:0011344); Delayed ability to sit (HP:0025336); Inability to walk (HP:0002540); Intracerebral periventricular calcifications (HP:0007229); Feeding difficulties (HP:0011968); excluded: Microcephaly (HP:0000252); excluded: Thin corpus callosum (HP:0033725)
Individual 8 (MALE; ),"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity (OMIM:620371)",NM_138961.3:c.115del (homozygous),Delayed speech and language development (HP:0000750); Hypotonia (HP:0001252); Dystonia (HP:0001332); Seizure (HP:0001250); Dilated third ventricle (HP:0007082); Thin corpus callosum (HP:0033725); Abnormal CNS myelination (HP:0011400); Decreased body weight (HP:0004325); Narrow forehead (HP:0000341); Highly arched eyebrow (HP:0002553); Long eyelashes (HP:0000527); Bulbous nose (HP:0000414); High palate (HP:0000218); Narrow palate (HP:0000189); Everted lower lip vermilion (HP:0000232); Hammertoe (HP:0001765); Upslanted palpebral fissure (HP:0000582); Microretrognathia (HP:0000308); Cryptorchidism (HP:0000028); Severe global developmental delay (HP:0011344); Poor head control (HP:0002421); Intracranial hemorrhage (HP:0002170); Cerebral calcification (HP:0002514); Patent foramen ovale (HP:0001655); Nystagmus (HP:0000639); excluded: Microcephaly (HP:0000252)
Individual 9 (MALE; ),"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity (OMIM:620371)",NM_138961.3:c.451+1G>A (homozygous),Microcephaly (HP:0000252); Delayed speech and language development (HP:0000750); Hypotonia (HP:0001252); Limb hypertonia (HP:0002509); Focal-onset seizure (HP:0007359); Dilated third ventricle (HP:0007082); Lateral ventricle dilatation (HP:0006956); Thin corpus callosum (HP:0033725); Abnormal CNS myelination (HP:0011400); Hydrocephalus (HP:0000238); Decreased body weight (HP:0004325); Short stature (HP:0004322); Narrow forehead (HP:0000341); Highly arched eyebrow (HP:0002553); Bulbous nose (HP:0000414); Posteriorly rotated ears (HP:0000358); Severe global developmental delay (HP:0011344); Poor head control (HP:0002421); Delayed ability to sit (HP:0025336); Intracranial hemorrhage (HP:0002170); Intracerebral periventricular calcifications (HP:0007229); Feeding difficulties (HP:0011968)
Individual 10 (MALE; ),"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity (OMIM:620371)",NM_138961.3:c.115del (homozygous),Dilated third ventricle (HP:0007082); Hydrocephalus (HP:0000238); Anteverted nares (HP:0000463); Microretrognathia (HP:0000308); Talipes equinovarus (HP:0001762); Intracranial hemorrhage (HP:0002170); Cerebral edema (HP:0002181); Periventricular leukomalacia (HP:0006970); Gliosis (HP:0002171); Multifocal cerebral white matter abnormalities (HP:0007052); Hydrops fetalis (HP:0001789); Cystic hygroma (HP:0000476); Cardiomegaly (HP:0001640); Tricuspid regurgitation (HP:0005180); Pulmonary artery atresia (HP:0004935); Pulmonary hypoplasia (HP:0002089); Atelectasis (HP:0100750); Splenic cyst (HP:0030423); Hepatic sinusoidal dilatation (HP:0035006); excluded: Microcephaly (HP:0000252); excluded: Thin corpus callosum (HP:0033725)


In [30]:
Individual.output_individuals_as_phenopackets(individual_list=individuals,
                                              metadata=metadata)

We output 14 GA4GH phenopackets to the directory phenopackets


# Output an HPO aggregate annotation file
First collect counts of onset

In [31]:
dft['Onset of symptoms'].value_counts()

Onset of symptoms
Neonatal             6
Antenatal            3
Antenatal (33 w)     1
Antenatal (26 wg)    1
Antenatal (33 wg)    1
Antenatal (21 w)     1
n.a.                 1
Name: count, dtype: int64

In [32]:
ppkt_list = [i.to_ga4gh_phenopacket(metadata=metadata) for i in individuals]
hpoa_creatr = HpoaTableBuilder(phenopacket_list=ppkt_list).neonatal_onset(6,13).antenatal_onset(3,13).third_trimester_onset(2,13).second_trimester_onset(2,13).build()

We found a total of 86 HPO terms
extracted PubMed identifier: PMID:36996813
Extracted disease: Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity (OMIM:620371)


In [33]:
df = hpoa_creatr.get_dataframe()
df

Unnamed: 0,#diseaseID,diseaseName,phenotypeID,phenotypeName,onsetID,onsetName,frequency,sex,negation,modifier,description,publication,evidence,biocuration
0,OMIM:620371,"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity",HP:0007082,Dilated third ventricle,,,13/13,,,,,PMID:36996813,PCS,ORCID:0000-0002-5648-2155
1,OMIM:620371,"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity",HP:0000476,Cystic hygroma,,,1/1,,,,,PMID:36996813,PCS,ORCID:0000-0002-5648-2155
2,OMIM:620371,"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity",HP:0000750,Delayed speech and language development,,,9/9,,,,,PMID:36996813,PCS,ORCID:0000-0002-5648-2155
3,OMIM:620371,"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity",HP:0001285,Spastic tetraparesis,,,4/4,,,,,PMID:36996813,PCS,ORCID:0000-0002-5648-2155
4,OMIM:620371,"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity",HP:0011344,Severe global developmental delay,,,9/9,,,,,PMID:36996813,PCS,ORCID:0000-0002-5648-2155
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
85,OMIM:620371,"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity",HP:0001332,Dystonia,,,1/1,,,,,PMID:36996813,PCS,ORCID:0000-0002-5648-2155
86,OMIM:620371,"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity",HP:0003623,Neonatal onset,,,6/13,,,,,PMID:36996813,PCS,ORCID:0000-0002-5648-2155
87,OMIM:620371,"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity",HP:0030674,Antenatal onset,,,3/13,,,,,PMID:36996813,PCS,ORCID:0000-0002-5648-2155
88,OMIM:620371,"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity",HP:0034197,Third trimester onset,,,2/13,,,,,PMID:36996813,PCS,ORCID:0000-0002-5648-2155


In [34]:
hpoa_creatr.write_data_frame()

Wrote HPOA disease file to OMIM-620371.tab
