# ESAM

Data extracted from [Lecca M, et al. (2023) Bi-allelic variants in the ESAM tight-junction gene cause a neurodevelopmental disorder associated with fetal intracranial hemorrhage. Am J Hum Genet ;110(4):681-690.  PMID:36996813](https://pubmed.ncbi.nlm.nih.gov/36996813/)

In [1]:
import pandas as pd
pd.set_option('display.max_colwidth', None) # show entire column contents, important!
from IPython.display import display, HTML
from pyphetools.creation import *
from pyphetools.visualization import *
from pyphetools.validation import *
import pyphetools
print(f"Using pyphetools version {pyphetools.__version__}")

Using pyphetools version 0.9.63


In [2]:
PMID = "PMID:36996813"
title = "Bi-allelic variants in the ESAM tight-junction gene cause a neurodevelopmental disorder associated with fetal intracranial hemorrhage"
cite = Citation(pmid=PMID, title=title)
parser = HpoParser("../hp.json")
hpo_cr = parser.get_hpo_concept_recognizer()
hpo_version = parser.get_version()
hpo_ontology = parser.get_ontology()
metadata = MetaData(created_by="ORCID:0000-0002-5648-2155", citation=cite)
metadata.default_versions_with_hpo(version=hpo_version)
print(f"HPO version {hpo_version}")

HPO version 2024-02-27


In [3]:
df = pd.read_excel("input/esam_lecca_2023.xlsx");
dft = df.transpose()
dft.columns = dft.iloc[0]
dft.drop(dft.index[0], inplace=True)
dft.index  # first check the index
dft['individual_id'] = dft.index  # Set the new column 'patient_id' to be identical to the contents of the index
#dft.head() # c

In [4]:
generator = SimpleColumnMapperGenerator(df=dft, hpo_cr=hpo_cr, observed="+", excluded="-")
column_mapper_list = generator.try_mapping_columns()
display(HTML(generator.to_html()))

Result,Columns
Mapped,Microcephaly; Delayed speech and language development; Hypotonia; Spasticity; Epilepsy; Dilation of lateral ventricles; Thin corpus callosum; Abnormal myelination; Hydrocephalus
Unmapped,ESAM variant (NM_138961.3); NM_138961.3; Location; ACMG classification; ROH (GRCh38/hg38); Sequencing analysis; Chromosomal microarray analysis; Further familial segregation data ; Sex; Geographical origin; Consanguinity; age_of_onset; Onset of symptoms; Current age; Gestational age at delivery; Mode of delivery; BirthWeight; BirthHeight; BirthOFC ; APGAR score; Age; Weight; Height; OFC; Dysmorphic features; Global developmental delay/unspecified intellectual disability; Intracranial; Retinal; Other_findings; individual_id


In [5]:
#res = OptionColumnMapper.autoformat(df=dft, concept_recognizer=hpo_cr, omit_columns=generator.get_mapped_columns())
#print(res)

In [6]:
birthweight_d = {
 '2150 g (<3rd percentile)': 'Small for gestational age',
}
birthweight_Mapper = OptionColumnMapper(column_name='BirthWeight', concept_recognizer=hpo_cr, option_d=birthweight_d)
column_mapper_list.append(birthweight_Mapper)
birthweight_Mapper.preview_column(dft)

Unnamed: 0,mapping,count
0,Small for gestational age (HP:0001518) (observed),1


In [7]:
weight_d = {
 '12 kg (<3rd percentile)': 'Decreased body weight',
 '7.6 kg (<3rd percentile)': 'Decreased body weight',
 '8.07 kg (<3rd percentile)': 'Decreased body weight',
 '17 kg (<3rd percentile)': 'Decreased body weight',
 '7.9 kg (<3rd percentile)': 'Decreased body weight',
}
weight_Mapper = OptionColumnMapper(column_name='Weight',concept_recognizer=hpo_cr, option_d=weight_d)
column_mapper_list.append(weight_Mapper)
weight_Mapper.preview_column(dft)

Unnamed: 0,mapping,count
0,Decreased body weight (HP:0004325) (observed),5


In [8]:
height_d = {
 '78 cm (<3rd percentile)': 'Short stature',
 '97 cm (<3rd percentile)': 'Short stature',
 '73 cm (<3rd percentile)': 'Short stature',
}
heightMapper = OptionColumnMapper(column_name='Height',concept_recognizer=hpo_cr, option_d=height_d)
column_mapper_list.append(heightMapper)
heightMapper.preview_column(dft)

Unnamed: 0,mapping,count
0,Short stature (HP:0004322) (observed),3


In [9]:
# Microcephaly HP:0000252
microcephaly_Mapper = SimpleColumnMapper(column_name='Microcephaly',
                                         hpo_id="HP:0000252", hpo_label="Microcephaly", observed="+", excluded="-")
column_mapper_list.append(microcephaly_Mapper)
microcephaly_Mapper.preview_column(dft)

Unnamed: 0,mapping,count
0,"original value: ""+ "" -> HP: Microcephaly (HP:0000252) (observed)",1
1,"original value: ""+"" -> HP: Microcephaly (HP:0000252) (observed)",3
2,"original value: ""-"" -> HP: Microcephaly (HP:0000252) (excluded)",7
3,"original value: ""nan"" -> HP: Microcephaly (HP:0000252) (not measured)",2
4,"original value: ""n.a."" -> HP: Microcephaly (HP:0000252) (not measured)",1


In [10]:
dysmorphic_features_d = {'Bitemporal narrowing': 'Narrow forehead',
 'Highly arched eyebrow': 'Highly arched eyebrow',
 'Long eyelashes': 'Long eyelashes',
 'Bulbous nasal tip': 'Bulbous nose',
 'Fleshy and everted lower lip vermilion': 'Everted lower lip vermilion',
 'Upslanted palpebral fissure': 'Upslanted palpebral fissure',
 'Microretrognathia': 'Microretrognathia',
 'Synophrys': 'Synophrys',
 'Full cheeks': 'Full cheeks',
 'Hypertrichosis': 'Hypertrichosis',
 'Triangular face': 'Triangular face',
 'Smooth philtrum': 'Smooth philtrum',
 'Prominent chin': 'Mandibular prognathia',
 'High palate': 'High palate',
 'narrow palate': 'Narrow palate',
 'Tented upper lip vermilion': 'Tented upper lip vermilion',
 'Hammertoe': 'Hammertoe',
 'Telecanthus': 'Telecanthus',
 'Wide nasal bridge': 'Wide nasal bridge',
 'Finger joint hypermobility': 'Finger joint hypermobility',
 'Talipes equinovarus': 'Talipes equinovarus',
 'Amblyopia': 'Amblyopia',
 'Flat philtrum': 'Smooth philtrum',
 'Upslanted palpebral fissures': 'Upslanted palpebral fissure',
 'Broad forehead': 'Broad forehead',
 'Undescended testicle': 'Cryptorchidism',
 'Highly arched eyebrows': 'Highly arched eyebrow',
 'Low posteriorly rotated ears': 'Posteriorly rotated ears',
 'Anteverted nares': 'Anteverted nares',
}
dysmorphic_featuresMapper = OptionColumnMapper(column_name='Dysmorphic features',concept_recognizer=hpo_cr, option_d=dysmorphic_features_d)
column_mapper_list.append(dysmorphic_featuresMapper)
dysmorphic_featuresMapper.preview_column(dft)

Unnamed: 0,mapping,count
0,Narrow forehead (HP:0000341) (observed),6
1,Highly arched eyebrow (HP:0002553) (observed),5
2,Long eyelashes (HP:0000527) (observed),4
3,Bulbous nose (HP:0000414) (observed),5
4,Everted lower lip vermilion (HP:0000232) (observed),2
5,Upslanted palpebral fissure (HP:0000582) (observed),3
6,Microretrognathia (HP:0000308) (observed),3
7,Synophrys (HP:0000664) (observed),1
8,Full cheeks (HP:0000293) (observed),1
9,Hypertrichosis (HP:0000998) (observed),1


In [11]:
gdd_d = {'+ (severe)': 'Severe global developmental delay',
 'No walking': 'Inability to walk',
 'Poor head control': 'Poor head control',
 'No sitting': 'Delayed ability to sit',
 '[@[Individual 7]]No walking': 'Inability to walk',
 '(does not sit nor roll over)': 'Delayed ability to sit',
}
gddMapper = OptionColumnMapper(column_name='Global developmental delay/unspecified intellectual disability',
                               concept_recognizer=hpo_cr, option_d=gdd_d)
column_mapper_list.append(gddMapper)
gddMapper.preview_column(dft)

Unnamed: 0,mapping,count
0,Severe global developmental delay (HP:0011344) (observed),9
1,Inability to walk (HP:0002540) (observed),3
2,Poor head control (HP:0002421) (observed),4
3,Delayed ability to sit (HP:0025336) (observed),5


In [12]:
speech_d = {'+ (severe)': 'Delayed speech and language development',
              '+': 'Delayed speech and language development',
}
speechMapper = OptionColumnMapper(column_name='Delayed speech and language development',
                                                                   concept_recognizer=hpo_cr, option_d=speech_d)
column_mapper_list.append(speechMapper)
speechMapper.preview_column(dft)

Unnamed: 0,mapping,count
0,Delayed speech and language development (HP:0000750) (observed),9


In [13]:
hypotonia__d = {'+ (neonatal)': 'Hypotonia',
 'neonatal': 'Hypotonia',
 '+': 'Hypotonia',
 }
hypotonia_Mapper = OptionColumnMapper(column_name='Hypotonia',concept_recognizer=hpo_cr, option_d=hypotonia__d)
column_mapper_list.append(hypotonia_Mapper)
hypotonia_Mapper.preview_column(dft)

Unnamed: 0,mapping,count
0,Hypotonia (HP:0001252) (observed),9


In [14]:
spasticity__d = {'+ (spastic tetraparesis)': 'Spastic tetraparesis',
 '+ (spastic tetraparesis': 'Spastic tetraparesis',
 'hyperreflexia)': 'Hyperreflexia',
 '+  (spastic tetraparesis)': 'Spastic tetraparesis',
 '+ (dystonia)': 'Dystonia',
 '+ (limb hypertonia)': 'Limb hypertonia',
}
spasticity_Mapper = OptionColumnMapper(column_name='Spasticity',concept_recognizer=hpo_cr, option_d=spasticity__d)
column_mapper_list.append(spasticity_Mapper)
spasticity_Mapper.preview_column(dft)

Unnamed: 0,mapping,count
0,Spastic tetraparesis (HP:0001285) (observed),4
1,Hyperreflexia (HP:0001347) (observed),1
2,Dystonia (HP:0001332) (observed),1
3,Limb hypertonia (HP:0002509) (observed),1


In [15]:
epilepsy_d = {'+ (focal)': 'Focal-onset seizure',
 '+': 'Seizure',
 '+ (focal': 'Focal-onset seizure',
 'myoclonic) \nHypsarrhythmia': 'Hypsarrhythmia',
 'myoclonic) Hypsarrhythmia': 'Hypsarrhythmia',
 '+ (generalized tonic-clonic seizures)': 'Bilateral tonic-clonic seizure',
}
epilepsyMapper = OptionColumnMapper(column_name='Epilepsy',concept_recognizer=hpo_cr, option_d=epilepsy_d)
column_mapper_list.append(epilepsyMapper)
epilepsyMapper.preview_column(dft)

Unnamed: 0,mapping,count
0,Focal-onset seizure (HP:0007359) (observed),4
1,Seizure (HP:0001250) (observed),4
2,Hypsarrhythmia (HP:0002521) (observed),2
3,Bilateral tonic-clonic seizure (HP:0002069) (observed),1


In [16]:
lateral_ventricles_d = {'+': 'Dilated third ventricle',
 '+ (lateral and 3rd ventricles)': ["Dilated third ventricle", "Lateral ventricle dilatation"],
}
lateral_ventricles_Mapper = OptionColumnMapper(column_name='Dilation of lateral ventricles',
                                                           concept_recognizer=hpo_cr, option_d=lateral_ventricles_d)
column_mapper_list.append(lateral_ventricles_Mapper)
lateral_ventricles_Mapper.preview_column(dft)

Unnamed: 0,mapping,count
0,Dilated third ventricle (HP:0007082) (observed),13
1,Lateral ventricle dilatation (HP:0006956) (observed),1


In [17]:
thinCC_d = {'+ (atrophy)': ["Corpus callosum atrophy", 'Thin corpus callosum'],
 '+ (partial absence of the septum pellucidum)': ['Thin corpus callosum','Partial absence of the septum pellucidum'],
 '+': 'Thin corpus callosum',
}
excluded = {'-': 'Thin corpus callosum'}
thincc_Mapper = OptionColumnMapper(column_name='Thin corpus callosum',
                                                concept_recognizer=hpo_cr, option_d=thinCC_d, excluded_d=excluded)
column_mapper_list.append(thincc_Mapper)
thincc_Mapper.preview_column(dft)

Unnamed: 0,mapping,count
0,Thin corpus callosum (HP:0033725) (observed),10
1,Corpus callosum atrophy (HP:0007371) (observed),1
2,Partial absence of the septum pellucidum (HP:0030283) (observed),1
3,Thin corpus callosum (HP:0033725) (excluded),3


In [18]:
myelination_d = {'+ (FWML)': 'Abnormal CNS myelination',
 '+ (FWML - frontoparietal)': 'Abnormal CNS myelination',
 '+ (FWML - periventricular)': 'Abnormal CNS myelination',
 '+ (dysgiria/polymicrogyria': 'Polymicrogyria',
 'white matter volume loss)': 'Reduced cerebral white matter volume',
}
abnormal_myelinationMapper = OptionColumnMapper(column_name='Abnormal myelination',
                                                concept_recognizer=hpo_cr, option_d=myelination_d)
column_mapper_list.append(abnormal_myelinationMapper)
abnormal_myelinationMapper.preview_column(dft)

Unnamed: 0,mapping,count
0,Abnormal CNS myelination (HP:0011400) (observed),6
1,Polymicrogyria (HP:0002126) (observed),1
2,Reduced cerebral white matter volume (HP:0034295) (observed),1


In [19]:
hydrocephalus_d = {'+ (prenatal)': 'Hydrocephalus',
 '+ (colpocephaly)': 'Colpocephaly',
 '+ (hydranencephaly)': 'Hydranencephaly',
 '+': 'Hydrocephalus',
 '+ (congenital)': 'Hydrocephalus'}
hydrocephalusMapper = OptionColumnMapper(column_name='Hydrocephalus',concept_recognizer=hpo_cr, option_d=hydrocephalus_d)
column_mapper_list.append(hydrocephalusMapper)
hydrocephalusMapper.preview_column(dft)

Unnamed: 0,mapping,count
0,Hydrocephalus (HP:0000238) (observed),10
1,Colpocephaly (HP:0030048) (observed),1
2,Hydranencephaly (HP:0002324) (observed),1


In [20]:
intracranial_d = {'Intracranial hemorrhage (prenatal)': 'Intracranial hemorrhage',
 'Porencephaly': 'Porencephalic cyst',
 'Intracranial hemorrhage': 'Intracranial hemorrhage',
 'Periventricular leukomalacia': 'Periventricular leukomalacia',
 'Cerebral calcification': 'Cerebral calcification',
 'Subependymal periventricular and lenticular nucleus calcifications': 'Intracerebral periventricular calcifications',
 'Bilateral periventricular calcifications': 'Intracerebral periventricular calcifications',
 'Severe cerebral edema': 'Cerebral edema',
 'Diffuse cerebral gliosis': 'Gliosis',
 'Multifocal cerebral white matter abnormalities': 'Multifocal cerebral white matter abnormalities',
 #'Karyorrhexis in the pontine nuclei and hippocampus (dentate gyrus)': 'PLACEHOLDER',
 'Intraparenchymal and periventricular hemorrhages': 'Cerebral hemorrhage',
 'Cerebral calcifications': 'Cerebral calcification',
 'Porencephaly and cerebral cysts': 'Porencephalic cyst',
 'Hemorrahgic ischemic lesions of white matter': 'Cerebral hemorrhage',
 'Cerebral gliosis': 'Gliosis',
 'Calcifications of basal ganglia and thalami': 'Basal ganglia calcification',
 'Periventricular cysts': 'Periventricular cysts',
}
intracranialMapper = OptionColumnMapper(column_name='Intracranial',concept_recognizer=hpo_cr, option_d=intracranial_d)
column_mapper_list.append(intracranialMapper)
intracranialMapper.preview_column(dft)

Unnamed: 0,mapping,count
0,Intracranial hemorrhage (HP:0002170) (observed),12
1,Porencephalic cyst (HP:0002132) (observed),2
2,Periventricular leukomalacia (HP:0006970) (observed),3
3,Cerebral calcification (HP:0002514) (observed),5
4,Intracerebral periventricular calcifications (HP:0007229) (observed),2
5,Cerebral edema (HP:0002181) (observed),1
6,Gliosis (HP:0002171) (observed),2
7,Multifocal cerebral white matter abnormalities (HP:0007052) (observed),1
8,Cerebral hemorrhage (HP:0001342) (observed),2
9,Basal ganglia calcification (HP:0002135) (observed),1


In [21]:
retinal_d = {
 'Arterial tortuosity': 'Retinal arterial tortuosity',
 'Retinal hemorrhage (bilateral)': 'Retinal hemorrhage',
 'Bilateral retinal detachment': 'Retinal detachment',
 'Preretinal and vitreous hemorrhage': 'Vitreous hemorrhage',}
retinalMapper = OptionColumnMapper(column_name='Retinal',concept_recognizer=hpo_cr, option_d=retinal_d)
column_mapper_list.append(retinalMapper)
retinalMapper.preview_column(dft)

Unnamed: 0,mapping,count
0,Retinal arterial tortuosity (HP:0000631) (observed),2
1,Retinal hemorrhage (HP:0000573) (observed),2
2,Retinal detachment (HP:0000541) (observed),1
3,Vitreous hemorrhage (HP:0007902) (observed),1


In [22]:
other_d = {'Feeding difficulties (PEG)': 'Feeding difficulties',
 'Pancreatitis': 'Pancreatitis',
 'Iris coloboma': 'Iris coloboma',
 'VSD / FPO': ['Ventricular septal defect',"Patent foramen ovale"],
 'Respiratory insufficiency': 'Respiratory insufficiency',
 'Tracheomalacia': 'Tracheomalacia',
 'Pectus excavatum': 'Pectus excavatum',
 'Gastrostomy': 'Feeding difficulties',
 'PFO': 'Patent foramen ovale',
 #'and hypertrophy of interventricular septum': 'PLACEHOLDER',
 'Nystagmus': 'Nystagmus',
 'Feeding difficulties': 'Feeding difficulties',
 'Severe hydrops fetalis': 'Hydrops fetalis',
 'Septate cystic hygroma': 'Cystic hygroma',
 'Cardiomegaly': 'Cardiomegaly',
 'Tricuspid regurgitation': 'Tricuspid regurgitation',
 'Pulmonary atresia': 'Pulmonary artery atresia',
 'Markedly hypoplastic lungs / atelectasis': 'Pulmonary hypoplasia',
 'Splenic cyst': 'Splenic cyst',
 #'Diffuse bullous skin lesions': 'PLACEHOLDER',
 #'Langerhans cell hyperplasia': 'PLACEHOLDER',
 'Hepatic sinusoidal dilatation / centrilobular congestion': 'Hepatic sinusoidal dilatation',
 }
other_findingsMapper = OptionColumnMapper(column_name='Other_findings',concept_recognizer=hpo_cr, option_d=other_d)
column_mapper_list.append(other_findingsMapper)
other_findingsMapper.preview_column(dft)

Unnamed: 0,mapping,count
0,Feeding difficulties (HP:0011968) (observed),3
1,Pancreatitis (HP:0001733) (observed),1
2,Iris coloboma (HP:0000612) (observed),1
3,Respiratory insufficiency (HP:0002093) (observed),2
4,Tracheomalacia (HP:0002779) (observed),2
5,Pectus excavatum (HP:0000767) (observed),2
6,Patent foramen ovale (HP:0001655) (observed),1
7,Nystagmus (HP:0000639) (observed),1
8,Hydrops fetalis (HP:0001789) (observed),1
9,Cystic hygroma (HP:0000476) (observed),1


In [23]:
esam_transcript='NM_138961.3' 
vman = VariantManager(df=dft, 
                      individual_column_name="individual_id", 
                      gene_symbol="ESAM", 
                      transcript=esam_transcript,
                      allele_1_column_name='NM_138961.3')

var_d = vman.get_variant_d()

In [24]:
sexMapper = SexColumnMapper(male_symbol="M", female_symbol="F", column_name="Sex")

In [25]:
iso8601_d = {'10 y':'P10Y',
            '4y 9m': 'P4Y9M', 
            '2y 3m':'P2Y3M', 
             'Deceased (5y 6m)':'P5Y6M', 
             '2y 11m':'P2Y11M',
       'Deceased (13 m)':'P1Y1M', 
             '13 y':'P13Y',
             '7 y':'P7Y',
             '19 m':'P1Y7M',
             }
ageMapper = AgeColumnMapper.custom_dictionary(column_name="Current age", string_to_iso_d=iso8601_d)
#ageMapper.preview_column(dft)
onsetMapper = AgeColumnMapper.hpo_onset("age_of_onset")
onsetMapper.preview_column(dft)

Unnamed: 0,original column contents,age
0,Neonatal onset,Neonatal onset
1,Antenatal onset,Antenatal onset
2,NOT_PROVIDED,


In [33]:
varMapper = VariantColumnMapper(variant_d=var_d, variant_column_name='NM_138961.3', default_genotype="homozygous")

encoder = CohortEncoder(df=dft, 
                        hpo_cr=hpo_cr, 
                        column_mapper_list=column_mapper_list, 
                        individual_column_name="individual_id", 
                        age_at_last_encounter_mapper=ageMapper, 
                        age_of_onset_mapper=onsetMapper,
                        sexmapper=sexMapper,
                        variant_mapper=varMapper,
                        metadata=metadata)

NEDIHSS = Disease(disease_id='OMIM:620371', disease_label='Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity')
encoder.set_disease(NEDIHSS)

In [34]:
individuals = encoder.get_individuals()

Could not parse the following as ISO8601 ages: nan (n=2)
Could not parse the following as sex descriptors: Unknown (n=2)


In [35]:
cvalidator = CohortValidator(cohort=individuals, ontology=hpo_ontology, min_hpo=1, allelic_requirement=AllelicRequirement.BI_ALLELIC)
qc = QcVisualizer(cohort_validator=cvalidator)
display(HTML(qc.to_summary_html()))

Level,Error category,Count
WARNING,REDUNDANT,5
INFORMATION,NOT_MEASURED,61


In [36]:
cohort = cvalidator.get_error_free_individual_list()
table = PhenopacketTable(individual_list=individuals, metadata=metadata)
display(HTML(table.to_html()))

Individual,Disease,Genotype,Phenotypic features
Individual 1 (FEMALE; P10Y),"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity (OMIM:620371)",NM_138961.3:c.115del (homozygous),Severe global developmental delay (HP:0011344); Retinal hemorrhage (HP:0000573); Intracranial hemorrhage (HP:0002170); Delayed speech and language development (HP:0000750); Bulbous nose (HP:0000414); Hypotonia (HP:0001252); Hydrocephalus (HP:0000238); Everted lower lip vermilion (HP:0000232); Feeding difficulties (HP:0011968); Focal-onset seizure (HP:0007359); Porencephalic cyst (HP:0002132); Full cheeks (HP:0000293); Retinal arterial tortuosity (HP:0000631); Narrow forehead (HP:0000341); Thin corpus callosum (HP:0033725); Highly arched eyebrow (HP:0002553); Pancreatitis (HP:0001733); Microcephaly (HP:0000252); Spastic tetraparesis (HP:0001285); Synophrys (HP:0000664); Dilated third ventricle (HP:0007082); Inability to walk (HP:0002540); Microretrognathia (HP:0000308); Long eyelashes (HP:0000527); Lateral ventricle dilatation (HP:0006956); Upslanted palpebral fissure (HP:0000582); Abnormal CNS myelination (HP:0011400)
Individual 2 (MALE; P4Y9M),"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity (OMIM:620371)",NM_138961.3:c.115del (homozygous),Severe global developmental delay (HP:0011344); Intracranial hemorrhage (HP:0002170); Small for gestational age (HP:0001518); Seizure (HP:0001250); Delayed speech and language development (HP:0000750); Hypotonia (HP:0001252); Hydrocephalus (HP:0000238); Mandibular prognathia (HP:0000303); Iris coloboma (HP:0000612); Periventricular leukomalacia (HP:0006970); Thin corpus callosum (HP:0033725); Retinal detachment (HP:0000541); Microcephaly (HP:0000252); Spastic tetraparesis (HP:0001285); Dilated third ventricle (HP:0007082); Hyperreflexia (HP:0001347); Triangular face (HP:0000325); Smooth philtrum (HP:0000319); Lateral ventricle dilatation (HP:0006956); excluded: Abnormal myelination (HP:0012447)
Individual 3 (FEMALE; P2Y3M),"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity (OMIM:620371)",NM_138961.3:c.115del (homozygous),Severe global developmental delay (HP:0011344); Intracranial hemorrhage (HP:0002170); Seizure (HP:0001250); Short stature (HP:0004322); Delayed speech and language development (HP:0000750); Hypotonia (HP:0001252); Hydrocephalus (HP:0000238); Decreased body weight (HP:0004325); Mandibular prognathia (HP:0000303); Retinal arterial tortuosity (HP:0000631); Periventricular leukomalacia (HP:0006970); Thin corpus callosum (HP:0033725); Microcephaly (HP:0000252); Dilated third ventricle (HP:0007082); Spasticity (HP:0001257); Vitreous hemorrhage (HP:0007902); Triangular face (HP:0000325); Smooth philtrum (HP:0000319); Lateral ventricle dilatation (HP:0006956); excluded: Abnormal myelination (HP:0012447)
Individual 4 (MALE; P5Y6M),"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity (OMIM:620371)",NM_138961.3:c.287del (homozygous),Severe global developmental delay (HP:0011344); Delayed ability to sit (HP:0025336); Intracranial hemorrhage (HP:0002170); Finger joint hypermobility (HP:0006094); Poor head control (HP:0002421); Short stature (HP:0004322); Telecanthus (HP:0000506); Delayed speech and language development (HP:0000750); Bulbous nose (HP:0000414); Hypotonia (HP:0001252); Hammertoe (HP:0001765); Narrow palate (HP:0000189); Corpus callosum atrophy (HP:0007371); Focal-onset seizure (HP:0007359); Tented upper lip vermilion (HP:0010804); High palate (HP:0000218); Wide nasal bridge (HP:0000431); Narrow forehead (HP:0000341); Hypsarrhythmia (HP:0002521); Highly arched eyebrow (HP:0002553); Amblyopia (HP:0000646); Pectus excavatum (HP:0000767); Cerebral calcification (HP:0002514); Tracheomalacia (HP:0002779); Talipes equinovarus (HP:0001762); Dilated third ventricle (HP:0007082); Respiratory insufficiency (HP:0002093); Spasticity (HP:0001257); Colpocephaly (HP:0030048); Long eyelashes (HP:0000527); Lateral ventricle dilatation (HP:0006956); Abnormal CNS myelination (HP:0011400); excluded: Microcephaly (HP:0000252)
Individual 5 (FEMALE; P2Y11M),"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity (OMIM:620371)",NM_138961.3:c.287del (homozygous),Severe global developmental delay (HP:0011344); Delayed ability to sit (HP:0025336); Intracranial hemorrhage (HP:0002170); Finger joint hypermobility (HP:0006094); Poor head control (HP:0002421); Telecanthus (HP:0000506); Delayed speech and language development (HP:0000750); Bulbous nose (HP:0000414); Hypotonia (HP:0001252); Hydrocephalus (HP:0000238); Hammertoe (HP:0001765); Narrow palate (HP:0000189); Focal-onset seizure (HP:0007359); Tented upper lip vermilion (HP:0010804); High palate (HP:0000218); Wide nasal bridge (HP:0000431); Narrow forehead (HP:0000341); Thin corpus callosum (HP:0033725); Hypsarrhythmia (HP:0002521); Highly arched eyebrow (HP:0002553); Amblyopia (HP:0000646); Pectus excavatum (HP:0000767); Cerebral calcification (HP:0002514); Tracheomalacia (HP:0002779); Talipes equinovarus (HP:0001762); Dilated third ventricle (HP:0007082); Respiratory insufficiency (HP:0002093); Spasticity (HP:0001257); Long eyelashes (HP:0000527); Lateral ventricle dilatation (HP:0006956); Abnormal CNS myelination (HP:0011400); excluded: Microcephaly (HP:0000252)
Individual 6 (MALE; P1Y1M),"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity (OMIM:620371)",NM_138961.3:c.35T>A (homozygous),Hypotonia (HP:0001252); Severe global developmental delay (HP:0011344); Delayed ability to sit (HP:0025336); Dilated third ventricle (HP:0007082); Partial absence of the septum pellucidum (HP:0030283); Inability to walk (HP:0002540); Retinal hemorrhage (HP:0000573); Intracranial hemorrhage (HP:0002170); Hydranencephaly (HP:0002324); Thin corpus callosum (HP:0033725); Seizure (HP:0001250); Decreased body weight (HP:0004325); Lateral ventricle dilatation (HP:0006956); Spastic tetraparesis (HP:0001285); Delayed speech and language development (HP:0000750); excluded: Abnormal myelination (HP:0012447); excluded: Microcephaly (HP:0000252)
Individual 7 (MALE; P13Y),"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity (OMIM:620371)",NM_138961.3:c.115del (homozygous),Hypotonia (HP:0001252); Severe global developmental delay (HP:0011344); Delayed ability to sit (HP:0025336); Spastic tetraparesis (HP:0001285); Dilated third ventricle (HP:0007082); Broad forehead (HP:0000337); Inability to walk (HP:0002540); Wide nasal bridge (HP:0000431); Narrow forehead (HP:0000341); Intracerebral periventricular calcifications (HP:0007229); Smooth philtrum (HP:0000319); Lateral ventricle dilatation (HP:0006956); Feeding difficulties (HP:0011968); Upslanted palpebral fissure (HP:0000582); Delayed speech and language development (HP:0000750); Bilateral tonic-clonic seizure (HP:0002069); excluded: Hydrocephalus (HP:0000238); excluded: Abnormal myelination (HP:0012447); excluded: Thin corpus callosum (HP:0033725); excluded: Microcephaly (HP:0000252)
Individual 8 (MALE; P7Y),"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity (OMIM:620371)",NM_138961.3:c.115del (homozygous),Severe global developmental delay (HP:0011344); Intracranial hemorrhage (HP:0002170); Poor head control (HP:0002421); Seizure (HP:0001250); Dystonia (HP:0001332); Delayed speech and language development (HP:0000750); Patent foramen ovale (HP:0001655); Bulbous nose (HP:0000414); Hypotonia (HP:0001252); Everted lower lip vermilion (HP:0000232); Decreased body weight (HP:0004325); Hammertoe (HP:0001765); Narrow palate (HP:0000189); High palate (HP:0000218); Nystagmus (HP:0000639); Narrow forehead (HP:0000341); Thin corpus callosum (HP:0033725); Highly arched eyebrow (HP:0002553); Cryptorchidism (HP:0000028); Cerebral calcification (HP:0002514); Dilated third ventricle (HP:0007082); Microretrognathia (HP:0000308); Long eyelashes (HP:0000527); Lateral ventricle dilatation (HP:0006956); Upslanted palpebral fissure (HP:0000582); Abnormal CNS myelination (HP:0011400); excluded: Hydrocephalus (HP:0000238); excluded: Microcephaly (HP:0000252)
Individual 9 (MALE; P1Y7M),"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity (OMIM:620371)",NM_138961.3:c.451+1G>A (homozygous),Severe global developmental delay (HP:0011344); Delayed ability to sit (HP:0025336); Intracranial hemorrhage (HP:0002170); Poor head control (HP:0002421); Short stature (HP:0004322); Delayed speech and language development (HP:0000750); Bulbous nose (HP:0000414); Hypotonia (HP:0001252); Hydrocephalus (HP:0000238); Intracerebral periventricular calcifications (HP:0007229); Decreased body weight (HP:0004325); Feeding difficulties (HP:0011968); Posteriorly rotated ears (HP:0000358); Focal-onset seizure (HP:0007359); Narrow forehead (HP:0000341); Thin corpus callosum (HP:0033725); Highly arched eyebrow (HP:0002553); Limb hypertonia (HP:0002509); Microcephaly (HP:0000252); Dilated third ventricle (HP:0007082); Lateral ventricle dilatation (HP:0006956); Abnormal CNS myelination (HP:0011400)
Individual 10 (MALE; n/a),"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity (OMIM:620371)",NM_138961.3:c.115del (homozygous),Lateral ventricle dilatation (HP:0006956); Intracranial hemorrhage (HP:0002170); Splenic cyst (HP:0030423); Cardiomegaly (HP:0001640); Cerebral edema (HP:0002181); Hydrocephalus (HP:0000238); Hydrops fetalis (HP:0001789); Pulmonary hypoplasia (HP:0002089); Hepatic sinusoidal dilatation (HP:0035006); Periventricular leukomalacia (HP:0006970); Cystic hygroma (HP:0000476); Talipes equinovarus (HP:0001762); Dilated third ventricle (HP:0007082); Anteverted nares (HP:0000463); Multifocal cerebral white matter abnormalities (HP:0007052); Atelectasis (HP:0100750); Microretrognathia (HP:0000308); Gliosis (HP:0002171); Tricuspid regurgitation (HP:0005180); Pulmonary artery atresia (HP:0004935); excluded: Abnormal myelination (HP:0012447); excluded: Thin corpus callosum (HP:0033725); excluded: Microcephaly (HP:0000252)


In [37]:
Individual.output_individuals_as_phenopackets(individual_list=individuals,
                                              metadata=metadata)

We output 14 GA4GH phenopackets to the directory phenopackets


# Output an HPO aggregate annotation file
First collect counts of onset

In [38]:
PMID = metadata.get_pmid()
created_by = metadata.get_created_by()
ppkt_list = [i.to_ga4gh_phenopacket(metadata=metadata) for i in individuals]
builder = HpoaTableBuilder(phenopacket_list=ppkt_list)
#builder.neonatal_onset(PMID,6,13).antenatal_onset(PMID,3,13).third_trimester_onset(PMID,2,13).second_trimester_onset(PMID,2,13)
builder.autosomal_recessive(PMID)
hpoa_creator = builder.build()

We found a total of 88 unique HPO terms
Extracted disease: Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity (OMIM:620371)


In [39]:
df = hpoa_creator.get_dataframe()
df

Unnamed: 0,#diseaseID,diseaseName,phenotypeID,phenotypeName,onsetID,onsetName,frequency,sex,negation,modifier,description,publication,evidence,biocuration
0,OMIM:620371,"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity",HP:0011344,Severe global developmental delay,,,9/9,,,,,PMID:36996813,PCS,ORCID:0000-0002-5648-2155
1,OMIM:620371,"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity",HP:0000573,Retinal hemorrhage,,,2/2,,,,,PMID:36996813,PCS,ORCID:0000-0002-5648-2155
2,OMIM:620371,"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity",HP:0002170,Intracranial hemorrhage,,,10/10,,,,,PMID:36996813,PCS,ORCID:0000-0002-5648-2155
3,OMIM:620371,"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity",HP:0000750,Delayed speech and language development,,,9/9,,,,,PMID:36996813,PCS,ORCID:0000-0002-5648-2155
4,OMIM:620371,"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity",HP:0000414,Bulbous nose,,,5/5,,,,,PMID:36996813,PCS,ORCID:0000-0002-5648-2155
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
86,OMIM:620371,"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity",HP:0034295,Reduced cerebral white matter volume,,,1/1,,,,,PMID:36996813,PCS,ORCID:0000-0002-5648-2155
87,OMIM:620371,"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity",HP:0007109,Periventricular cysts,,,1/1,,,,,PMID:36996813,PCS,ORCID:0000-0002-5648-2155
88,OMIM:620371,"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity",HP:0003623,Neonatal onset,,,6/13,,,,,PMID:36996813,PCS,ORCID:0000-0002-5648-2155
89,OMIM:620371,"Neurodevelopmental disorder with intracranial hemorrhage, seizures, and spasticity",HP:0030674,Antenatal onset,,,7/13,,,,,PMID:36996813,PCS,ORCID:0000-0002-5648-2155


In [40]:
hpoa_creator.write_data_frame()

Wrote HPOA disease file to OMIM-620371.tab
