# TBX5 Cohort

Pathogenic variants in TBX5 are observed in [Holt-Oram syndrome](https://omim.org/entry/142900).

In [1]:
from collections import defaultdict

import pandas as pd
from IPython.display import display, HTML

from pyphetools.creation import *
from pyphetools.visualization import *
from pyphetools.validation import *
import pyphetools
from pyphetools.creation import CaseTemplateEncoder

pd.set_option('display.max_colwidth', None)
# Record the pyphetools version used for this run alongside the outputs.
print(f"Using pyphetools version {pyphetools.__version__}")

Using pyphetools version 0.9.42


In [2]:
# Curator identifier passed to the encoder and the HPOA builder further down.
created_by = "ORCID:0000-0002-0736-9199"

# Parse the local HPO JSON release and keep the three pieces the later cells
# use: the concept recognizer, the release version, and the ontology object.
parser = HpoParser(hpo_json_file="../hp.json")
hpo_cr = parser.get_hpo_concept_recognizer()
hpo_version = parser.get_version()
hpo_ontology = parser.get_ontology()

print(f"HPO version {hpo_version}")

HPO version 2024-01-16


In [3]:
# Load the curated TBX5 cohort spreadsheet and preview its first two rows.
df = pd.read_excel("input/tbx5_individuals.xlsx")
df.head(n=2)

Unnamed: 0,PMID,title,individual_id,Comment,disease_id,disease_label,transcript,allele_1,variant.comment,age_of_onset,...,Absent thumb,Short thumb,Triphalangeal thumb,Absent radius,Hypoplasia of the radius,Hypoplasia of the ulna,Short humerus,Left ventricular noncompaction cardiomyopathy,Upper limb phocomelia,Miscellaneous
0,str,str,str,optional str,str,str,str,HGVS str,optional str,iso8601,...,HP:0009777,HP:0009778,HP:0001199,HP:0003974,HP:0002984,HP:0003022,HP:0005792,HP:0011664,HP:0009813,Miscellaneous HPO terms
1,PMID:28434921,Identification of a novel and functional mutation in the TBX5 gene in a patient by screening from 354 patients with isolated ventricular septal defect,a 6-month-old female,,OMIM:142900,Holt-Oram syndrome,NM_181486.4,c.40C>A,NM_181486.4:c.40C>A,P0D,...,excluded,excluded,excluded,excluded,,,,,excluded,


In [4]:
# Build the template encoder from the cohort table, the HPO concept recognizer
# and the curator id. Later cells call it to obtain the individuals and to
# export them as phenopackets.
# (CaseTemplateEncoder is imported in the notebook's import cell.)
encoder = CaseTemplateEncoder(
    df=df,
    hpo_cr=hpo_cr,
    created_by=created_by,
)

Created encoders for 30 fields


In [5]:
# NOTE(review): this cell repeats the encoder construction from the previous
# cell with identical arguments; one of the two cells is likely redundant.
encoder = CaseTemplateEncoder(
    df=df,
    hpo_cr=hpo_cr,
    created_by=created_by,
)

Created encoders for 30 fields


In [6]:
# Set up the variant manager for TBX5 on transcript NM_181486.4. It reads the
# allele strings from the `allele_1` column and the individual identifiers
# from the `individual_id` column of the cohort table.
vmanager = VariantManager(
    df=df,
    gene_symbol="TBX5",
    transcript="NM_181486.4",
    individual_column_name="individual_id",
    allele_1_column_name="allele_1",
)

In [7]:
# Display the per-status summary (mapped vs. unmapped alleles) so unmapped
# variants are caught before they are attached to individuals.
vmanager.to_summary()

Unnamed: 0,status,count,alleles
0,mapped,46,"c.161T>C, c.374delG, c.262A>T, c.215C>A, c.40C>A, c.253C>A, c.100delG , c.145C>A, c.400dup, c.835C>T, c.510+5G>T, c.408C>A, c.106_107insC, c.709C>T, c.584G>C, c.710G>A, c.281T>G, c.148-1G>C, c.781A>T , c.426dup, c.668C>T, c.361T>G, c.316A>G, c.416del, c.710G>C, c.241A>T, c.678G>T, c.100dup, c.456del, c.194del, c.798delA, c.222G>C, c.658_660del, c.587C>G, c.939del, c.451C>T, c.880G>T, c.641del, c.1333del, c.1024del, c.1304del, c.755+2T>C, c.1366C>T, c.755+1G>A, c.873C>A, c.504del"
1,unmapped,0,


In [8]:
# Obtain the encoded individuals and attach their variants before validating.
individuals = encoder.get_individuals()
vmanager.add_variants_to_individuals(individuals)

# Validate the cohort against the ontology with min_hpo=1 and a mono-allelic
# requirement.
cvalidator = CohortValidator(
    cohort=individuals,
    ontology=hpo_ontology,
    min_hpo=1,
    allelic_requirement=AllelicRequirement.MONO_ALLELIC,
)

# Render the validator's quality-control summary as HTML.
qc = QcVisualizer(cohort_validator=cvalidator)
display(HTML(qc.to_summary_html()))

Level,Error category,Count
WARNING,REDUNDANT,144


In [9]:
# Replace `individuals` with the validator's error-free list; all later cells
# (phenopacket export, HPOA table) work from this list.
individuals = cvalidator.get_error_free_individual_list()
# Show the resulting individuals as an HTML table for visual inspection.
table = IndividualTable(individuals)
display(HTML(table.to_html()))

Individual,Disease,Genotype,Phenotypic features
a 6-month-old female (FEMALE; P0D),Holt-Oram syndrome (OMIM:142900),NM_181486.4:c.40C>A (heterozygous),P9M: Pulmonary arterial hypertension (HP:0002092) Perimembranous ventricular septal defect (HP:0011682); excluded: Secundum atrial septal defect (HP:0001684); excluded: Muscular ventricular septal defect (HP:0011623); excluded: Complete atrioventricular canal defect (HP:0001674); excluded: Patent foramen ovale (HP:0001655); excluded: Absent thumb (HP:0009777); excluded: Short thumb (HP:0009778); excluded: Triphalangeal thumb (HP:0001199); excluded: Absent radius (HP:0003974); excluded: Upper limb phocomelia (HP:0009813)
K1:II-2 (UNKNOWN; ),Holt-Oram syndrome (OMIM:142900),NM_181486.4:c.456del (heterozygous),Atrial septal defect (HP:0001631); Absent thumb (HP:0009777); Absent radius (HP:0003974); excluded: Muscular ventricular septal defect (HP:0011623); excluded: Perimembranous ventricular septal defect (HP:0011682); excluded: Complete atrioventricular canal defect (HP:0001674); excluded: Patent foramen ovale (HP:0001655); excluded: Short thumb (HP:0009778); excluded: Triphalangeal thumb (HP:0001199); excluded: Hypoplasia of the radius (HP:0002984); excluded: Hypoplasia of the ulna (HP:0003022); excluded: Short humerus (HP:0005792); excluded: Upper limb phocomelia (HP:0009813)
K2:I-1 (UNKNOWN; ),Holt-Oram syndrome (OMIM:142900),NM_181486.4:c.100del (heterozygous),Absent thumb (HP:0009777); Hypoplasia of the radius (HP:0002984); Hypoplasia of the ulna (HP:0003022); Short humerus (HP:0005792); excluded: Secundum atrial septal defect (HP:0001684); excluded: Muscular ventricular septal defect (HP:0011623); excluded: Perimembranous ventricular septal defect (HP:0011682); excluded: Complete atrioventricular canal defect (HP:0001674); excluded: Patent foramen ovale (HP:0001655); excluded: Short thumb (HP:0009778); excluded: Triphalangeal thumb (HP:0001199); excluded: Absent radius (HP:0003974); excluded: Upper limb phocomelia (HP:0009813)
K2:II-1 (UNKNOWN; ),Holt-Oram syndrome (OMIM:142900),NM_181486.4:c.100del (heterozygous),Secundum atrial septal defect (HP:0001684); Muscular ventricular septal defect (HP:0011623); Absent thumb (HP:0009777); Hypoplastic scapulae (HP:0000882); excluded: Perimembranous ventricular septal defect (HP:0011682); excluded: Complete atrioventricular canal defect (HP:0001674); excluded: Patent foramen ovale (HP:0001655); excluded: Short thumb (HP:0009778); excluded: Triphalangeal thumb (HP:0001199); excluded: Absent radius (HP:0003974); excluded: Hypoplasia of the radius (HP:0002984); excluded: Hypoplasia of the ulna (HP:0003022); excluded: Upper limb phocomelia (HP:0009813)
K2:II-2 (UNKNOWN; ),Holt-Oram syndrome (OMIM:142900),NM_181486.4:c.100del (heterozygous),Muscular ventricular septal defect (HP:0011623); Complete atrioventricular canal defect (HP:0001674); Absent thumb (HP:0009777); Short thumb (HP:0009778); Absent radius (HP:0003974); excluded: Secundum atrial septal defect (HP:0001684); excluded: Perimembranous ventricular septal defect (HP:0011682); excluded: Patent foramen ovale (HP:0001655); excluded: Triphalangeal thumb (HP:0001199); excluded: Upper limb phocomelia (HP:0009813)
K3:II-1 (UNKNOWN; ),Holt-Oram syndrome (OMIM:142900),NM_181486.4:c.100dup (heterozygous),Secundum atrial septal defect (HP:0001684); Muscular ventricular septal defect (HP:0011623); Perimembranous ventricular septal defect (HP:0011682); Complete atrioventricular canal defect (HP:0001674); Absent thumb (HP:0009777); Absent radius (HP:0003974); Ulnar deviation of thumb (HP:0006156); excluded: Patent foramen ovale (HP:0001655); excluded: Triphalangeal thumb (HP:0001199); excluded: Upper limb phocomelia (HP:0009813)
K4:I-2 (UNKNOWN; ),Holt-Oram syndrome (OMIM:142900),NM_181486.4:c.361T>G (heterozygous),Atrial septal defect (HP:0001631); Hypoplasia of the radius (HP:0002984); excluded: Muscular ventricular septal defect (HP:0011623); excluded: Perimembranous ventricular septal defect (HP:0011682); excluded: Complete atrioventricular canal defect (HP:0001674); excluded: Patent foramen ovale (HP:0001655); excluded: Absent thumb (HP:0009777); excluded: Short thumb (HP:0009778); excluded: Triphalangeal thumb (HP:0001199); excluded: Absent radius (HP:0003974); excluded: Hypoplasia of the ulna (HP:0003022); excluded: Short humerus (HP:0005792); excluded: Upper limb phocomelia (HP:0009813)
K4:II-1 (UNKNOWN; ),Holt-Oram syndrome (OMIM:142900),NM_181486.4:c.361T>G (heterozygous),Atrial septal defect (HP:0001631); Hypoplasia of the radius (HP:0002984); Narrow chest (HP:0000774); excluded: Muscular ventricular septal defect (HP:0011623); excluded: Perimembranous ventricular septal defect (HP:0011682); excluded: Complete atrioventricular canal defect (HP:0001674); excluded: Patent foramen ovale (HP:0001655); excluded: Absent thumb (HP:0009777); excluded: Short thumb (HP:0009778); excluded: Triphalangeal thumb (HP:0001199); excluded: Absent radius (HP:0003974); excluded: Hypoplasia of the ulna (HP:0003022); excluded: Short humerus (HP:0005792); excluded: Upper limb phocomelia (HP:0009813)
K4:III-2 (UNKNOWN; ),Holt-Oram syndrome (OMIM:142900),NM_181486.4:c.361T>G (heterozygous),Atrial septal defect (HP:0001631); Short thumb (HP:0009778); Hypoplasia of the radius (HP:0002984); excluded: Muscular ventricular septal defect (HP:0011623); excluded: Perimembranous ventricular septal defect (HP:0011682); excluded: Complete atrioventricular canal defect (HP:0001674); excluded: Patent foramen ovale (HP:0001655); excluded: Absent thumb (HP:0009777); excluded: Triphalangeal thumb (HP:0001199); excluded: Absent radius (HP:0003974); excluded: Upper limb phocomelia (HP:0009813)
K4:III-3 (UNKNOWN; ),Holt-Oram syndrome (OMIM:142900),NM_181486.4:c.361T>G (heterozygous),Hypoplasia of the radius (HP:0002984); excluded: Patent foramen ovale (HP:0001655); excluded: Absent thumb (HP:0009777); excluded: Short thumb (HP:0009778); excluded: Triphalangeal thumb (HP:0001199); excluded: Absent radius (HP:0003974); excluded: Upper limb phocomelia (HP:0009813)


In [10]:
# Export the validated individuals as GA4GH phenopackets (the recorded run
# wrote them to the `phenopackets` directory).
encoder.output_individuals_as_phenopackets(individual_list=individuals)

We output 103 GA4GH phenopackets to the directory phenopackets


In [11]:
# Start an HPOA table builder from the validated individuals.
builder = HpoaTableBuilder.from_individuals(individuals, created_by=created_by)
# Publication cited for the onset and inheritance annotations added below.
pmid = "PMID:12789647"
# NOTE(review): the two 40s are presumably the numerator/denominator of
# individuals with congenital onset in that publication - confirm against
# the HpoaTableBuilder.congenital_onset signature and the cited paper.
builder.congenital_onset(pmid,40,40)
builder.autosomal_dominant(pmid)
hpoa_creator = builder.build()

We found a total of 72 unique HPO terms
Extracted disease: Holt-Oram syndrome (OMIM:142900)


In [13]:
# Keep the HPOA annotation table under its own name rather than rebinding
# `df`: `df` still holds the cohort spreadsheet that the encoder and
# variant-manager cells read, and overwriting it would make those cells use
# the wrong table if they were re-run.
hpoa_df = hpoa_creator.get_dataframe()
hpoa_df.head(40)

Unnamed: 0,#diseaseID,diseaseName,phenotypeID,phenotypeName,onsetID,onsetName,frequency,sex,negation,modifier,description,publication,evidence,biocuration
0,OMIM:142900,Holt-Oram syndrome,HP:0011682,Perimembranous ventricular septal defect,,,1/1,,,,,PMID:28434921,PCS,ORCID:0000-0002-0736-9199
1,OMIM:142900,Holt-Oram syndrome,HP:0001684,Secundum atrial septal defect,,,0/1,,,,,PMID:28434921,PCS,ORCID:0000-0002-0736-9199
2,OMIM:142900,Holt-Oram syndrome,HP:0011623,Muscular ventricular septal defect,,,0/1,,,,,PMID:28434921,PCS,ORCID:0000-0002-0736-9199
3,OMIM:142900,Holt-Oram syndrome,HP:0001674,Complete atrioventricular canal defect,,,0/1,,,,,PMID:28434921,PCS,ORCID:0000-0002-0736-9199
4,OMIM:142900,Holt-Oram syndrome,HP:0001655,Patent foramen ovale,,,0/1,,,,,PMID:28434921,PCS,ORCID:0000-0002-0736-9199
5,OMIM:142900,Holt-Oram syndrome,HP:0009777,Absent thumb,,,0/1,,,,,PMID:28434921,PCS,ORCID:0000-0002-0736-9199
6,OMIM:142900,Holt-Oram syndrome,HP:0009778,Short thumb,,,0/1,,,,,PMID:28434921,PCS,ORCID:0000-0002-0736-9199
7,OMIM:142900,Holt-Oram syndrome,HP:0001199,Triphalangeal thumb,,,0/1,,,,,PMID:28434921,PCS,ORCID:0000-0002-0736-9199
8,OMIM:142900,Holt-Oram syndrome,HP:0003974,Absent radius,,,0/1,,,,,PMID:28434921,PCS,ORCID:0000-0002-0736-9199
9,OMIM:142900,Holt-Oram syndrome,HP:0009813,Upper limb phocomelia,,,0/1,,,,,PMID:28434921,PCS,ORCID:0000-0002-0736-9199


In [14]:
# Write the HPOA annotation table to disk (the recorded run produced
# `OMIM-142900.tab`).
hpoa_creator.write_data_frame()

Wrote HPOA disease file to OMIM-142900.tab
