<h1>KBG Syndrome</h1>
<p>Data from <a href="https://pubmed.ncbi.nlm.nih.gov/36446582/" target="_blank">Martinez-Cayuelas E, et al. Clinical description, molecular delineation and genotype-phenotype correlation in 340 patients with KBG syndrome: addition of 67 new patients. J Med Genet. 2022 Nov 29:jmedgenet-2022-108632. PMID: 36446582</a>.</p>

In [1]:
import os
import hpotk

In [2]:
from genophenocorr.preprocessing import configure_caching_patient_creator

In [3]:
# --- Notebook configuration -------------------------------------------------
# Relative input/output locations used by the cells below.
fpath_hpo = "hpo_data/hp.json"       # ontology file handed to the hpotk loader
fpath_phenopackets = "phenopackets"  # folder handed to load_phenopacket_folder
cache_dir = "annotations"            # handed to configure_caching_patient_creator

# Transcript identifier used when tabulating variants.
tx_id = "NM_013275.6"


In [4]:
# Load the ontology from the file at `fpath_hpo` with hpotk's obographs loader.
hpo: hpotk.ontology.Ontology = hpotk.ontology.load.obographs.load_ontology(
    fpath_hpo,
)

In [5]:
# Patient creator that is later passed to the phenopacket loader.
# NOTE(review): presumably stores its cached annotations under `cache_dir` — confirm.
pc = configure_caching_patient_creator(hpo, cache_dir=cache_dir)

In [6]:
from genophenocorr.preprocessing import load_phenopacket_folder

In [7]:
# Load the cohort from the phenopacket folder, using `pc` to create the patients.
# In the saved run the loader warned about patients for which no variant was found.
patientCohort = load_phenopacket_folder(fpath_phenopackets, pc)

Expected at least one variant per patient, but received none for patient Parenti2016_P1
Expected at least one variant per patient, but received none for patient Low, 2016_P7 (8)
Expected at least one variant per patient, but received none for patient KBG42


In [8]:
from IPython.display import HTML, display
from genophenocorr.view import CohortViewer

# Viewer whose *_table methods produce the HTML shown in the following cells;
# it is constructed from the loaded HPO ontology.
viewer = CohortViewer(hpo)

In [9]:
# Render the cohort-level summary table as HTML.
cohort_summary_html = viewer.cohort_summary_table(patientCohort)
display(HTML(cohort_summary_html))

0,1
Item,Description
Total Individuals,340
Excluded Individuals,"11: VanDongen2019_P5;Reuter2020;KBG31B;VanDongen2019_P9;VanDongen2019_P2;VanDongen2019_P4;VanDongen2019_P8;VanDongen2019_P12;VanDongen2019_P7;VanDongen2019_P13;Novara, 2017_P10"
Total Unique HPO Terms,28
Total Unique Variants,326


In [10]:
# Render the per-HPO-term counts table as HTML.
# TODO: add labels to the output.
hpo_counts_html = viewer.hpo_term_counts_table(patientCohort)
display(HTML(hpo_counts_html))

0,1
HPO Term,Count
Abnormality of dental morphology (HP:0006482),224
Abnormality of higher mental function (HP:0011446),220
Intellectual disability (HP:0001249),194
Abnormality of the hand (HP:0001155),189
Neurodevelopmental delay (HP:0012758),176
Short stature (HP:0004322),150
Abnormal external nose morphology (HP:0010938),134
Abnormal eyebrow morphology (HP:0000534),126
Long philtrum (HP:0000343),121


In [11]:
# Render the variants table for the configured transcript (`tx_id`) as HTML.
variants_html = viewer.variants_table(patientCohort, tx_id)
display(HTML(variants_html))

[WARN] could not identify a single variant for target transcript (got 0), variant 16_87886395_88066394_DEL
c.1903_1907del - 32
c.2408_2412del - 10
c.1381_1384del - 8
c.2398_2401del - 8
c.7481_7482insC - 5
c.6792_6793insC - 5
c.2197C>T - 3
c.4406G>A - 3
c.1977C>G - 3
c.3224_3227del - 3
c.2175_2178del - 3
c.3832A>T - 3
c.2182_2183del - 3
c.7570-1G>C - 3
c.1367_1370del - 2
c.3045del - 2
c.3590_3594del - 2
c.2329_2332del - 2
c.4384_4385insA - 2
c.3309_3310insA - 2
c.5790C>A - 2
c.6513_6514insC - 2
c.1385_1388del - 2
c.7216C>T - 2
c.1318C>T - 2
c.5488G>T - 2
c.7534C>T - 2
c.3704_3707del - 2
c.4087C>T - 2
c.2512C>T - 1
c.4786G>T - 1
c.3931C>T - 1
c.548_551del - 1
NA - 1
c.3208_3209del - 1
c.2647G>T - 1
c.3974del - 1
c.7411_7422del - 1
c.1460_1463del - 1
c.2395A>T - 1
c.7552C>T - 1
c.4389_4390del - 1
c.6472G>T - 1
c.7470+2T>C - 1
c.915del - 1
c.4529_4530insC - 1
c.4103_4104del - 1
c.5889del - 1
c.5146G>T - 1
c.3888_3889insC - 1
c.7180C>T - 1
c.6184del - 1
c.3382_3383del - 1
c.4408A>T - 1
c.37

0,1,2,3
Variant,Effect,Count,Key
c.1903_1907del,FRAMESHIFT_VARIANT,32,16_89284634_89284639_GTGTTT_G
c.2408_2412del,FRAMESHIFT_VARIANT,10,16_89284129_89284134_CTTTTT_C
c.1381_1384del,FRAMESHIFT_VARIANT,8,16_89285157_89285161_GTTTC_G
c.2398_2401del,FRAMESHIFT_VARIANT,8,16_89284140_89284144_TTTTC_T
c.7481_7482insC,FRAMESHIFT_VARIANT,5,16_89275180_89275181_A_AG
c.6792_6793insC,FRAMESHIFT_VARIANT,5,16_89279749_89279750_C_CG
c.2197C>T,STOP_GAINED,3,16_89284345_89284345_G_A
c.4406G>A,STOP_GAINED,3,16_89282136_89282136_C_T
c.1977C>G,STOP_GAINED,3,16_89284565_89284565_G_C


In [None]:
# Show the patients held by the cohort (the return value is the cell output).
patientCohort.list_all_patients()

In [None]:
# Show the proteins held by the cohort (the return value is the cell output).
patientCohort.list_all_proteins()

In [None]:
# Show the cohort data for the transcript configured at the top of the notebook.
# Uses `tx_id` instead of repeating the literal so the transcript is defined
# in exactly one place.
patientCohort.list_data_by_tx(tx_id)

In [None]:
# Same query, but called without a transcript argument.
# NOTE(review): presumably falls back to a default / all transcripts — confirm
# against the Cohort API that calling this with no argument is supported.
patientCohort.list_data_by_tx()

In [None]:
# Display the cohort's `all_proteins` attribute as the cell output.
patientCohort.all_proteins

In [None]:
from genophenocorr.analysis import CohortAnalysis

In [None]:
# Analysis object for the cohort on the configured transcript.
# `tx_id` replaces the repeated 'NM_013275.6' literal so the transcript is set
# only in the configuration cell.
# NOTE(review): include_unmeasured=False presumably skips phenotypes that were
# not assessed in a patient — confirm against the CohortAnalysis documentation.
analysis = CohortAnalysis(patientCohort, tx_id, hpo, include_unmeasured=False)

In [None]:
from genophenocorr.model import VariantEffect

In [None]:
# Inspect the `.value` of the FRAMESHIFT_VARIANT member (shown as the cell output).
VariantEffect.FRAMESHIFT_VARIANT.value

In [None]:
# Run the comparison for the frameshift variant effect.
# NOTE(review): grouping and statistics are defined inside CohortAnalysis and
# are not visible in this notebook.
analysis.compare_by_variant_type(VariantEffect.FRAMESHIFT_VARIANT)

In [None]:
# Run the comparison for a single variant, identified by its key.
# In the saved variants table this key belongs to c.1903_1907del, the most
# frequent variant in the cohort (count 32).
analysis.compare_by_variant('16_89284634_89284639_GTGTTT_G')

In [None]:
# Second analysis on the same transcript, created with include_large_SV=False.
# `tx_id` replaces the repeated 'NM_013275.6' literal so the transcript is set
# only in the configuration cell.
# NOTE(review): include_large_SV=False presumably leaves out large structural
# variants — confirm against the CohortAnalysis documentation.
analysis2 = CohortAnalysis(
    patientCohort,
    tx_id,
    hpo,
    include_unmeasured=False,
    include_large_SV=False,
)

# NOTE(review): exon number 9 is hard-coded; confirm the exon numbering
# convention expected by compare_by_exon.
analysis2.compare_by_exon(9)

In [None]:
from genophenocorr.model import FeatureType

In [None]:
# Run the comparison for protein features of type REGION.
# NOTE(review): how patients are grouped by feature is defined inside
# CohortAnalysis and is not visible in this notebook.
analysis.compare_by_protein_feature_type(FeatureType.REGION)