<h1>Sulfite Oxidase Deficiency SUOX</h1>
<p>Data from <a href="https://pubmed.ncbi.nlm.nih.gov/36303223/" target="_blank">Li JT, Chen ZX, Chen XJ, Jiang YX. Mutation analysis of SUOX in isolated sulfite oxidase deficiency with ectopia lentis as the presenting feature: insights into genotype-phenotype correlation. Orphanet J Rare Dis. 2022 Oct 27;17(1):392. doi: 10.1186/s13023-022-02544-x. PMID: 36303223; PMCID: PMC9615255.</a></p>

In [1]:
import typing
import os

import hpotk
from phenopackets import Phenopacket

In [2]:
# Input and cache locations used by the cells below. All three are relative
# paths, so they resolve against the kernel's working directory.
fpath_hpo = "hpo_data/hp.json"  # ontology file handed to hpotk's obographs loader
cache_dir = "annotations"  # forwarded as `cache_dir=` when the patient creator is configured
fpath_phenopackets = "phenopackets"  # folder handed to `load_phenopacket_folder`

In [3]:
from genophenocorr.preprocessing import configure_caching_patient_creator

In [4]:
# Parse the HPO ontology from the Obographs JSON file configured in `fpath_hpo`.
hpo: hpotk.ontology.Ontology = hpotk.ontology.load.obographs.load_ontology(
    fpath_hpo
)

# Build the creator that `load_phenopacket_folder` receives in a later cell.
# `cache_dir` is forwarded so the helper can keep its cache there (presumably
# variant annotations, going by the directory name — confirm against
# genophenocorr).
phenotype_creator = configure_caching_patient_creator(
    hpo,
    cache_dir=cache_dir,
)

In [5]:
from genophenocorr.preprocessing import load_phenopacket_folder

In [6]:
# Load the phenopacket folder at `fpath_phenopackets` into a cohort object,
# using the patient creator configured earlier in the notebook.
patientCohort = load_phenopacket_folder(
    fpath_phenopackets,
    phenotype_creator,
)

In [7]:
from IPython.display import HTML, display
from genophenocorr.view import CohortViewer

# Cohort viewer bound to the loaded ontology.
# NOTE(review): `viewer`, `HTML` and `display` are not used by any cell visible
# in this notebook — confirm whether this cell is still needed.
viewer = CohortViewer(hpo)

In [8]:
# Variant tally for the cohort; the recorded output is a list of
# (variant key, count) pairs. The argument presumably caps the list length
# (10 entries are shown) — confirm against the genophenocorr API.
patientCohort.list_all_variants(10)

[('12_56004589_56004589_C_G', 7),
 ('12_56004039_56004039_G_A', 3),
 ('12_56004485_56004485_C_T', 3),
 ('12_56004765_56004765_G_A', 3),
 ('12_56004905_56004909_ATTGT_A', 2),
 ('12_56004933_56004959_A_ACAATGTGCAGCCAGACACCGTGGCCC', 2),
 ('12_56004771_56004771_A_T', 2),
 ('12_56004273_56004273_G_A', 2),
 ('12_56004192_56004192_G_A', 1),
 ('12_56004161_56004161_A_C', 1)]

In [9]:
# Phenotype tally for the cohort; the recorded output pairs each HPO term id
# with a count.
patientCohort.list_all_phenotypes()

[('HP:0001250', 28),
 ('HP:0001252', 15),
 ('HP:0001276', 11),
 ('HP:0002071', 11),
 ('HP:0000252', 10),
 ('HP:0012758', 8),
 ('HP:0001083', 7),
 ('HP:0034332', 6)]

In [10]:
# Variant-effect counts per transcript; the recorded output is a dict keyed by
# transcript accession whose values are `Counter`s of variant effects.
# 'NM_000456.3' from this listing is the transcript passed to `CohortAnalysis`
# later in the notebook.
patientCohort.list_data_by_tx()

{'NM_001032386.2': Counter({'MISSENSE_VARIANT': 29,
          'FRAMESHIFT_VARIANT': 9,
          'STOP_GAINED': 10}),
 'NM_000456.3': Counter({'MISSENSE_VARIANT': 29,
          'FRAMESHIFT_VARIANT': 9,
          'STOP_GAINED': 10}),
 'NM_001032387.2': Counter({'MISSENSE_VARIANT': 29,
          'FRAMESHIFT_VARIANT': 9,
          'STOP_GAINED': 10})}

In [11]:
# Cohort size: the number of items returned by `list_all_patients()`.
len(patientCohort.list_all_patients())

35

In [20]:
from genophenocorr.analysis import CohortAnalysis
from genophenocorr.model import VariantEffect

In [21]:
# Set up the cohort analysis on transcript NM_000456.3 (one of the transcripts
# reported by `list_data_by_tx()` earlier in the notebook).
# NOTE(review): 'fdr_bh' is presumably the Benjamini–Hochberg FDR procedure as
# named by statsmodels' `multipletests` — confirm against genophenocorr.
analysis = CohortAnalysis(
    patientCohort,
    'NM_000456.3',
    hpo,
    include_unmeasured=False,
    recessive=True,
    p_val_correction='fdr_bh',
)

In [22]:
# Compare HPO term frequencies across missense-variant genotype groups. The
# recorded table has homozygous / heterozygous / no-missense columns (count and
# percent) plus a raw and a corrected p-value per term.
analysis.compare_by_variant_type(VariantEffect.MISSENSE_VARIANT)

Unnamed: 0_level_0,Homozygous missense_variant,Homozygous missense_variant,Heterozygous missense_variant,Heterozygous missense_variant,No missense_variant,No missense_variant,Unnamed: 7_level_0,Unnamed: 8_level_0
Unnamed: 0_level_1,Count,Percent,Count,Percent,Count,Percent,p-value,Corrected p-values
HP:0034332 (Cognitive regression),6,50.00%,0,0.00%,0,0.00%,0.023343,0.158119
HP:0001252 (Hypotonia),10,90.91%,2,40.00%,3,42.86%,0.03953,0.158119
HP:0001250 (Seizure),12,66.67%,5,83.33%,11,100.00%,0.08264,0.220373
HP:0002071 (Abnormality of extrapyramidal motor function),8,66.67%,1,20.00%,2,25.00%,0.139377,0.242998
HP:0012758 (Neurodevelopmental delay),4,33.33%,0,0.00%,4,50.00%,0.151874,0.242998
HP:0001083 (Ectopia lentis),3,27.27%,3,75.00%,1,33.33%,0.334276,0.445701
HP:0000252 (Microcephaly),4,40.00%,2,50.00%,4,57.14%,0.849964,0.971388
HP:0001276 (Hypertonia),5,45.45%,2,40.00%,4,57.14%,1.0,1.0


In [19]:
# Compare HPO term frequencies across genotype groups for one specific variant
# (the entry listed first, with count 7, in the `list_all_variants` output).
# NOTE(review): this cell's execution count (19) is lower than that of the cell
# that builds `analysis` (21), so the recorded table may come from an earlier
# `analysis` object — re-run with Restart Kernel -> Run All before relying on it.
analysis.compare_by_variant('12_56004589_56004589_C_G')

Unnamed: 0_level_0,Homozygous 12_56004589_56004589_C_G,Homozygous 12_56004589_56004589_C_G,Heterozygous 12_56004589_56004589_C_G,Heterozygous 12_56004589_56004589_C_G,No 12_56004589_56004589_C_G,No 12_56004589_56004589_C_G,Unnamed: 7_level_0,Unnamed: 8_level_0
Unnamed: 0_level_1,Count,Percent,Count,Percent,Count,Percent,p-value,Corrected p-values
HP:0001252 (Hypotonia),0,0.00%,1,25.00%,14,77.78%,0.032869,0.26295
HP:0001083 (Ectopia lentis),0,0.00%,2,100.00%,5,33.33%,0.137255,0.468687
HP:0012758 (Neurodevelopmental delay),0,0.00%,0,0.00%,8,42.11%,0.175758,0.468687
HP:0002071 (Abnormality of extrapyramidal motor function),0,0.00%,1,20.00%,10,52.63%,0.34058,0.681159
HP:0034332 (Cognitive regression),0,0.00%,0,0.00%,6,31.58%,0.452851,0.724562
HP:0001276 (Hypertonia),1,100.00%,1,25.00%,9,50.00%,0.590062,0.786749
HP:0000252 (Microcephaly),1,100.00%,1,33.33%,8,47.06%,1.0,1.0
HP:0001250 (Seizure),2,100.00%,4,80.00%,22,78.57%,1.0,1.0
