<h1>Retinal Degeneration Associated With RPGRIP1</h1>
<p>Data from <a href="https://pubmed.ncbi.nlm.nih.gov/34722527/" target="_blank">Beryozkin A, et al. Retinal Degeneration Associated With RPGRIP1: A Review of Natural History, Mutation Spectrum, and Genotype-Phenotype Correlation in 228 Patients. Front Cell Dev Biol. 2021 Oct 14;9:746781. doi: 10.3389/fcell.2021.746781. PMID: 34722527; PMCID: PMC8551679</a>.</p>

In [1]:
import typing
import os

import hpotk
from phenopackets import Phenopacket

In [2]:
# Locations used by the cells below; all three are relative paths.
fpath_phenopackets: str = 'phenopackets'  # given to load_phenopacket_folder
fpath_hpo: str = 'hpo_data/hp.json'       # given to the hpotk ontology loader
cache_dir: str = 'annotations'            # given as cache_dir= to the patient creator

In [3]:
from genophenocorr.preprocessing import configure_caching_patient_creator

In [4]:
# Parse the HPO file at `fpath_hpo` with hpotk's obographs loader.
hpo: hpotk.ontology.Ontology = hpotk.ontology.load.obographs.load_ontology(
    fpath_hpo
)

# Patient creator handed to the phenopacket loader. It receives the ontology
# and the cache directory; what exactly is cached there is decided by
# genophenocorr and is not visible in this notebook.
phenotype_creator = configure_caching_patient_creator(
    hpo,
    cache_dir=cache_dir,
)

In [5]:
from genophenocorr.preprocessing import load_phenopacket_folder

In [6]:
# Build the cohort from the `fpath_phenopackets` location using the creator
# configured earlier. The messages printed with this cell report entries with
# an unknown alternative allele that were excluded while loading.
patientCohort = load_phenopacket_folder(fpath_phenopackets, phenotype_creator)

Patient 237–523 has unknown alternative variant GNNNN and will not be included.
Patient 79–194 has unknown alternative variant GNNNN and will not be included.
Expected at least one variant per patient, but received none for patient 79–194


In [7]:
# Show the cohort's variants as (variant key, count) pairs; the displayed list
# starts with the highest count.
patientCohort.list_all_variants()

[('14_21312458_A/-', 25),
 ('14_21312434_deletion', 9),
 ('14_21302531_G/-', 8),
 ('14_21345145_C/T', 8),
 ('14_21325252_G/A', 7),
 ('14_21345140_AAGGCCG/-', 7),
 ('14_21327672_-/T', 6),
 ('14_21303542_C/T', 5),
 ('14_21325265_A/G', 5),
 ('14_21348211_AAAG/-', 4),
 ('14_21326131_C/T', 4),
 ('14_21326545_TTTTTAGTAGAGATGGGATTTCTCCATGTTGGTCAGGCTGGTCTTCAACTCCCGACCTCAGGTGAACCTCCCACCTGAGCCTCCCAAAGTGCTGGGATTACAGACGTGAGCCACCGCGCCTGGCTGAACAAACTTTTTCAAGCTCTGTAATGCTGTCTAGTATCTGTCTTTACTAAAGGCCTGTTGTTTCTTAGTGCATGACTACATAGATATCTGATTATAAACTGAGACCTTAACACTCCCCCATCATTCTCTCACTTCTTTTAAACACTGGACACAAGTTAGAGAGATTTCCACACCAGATCATGACAAACACAAATTTCTTGGATTTTTTTTTTCCTCCCAATGTGGAGCTGAGCTCCATACTGTCTTTCCTAACTTTTATACCTAGGATTGTGGGGGTGTACCAAGAGGGGTCAACTCTTTGACTACAGTCCTGGGAGGGTGAGGTGGGGGTATCCATGTTTTCCTTAGGAAGTGGGGATAGCTGCAGTCAGAAACAACCATATTTAACAAGATTCTGGATGCTCCAGGACATGTATGCAGCTCTCTCCTCAATACAACTGCTTAAAAAAAGGCTGACACTTCTGGACACAACTCCTTTGCCAAACAGGGGAGGCAGTATAAGCCACCTGTTAATCAGTGTTACAAATCAGACATCTGGCATTTCGAAAGAGCCATTTTGCTTAAGTTTT

In [8]:
# Show, for each transcript ID, a Counter of variant-effect names and how often
# each occurs (dict of transcript ID -> Counter, as displayed below).
patientCohort.list_data_by_tx()

{'NM_001377949.1': Counter({'intron_variant': 47,
          'frameshift_variant': 16,
          'splice_acceptor_variant': 7,
          'splice_region_variant': 5,
          'stop_gained': 18,
          'missense_variant': 4,
          'splice_donor_variant': 5,
          'feature_truncation': 4,
          'coding_sequence_variant': 7,
          '5_prime_UTR_variant': 3,
          'inframe_deletion': 1,
          'splice_donor_5th_base_variant': 2,
          'synonymous_variant': 1,
          'splice_polypyrimidine_tract_variant': 1}),
 'NM_001377948.1': Counter({'frameshift_variant': 24,
          'splice_acceptor_variant': 7,
          'missense_variant': 22,
          'splice_region_variant': 5,
          'stop_gained': 30,
          'intron_variant': 9,
          'splice_donor_variant': 7,
          'feature_truncation': 4,
          'coding_sequence_variant': 8,
          '5_prime_UTR_variant': 3,
          'inframe_deletion': 1,
          'splice_donor_5th_base_variant': 3,
     

In [9]:
from genophenocorr.analysis import CohortAnalysis

In [18]:
# Cohort analysis on transcript NM_020366.4 with recessive=True. The table
# produced from this object reports homozygous, heterozygous and no-variant
# groups separately.
# NOTE(review): include_unmeasured=False presumably leaves out phenotypes that
# were not assessed -- confirm against the genophenocorr documentation.
rec_analysis = CohortAnalysis(
    patientCohort,
    'NM_020366.4',
    hpo,
    recessive=True,
    include_unmeasured=False,
)

In [19]:
from genophenocorr.constants import VariantEffect
from genophenocorr.model import FeatureType

In [20]:
# Frameshift vs. phenotype under the recessive grouping: the resulting table
# has homozygous / heterozygous / no-frameshift columns plus a p-value and a
# corrected p-value per HPO term. The notice printed with the output shows
# that HP:0000662 hit a divide-by-zero and is left out of this table.
rec_analysis.compare_by_variant_type(VariantEffect.FRAMESHIFT_VARIANT)

Divide by 0 error with HPO HP:0000662, not included in this analysis.


Unnamed: 0_level_0,Homozygous frameshift_variant,Homozygous frameshift_variant,Heterozygous frameshift_variant,Heterozygous frameshift_variant,No frameshift_variant,No frameshift_variant,Unnamed: 7_level_0,Unnamed: 8_level_0
Unnamed: 0_level_1,Count,Percent,Count,Percent,Count,Percent,p-value,Corrected p-values
HP:0001483 (Eye poking),21,84.00%,2,100.00%,5,41.67%,0.024229,0.096914
HP:0012758 (Neurodevelopmental delay),8,11.94%,0,0.00%,4,3.31%,0.038327,0.153306
HP:0000613 (Photophobia),12,100.00%,2,100.00%,16,100.00%,1.0,1.0
HP:0000496 (Abnormality of eye movement),32,100.00%,9,100.00%,50,100.00%,1.0,1.0


In [14]:
# Second analysis over the same cohort and transcript, this time without the
# `recessive` argument; its tables split patients into with / without groups.
dom_analysis = CohortAnalysis(
    patientCohort,
    'NM_020366.4',
    hpo,
    include_unmeasured=False,
)

In [15]:
# Frameshift comparison on the non-recessive analysis: patients are split into
# with / without frameshift_variant groups, and HP:0000662 (Nyctalopia) is
# present in this table.
dom_analysis.compare_by_variant_type(VariantEffect.FRAMESHIFT_VARIANT)

Unnamed: 0_level_0,With frameshift_variant,With frameshift_variant,Without frameshift_variant,Without frameshift_variant,Unnamed: 5_level_0,Unnamed: 6_level_0
Unnamed: 0_level_1,Count,Percent,Count,Percent,p-value,Corrected p-values
HP:0001483 (Eye poking),23,85.19%,5,41.67%,0.016983,0.084915
HP:0012758 (Neurodevelopmental delay),8,8.99%,4,3.31%,0.129644,0.648221
HP:0000613 (Photophobia),14,100.00%,16,100.00%,1.0,1.0
HP:0000662 (Nyctalopia),3,100.00%,3,100.00%,1.0,1.0
HP:0000496 (Abnormality of eye movement),41,100.00%,50,100.00%,1.0,1.0


In [16]:
# With / without comparison for one specific variant. The key uses the same
# format as the list_all_variants() output, where 14_21312458_A/- is the first
# entry (count 25).
dom_analysis.compare_by_variant('14_21312458_A/-')

Divide by 0 error with HPO HP:0000662, not included in this analysis.


Unnamed: 0_level_0,With 14_21312458_A/-,With 14_21312458_A/-,Without 14_21312458_A/-,Without 14_21312458_A/-,Unnamed: 5_level_0,Unnamed: 6_level_0
Unnamed: 0_level_1,Count,Percent,Count,Percent,p-value,Corrected p-values
HP:0001483 (Eye poking),16,100.00%,12,52.17%,0.000919,0.003677
HP:0012758 (Neurodevelopmental delay),4,16.00%,8,4.32%,0.040263,0.161052
HP:0000613 (Photophobia),5,100.00%,25,100.00%,1.0,1.0
HP:0000496 (Abnormality of eye movement),16,100.00%,75,100.00%,1.0,1.0
