# HNRPA2B1
Variants in HNRPA2B1 are associated with [Oculopharyngeal muscular dystrophy 2](https://omim.org/entry/620460).

In [1]:
import pandas as pd
pd.set_option('display.max_colwidth', None) # show entire column contents, important!
from IPython.display import HTML, display
from pyphetools.creation import *
from pyphetools.visualization import *
from pyphetools.validation import *
import pyphetools
print(f"pyphetools version {pyphetools.__version__}")

pyphetools version 0.9.64


In [2]:
PMID = "PMID:35484142"
title = "Heterozygous frameshift variants in HNRNPA2B1 cause early-onset oculopharyngeal muscular dystrophy"
cite = Citation(pmid=PMID, title=title)
parser = HpoParser(hpo_json_file="../hp.json")
hpo_cr = parser.get_hpo_concept_recognizer()
hpo_version = parser.get_version()
hpo_ontology = parser.get_ontology()
metadata = MetaData(created_by="ORCID:0000-0002-5648-2155", citation=cite)
metadata.default_versions_with_hpo(version=hpo_version)
print(f"HPO version {hpo_version}")

HPO version 2024-02-27


In [3]:
df = pd.read_excel('input/HNRPA2B1_Kim_2022.xlsx')
df.head(2)

Unnamed: 0,Family/Patient,Ethnicity,Sex,age at last examination (y),allele,Pathogenic HNRNPA2B1 variant,Inheritance,age_of_onset,Onset,Pattern of muscle weakness,CK level U/L
0,F1/P1,Italian/Colombian,M,12,c.992del,"c.992delG, p.(G331Efs*28)",de novo,P2Y,Swallowing difficulties (2 y),"Ptosis, ophthalmoplegia, tongue weakness, dysphonia, symmetric proximal and distal weakness in LE > UE; moderate progression, dysphagia, respiratory insufficiency",724
1,F2/P2,Northern European,M,17,c.981del,"c.981delA, p.(G328Afs*31)",de novo,Neonatal onset,Neonatal feeding difficulties,"Ptosis, ophthalmoplegia, symmetric proximal and distal weakness in LE > UE; moderate progression, dysphagia",602


In [4]:
#res = OptionColumnMapper.autoformat(df=df, hpo_cr=hpo_cr)
#print(res)
column_mapper_list = list()

In [5]:
onset_d = {'Swallowing difficulties (2\u2009y)': 'Dysphagia',
 'Neonatal feeding difficulties': 'Feeding difficulties',
 'Muscle weakness (6\u2009y)': 'Muscle weakness',
 'Ptosis': 'Ptosis',
 'ophthalmoplegia (18\u2009y)': 'Ophthalmoplegia',
 'ophthalmoplegia': 'Ophthalmoplegia',
 'dysphagia (17\u2009y)': 'Dysphagia',
 'Respiratory insufficiency requiring tracheostomy (birth)': 'Respiratory insufficiency',
 'ophthalmoplegia (6 months)': 'Ophthalmoplegia',
 'Delayed motor milestones (infancy)': 'Motor delay',
 'Respiratory illness with acute onset ptosis (18 months)': 'Ptosis',
}
excluded = {}
onsetMapper = OptionColumnMapper(column_name="Onset", concept_recognizer=hpo_cr, option_d=onset_d, excluded_d=excluded)
column_mapper_list.append(onsetMapper)
onsetMapper.preview_column(df)

Unnamed: 0,mapping,count
0,Dysphagia (HP:0002015) (observed),2
1,Feeding difficulties (HP:0011968) (observed),1
2,Muscle weakness (HP:0001324) (observed),1
3,Ptosis (HP:0000508) (observed),4
4,Ophthalmoplegia (HP:0000602) (observed),3
5,Respiratory insufficiency (HP:0002093) (observed),1
6,Motor delay (HP:0001270) (observed),1


In [6]:
pattern_of_muscle_weakness_d = {'Ptosis': 'Ptosis',
 'ophthalmoplegia': 'Ophthalmoplegia',
 'dysphonia': 'Dysphonia',
 'symmetric proximal and distal weakness in LE\u2009>\u2009UE; moderate progression': 'Asthenia',
 'dysphagia': 'Dysphagia',
 'respiratory insufficiency': 'Respiratory insufficiency',
 'symmetric proximal and distal weakness in LE\u2009>\u2009UE; dysphagia': 'Lower limb muscle weakness',
 'asymmetric proximal and distal weakness LE\u2009>\u2009UE; mild progression': 'Lower limb muscle weakness',
 'axial weakness; respiratory insufficiency': 'Axial muscle weakness',
 'loss of independent ambulation (8 years)': 'Loss of ambulation',
 'axial weakness': 'Axial muscle weakness',
 'symmetric proximal UE and LE weakness': 'Limb muscle weakness',
 'symmetric proximal and distal weakness LE\u2009>\u2009UE; moderate/severe progression': 'Limb muscle weakness',
 'symmetric LE\u2009>\u2009UE proximal': 'Proximal muscle weakness in lower limbs',
 'distal and axial weakness; loss of independent ambulation (7 years)': 'Axial muscle weakness',
 'ankle contractures': 'Ankle contracture',
 'symmetric LE\u2009>\u2009UE proximal muscle weakness': 'Proximal muscle weakness'}
excluded = {}
pattern_of_muscle_weaknessMapper = OptionColumnMapper(column_name="Pattern of muscle weakness", concept_recognizer=hpo_cr, option_d=pattern_of_muscle_weakness_d, excluded_d=excluded)
column_mapper_list.append(pattern_of_muscle_weaknessMapper)
pattern_of_muscle_weaknessMapper.preview_column(df)

Unnamed: 0,mapping,count
0,Ptosis (HP:0000508) (observed),11
1,Ophthalmoplegia (HP:0000602) (observed),11
2,Asthenia (HP:0025406) (observed),9
3,Dysphonia (HP:0001618) (observed),5
4,Dysphagia (HP:0002015) (observed),9
5,Respiratory insufficiency (HP:0002093) (observed),9
6,Axial muscle weakness (HP:0003327) (observed),3
7,Loss of ambulation (HP:0002505) (observed),1
8,Limb muscle weakness (HP:0003690) (observed),1
9,Proximal muscle weakness in lower limbs (HP:0008994) (observed),1


In [7]:
ck = Thresholder.creatine_kinase_blood()
ckMapper = ThresholdedColumnMapper(column_name="CK level U/L", thresholder=ck)
ckMapper.preview_column(df)

Unnamed: 0,mapping: 30.0-170.0 U/L,count
0,Elevated circulating creatine kinase concentration (HP:0003236): observed,11


In [8]:
HNRNPA2B1_transcript = "NM_002137.4"

vman = VariantManager(df=df, individual_column_name="Family/Patient", gene_symbol="HNRNPA2B1",
                     transcript=HNRNPA2B1_transcript, allele_1_column_name="allele")

In [9]:
vman.to_summary()

Unnamed: 0,status,count,alleles
0,mapped,9,"c.984del, c.1001_1002dup, c.981del, c.992del, c.996_997dup, c.980_986del, c.1001del, c.974del, c.966del"
1,unmapped,0,


In [10]:
varMapper = VariantColumnMapper(variant_column_name="allele", 
                                variant_d=vman.get_variant_d(),
                                default_genotype="heterozygous")

In [11]:
ageLastEncounterMapper = AgeColumnMapper.by_year(column_name="age at last examination (y)")
#ageLastEncounterMapper.preview_column(df)
ageOnsetMapper = AgeColumnMapper.iso8601(column_name="age_of_onset")
#ageOnsetMapper.preview_column(df)
sexMapper = SexColumnMapper(column_name="Sex", male_symbol="M", female_symbol="F")
#sexMapper.preview_column(df)

In [12]:
OPMD2 = Disease(disease_id='OMIM:620460', disease_label='Oculopharyngeal muscular dystrophy 2')
 	 	
encoder = CohortEncoder(df=df, 
                        hpo_cr=hpo_cr, 
                        column_mapper_list=column_mapper_list, 
                        individual_column_name="Family/Patient", 
                        age_of_onset_mapper=ageOnsetMapper,
                        age_at_last_encounter_mapper=ageLastEncounterMapper,
                        sexmapper=sexMapper,
                        variant_mapper=varMapper,
                        metadata=metadata)
encoder.set_disease(OPMD2)

In [13]:
individuals = encoder.get_individuals()

Could not parse the following as ISO8601 ages: Neonatal onset (n=1), Congenital onset (n=1), Infantile onset (n=1), Childhood onset (n=1)


In [14]:
cvalidator = CohortValidator(cohort=individuals, ontology=hpo_ontology, min_hpo=1, allelic_requirement=AllelicRequirement.MONO_ALLELIC)
qc = QcVisualizer(cohort_validator=cvalidator)
display(HTML(qc.to_summary_html()))

Level,Error category,Count


In [15]:
individuals = cvalidator.get_error_free_individual_list()
table = PhenopacketTable(individual_list=individuals, metadata=metadata)
display(HTML(table.to_html()))

Individual,Disease,Genotype,Phenotypic features
F1/P1 (MALE; P12Y),Oculopharyngeal muscular dystrophy 2 (OMIM:620460),NM_002137.4:c.992del (heterozygous),Ptosis (HP:0000508); Dysphagia (HP:0002015); Respiratory insufficiency (HP:0002093); Asthenia (HP:0025406); Dysphonia (HP:0001618); Ophthalmoplegia (HP:0000602)
F2/P2 (MALE; P17Y),Oculopharyngeal muscular dystrophy 2 (OMIM:620460),NM_002137.4:c.981del (heterozygous),Feeding difficulties (HP:0011968); Ptosis (HP:0000508); Ophthalmoplegia (HP:0000602); Asthenia (HP:0025406); Dysphagia (HP:0002015)
F3/P3 (FEMALE; P17Y),Oculopharyngeal muscular dystrophy 2 (OMIM:620460),NM_002137.4:c.984del (heterozygous),Muscle weakness (HP:0001324); Ptosis (HP:0000508); Ophthalmoplegia (HP:0000602); Dysphonia (HP:0001618); Asthenia (HP:0025406); Dysphagia (HP:0002015)
F4/P4 (FEMALE; P40Y),Oculopharyngeal muscular dystrophy 2 (OMIM:620460),NM_002137.4:c.968del (heterozygous),Dysphagia (HP:0002015); Respiratory insufficiency (HP:0002093); Ophthalmoplegia (HP:0000602); Asthenia (HP:0025406); Ptosis (HP:0000508)
F4/P5 (FEMALE; P43Y),Oculopharyngeal muscular dystrophy 2 (OMIM:620460),NM_002137.4:c.968del (heterozygous),Dysphagia (HP:0002015); Respiratory insufficiency (HP:0002093); Ophthalmoplegia (HP:0000602); Asthenia (HP:0025406); Ptosis (HP:0000508)
F5/P6 (FEMALE; P12Y),Oculopharyngeal muscular dystrophy 2 (OMIM:620460),NM_002137.4:c.1001del (heterozygous),Dysphagia (HP:0002015); Respiratory insufficiency (HP:0002093); Ophthalmoplegia (HP:0000602); Asthenia (HP:0025406); Ptosis (HP:0000508)
F6/P7 (FEMALE; P9Y),Oculopharyngeal muscular dystrophy 2 (OMIM:620460),NM_002137.4:c.996_997dup (heterozygous),Dysphagia (HP:0002015); Respiratory insufficiency (HP:0002093); Loss of ambulation (HP:0002505); Ophthalmoplegia (HP:0000602); Dysphonia (HP:0001618); Axial muscle weakness (HP:0003327); Ptosis (HP:0000508)
F7/P8 (MALE; P20Y),Oculopharyngeal muscular dystrophy 2 (OMIM:620460),NM_002137.4:c.980_986del (heterozygous),Motor delay (HP:0001270); Ptosis (HP:0000508); Ophthalmoplegia (HP:0000602); Dysphonia (HP:0001618); Axial muscle weakness (HP:0003327); Limb muscle weakness (HP:0003690); Respiratory insufficiency (HP:0002093)
F8/P9 (MALE; P35Y),Oculopharyngeal muscular dystrophy 2 (OMIM:620460),NM_002137.4:c.974del (heterozygous),Dysphagia (HP:0002015); Respiratory insufficiency (HP:0002093); Ophthalmoplegia (HP:0000602); Asthenia (HP:0025406); Ptosis (HP:0000508)
F9/P10 (FEMALE; P7Y),Oculopharyngeal muscular dystrophy 2 (OMIM:620460),NM_002137.4:c.996_997dup (heterozygous),Ankle contracture (HP:0034677); Dysphagia (HP:0002015); Respiratory insufficiency (HP:0002093); Ophthalmoplegia (HP:0000602); Proximal muscle weakness in lower limbs (HP:0008994); Dysphonia (HP:0001618); Axial muscle weakness (HP:0003327); Ptosis (HP:0000508)


In [16]:
Individual.output_individuals_as_phenopackets(individual_list=individuals,
                                              metadata=metadata)

We output 11 GA4GH phenopackets to the directory phenopackets


# HPOA file

In [17]:
ingestor = PhenopacketIngestor(indir="phenopackets")
ppkt_d = ingestor.get_phenopacket_dictionary()
ppkt_list = list(ppkt_d.values())

[pyphetools] Ingested 11 GA4GH phenopackets.


In [18]:
builder = HpoaTableBuilder(phenopacket_list=ppkt_list)
builder.autosomal_dominant(PMID)
hpoa_table_creator = builder.build()
df = hpoa_table_creator.get_dataframe()
df.head(20)

We found a total of 15 unique HPO terms
Extracted disease: Oculopharyngeal muscular dystrophy 2 (OMIM:620460)


Unnamed: 0,#diseaseID,diseaseName,phenotypeID,phenotypeName,onsetID,onsetName,frequency,sex,negation,modifier,description,publication,evidence,biocuration
0,OMIM:620460,Oculopharyngeal muscular dystrophy 2,HP:0002015,Dysphagia,,,9/9,,,,,PMID:35484142,PCS,ORCID:0000-0002-5648-2155
1,OMIM:620460,Oculopharyngeal muscular dystrophy 2,HP:0002093,Respiratory insufficiency,,,9/9,,,,,PMID:35484142,PCS,ORCID:0000-0002-5648-2155
2,OMIM:620460,Oculopharyngeal muscular dystrophy 2,HP:0000602,Ophthalmoplegia,,,11/11,,,,,PMID:35484142,PCS,ORCID:0000-0002-5648-2155
3,OMIM:620460,Oculopharyngeal muscular dystrophy 2,HP:0025406,Asthenia,,,7/7,,,,,PMID:35484142,PCS,ORCID:0000-0002-5648-2155
4,OMIM:620460,Oculopharyngeal muscular dystrophy 2,HP:0000508,Ptosis,,,11/11,,,,,PMID:35484142,PCS,ORCID:0000-0002-5648-2155
5,OMIM:620460,Oculopharyngeal muscular dystrophy 2,HP:0003701,Proximal muscle weakness,,,1/1,,,,,PMID:35484142,PCS,ORCID:0000-0002-5648-2155
6,OMIM:620460,Oculopharyngeal muscular dystrophy 2,HP:0011968,Feeding difficulties,,,1/1,,,,,PMID:35484142,PCS,ORCID:0000-0002-5648-2155
7,OMIM:620460,Oculopharyngeal muscular dystrophy 2,HP:0034677,Ankle contracture,,,1/1,,,,,PMID:35484142,PCS,ORCID:0000-0002-5648-2155
8,OMIM:620460,Oculopharyngeal muscular dystrophy 2,HP:0008994,Proximal muscle weakness in lower limbs,,,1/1,,,,,PMID:35484142,PCS,ORCID:0000-0002-5648-2155
9,OMIM:620460,Oculopharyngeal muscular dystrophy 2,HP:0001618,Dysphonia,,,5/5,,,,,PMID:35484142,PCS,ORCID:0000-0002-5648-2155


In [19]:
hpoa_table_creator.write_data_frame()

Wrote HPOA disease file to OMIM-620460.tab
