# SLC4A1 Cryohydrocytosis Individuals
See [OMIM:185020](https://omim.org/entry/185020).

In [1]:
# --- standard library ---
from collections import defaultdict

# --- third-party ---
import pandas as pd
from IPython.display import display, HTML

# --- pyphetools (wildcard imports kept in their original relative order) ---
from pyphetools.creation import *
from pyphetools.visualization import IndividualTable, QcVisualizer
from pyphetools.validation import *
import pyphetools

# Never truncate cell text when a DataFrame is rendered, so long titles and
# term labels are shown in full.
pd.set_option('display.max_colwidth', None)

# Record the library version alongside the results.
print(f"Using pyphetools version {pyphetools.__version__}")

Using pyphetools version 0.9.34


In [2]:
# Load the HPO from a local JSON file (path is relative to this notebook) and
# extract the objects that later cells consume.
parser = HpoParser(hpo_json_file="../hp.json")
# Concept recognizer: handed to CaseTemplateEncoder in a later cell.
hpo_cr = parser.get_hpo_concept_recognizer()
hpo_version = parser.get_version()
# Ontology object: handed to CohortValidator in a later cell.
hpo_ontology = parser.get_ontology()
# Identifier passed to the encoder as `created_by`.
created_by="ORCID:0000-0002-0736-9199"
# Print the ontology release so the output records which HPO version was used.
print(f"HPO version {hpo_version}")

HPO version 2024-01-16


In [3]:
# Read the curated case template. As the preview shows, the first data row
# carries per-column type / HPO-id annotations ("str", "HGVS str", "HP:...")
# rather than an individual; real cases start on the following row.
# NOTE(review): the file name spells "cryohydrosis" (not "cryohydrocytosis");
# it is a runtime path and must match the file on disk, so it is left as is.
df = pd.read_excel("input/slc4a1_cryohydrosis_individuals.xlsx")
df.head()

Unnamed: 0,PMID,title,individual_id,Comment,disease_id,disease_label,transcript,allele_1,allele_2,variant.comment,...,Stomatocytosis,Anisocytosis,Microcytic anemia,Increased red cell osmotic fragility,Reticulocytosis,Hypersplenism,Paroxysmal vertigo,Chronic fatigue,Pseudohyperkalemia,Increased mean corpuscular hemoglobin concentration
0,str,str,str,optional str,str,str,str,HGVS str,HGVS str,optional str,...,HP:0004446,HP:0011273,HP:0001935,HP:0005502,HP:0001923,HP:0001971,HP:0010532,HP:0012432,HP:4000194,HP:0025548
1,PMID:20015879,Cryohydrocytosis: increased activity of cation carriers in red cells from a patient with a band 3 mutation,Patient,,OMIM:185020,Cryohydrocytosis,NM_000342.4,c.2201A>G,na,mutation H734R,...,observed,observed,observed,observed,observed,observed,observed,observed,,


In [4]:
# NOTE(review): this explicit import is presumably already covered by the
# `from pyphetools.creation import *` in the first cell — confirm against the
# package's exports before moving or removing it.
from pyphetools.creation import CaseTemplateEncoder
# Build the template encoder from the DataFrame, the HPO concept recognizer and
# the curator id; construction prints how many field encoders were created.
encoder = CaseTemplateEncoder(df=df, hpo_cr=hpo_cr, created_by=created_by)

Created encoders for 25 fields


In [5]:
# Collect the individuals produced by the encoder; this list is passed to the
# variant manager and the cohort validator in the cells that follow.
individuals = encoder.get_individuals()

In [6]:
# Set up variant handling for the cohort. Constructing the manager already
# encodes the HGVS strings found in the allele column (see the [INFO] line and
# the VariantValidator URL in this cell's output), so it needs network access.
vmanager = VariantManager(
    df=df,
    cohort_name="SLC4A1",
    transcript="NM_000342.4",
    individual_column_name="individual_id",
    allele_1_column_name="allele_1",
)

[INFO] encoding variant "c.2201A>G"
https://rest.variantvalidator.org/VariantValidator/variantvalidator/hg38/NM_000342.4%3Ac.2201A>G/NM_000342.4?content-type=application%2Fjson


In [7]:
# Attach the encoded variants to the individuals. The return value is not
# captured and `individuals` is reused below, so this presumably updates the
# objects in place — confirm against the pyphetools API.
vmanager.add_variants_to_individuals(individuals)

In [8]:
# Validate the cohort against the ontology, configured with min_hpo=1 and a
# mono-allelic requirement, then render the QC summary as HTML.
cvalidator = CohortValidator(
    cohort=individuals,
    ontology=hpo_ontology,
    min_hpo=1,
    allelic_requirement=AllelicRequirement.MONO_ALLELIC,
)
qc = QcVisualizer(cohort_validator=cvalidator)
display(HTML(qc.to_summary_html()))

In [9]:
# Keep only the individuals the validator reports as error-free.
# NOTE: this rebinds `individuals`; the pre-validation list is no longer
# reachable under this name without re-running the earlier cells.
individuals = cvalidator.get_error_free_individual_list()
# Render the retained individuals (disease, genotype, phenotypic features) as
# an HTML table for visual review.
table = IndividualTable(individuals)
display(HTML(table.to_html()))

Individual,Disease,Genotype,Phenotypic features
Patient (MALE; ),Cryohydrocytosis (OMIM:185020),NM_000342.4:c.2201A>G (heterozygous),Hemolytic anemia (HP:0001878); Stomatocytosis (HP:0004446); Anisocytosis (HP:0011273); Microcytic anemia (HP:0001935); Increased red cell osmotic fragility (HP:0005502); Reticulocytosis (HP:0001923); Hypersplenism (HP:0001971); Paroxysmal vertigo (HP:0010532); Chronic fatigue (HP:0012432); excluded: Coombs-positive hemolytic anemia (HP:0004844)


In [10]:
# Write the validated individuals out as GA4GH phenopackets; per the cell
# output they land in the `phenopackets` directory.
encoder.output_individuals_as_phenopackets(individual_list=individuals)

We output 1 GA4GH phenopackets to the directory phenopackets
