# SLC45A2
[Oculocutaneous albinism type IV (OCA4)](https://omim.org/entry/606574) is caused by homozygous or compound heterozygous mutations in the SLC45A2 gene.

In [1]:
import gpsea
import hpotk

# Load a pinned HPO release and report the versions in use.
store = hpotk.configure_ontology_store()
hpo = store.load_minimal_hpo(release='v2023-10-09')
print(f'Loaded HPO v{hpo.version}')
# The label names the package whose version is actually printed (gpsea).
print(f"Using gpsea version {gpsea.__version__}")

Loaded HPO v2023-10-09
Using genophenocorr version 0.6.1.dev0


# SLC45A2
We use the [Matched Annotation from NCBI and EMBL-EBI (MANE)](https://www.ncbi.nlm.nih.gov/refseq/MANE/) transcript and the corresponding protein identifier for SLC45A2.

In [2]:
# Identifiers used throughout the notebook for the gene under study.
gene_symbol = "SLC45A2"
mane_tx_id = "NM_016180.5"  # MANE transcript
mane_protein_id = "NP_057264.4"  # membrane-associated transporter protein isoform

In [3]:
from ppktstore.registry import configure_phenopacket_registry
from gpsea.preprocessing import configure_caching_cohort_creator, load_phenopackets

# Fetch the phenopackets for the gene from release 0.1.20 of the phenopacket store.
phenopacket_registry = configure_phenopacket_registry()
with phenopacket_registry.open_phenopacket_store("0.1.20") as ps:
    phenopackets = tuple(ps.iter_cohort_phenopackets(gene_symbol))

# Build the cohort from the phenopackets; `validation` collects any issues found.
cohort_creator = configure_caching_cohort_creator(hpo)
cohort, validation = load_phenopackets(
    phenopackets=phenopackets,
    cohort_creator=cohort_creator,
)

# Last expression of the cell: display the validation summary.
validation.summarize()

Individuals Processed: 100%|██████████| 30/30 [00:00<00:00, 36.33individuals/s]
Validated under permissive policy


In [None]:
from gpsea.view import CohortViewer

# Render the cohort overview (HPO terms, variants, diseases, variant effects)
# with variants described relative to the MANE transcript.
cv = CohortViewer(hpo=hpo)
cv.process(
    cohort=cohort,
    transcript_id=mane_tx_id,
)

HPO Term,ID,Seen in n individuals
Hypopigmentation of hair,HP:0005599,30
White eyelashes,HP:0002227,29
White eyebrow,HP:0002226,29
Nystagmus,HP:0000639,28
Iris hypopigmentation,HP:0007730,28
Reduced visual acuity,HP:0007663,26
Hypoplasia of the fovea,HP:0007750,26
Iris transillumination defect,HP:0012805,24
Melanocytic nevus,HP:0000995,12
Nevus,HP:0003764,10

Count,Variant key,Variant Name,Protein Variant,Variant Class
12,5_33954406_33954407_TG_T,c.986del,p.Thr329LysfsTer69,FRAMESHIFT_VARIANT
4,5_33944770_33944770_C_T,c.1471G>A,p.Gly491Arg,MISSENSE_VARIANT
3,5_33947363_33947365_CTT_C,c.1166_1167del,p.Lys389SerfsTer55,FRAMESHIFT_VARIANT
2,5_33944709_33944709_G_T,c.1532C>A,p.Ala511Glu,MISSENSE_VARIANT
2,5_33947257_33947258_AG_A,c.1273del,p.Leu425TrpfsTer9,FRAMESHIFT_VARIANT
2,5_33944734_33944735_TC_T,c.1506del,p.Thr503ProfsTer6,FRAMESHIFT_VARIANT
2,5_33944723_33944723_G_A,c.1518C>T,p.Val506=,SYNONYMOUS_VARIANT
2,5_33954363_33954365_GGC_G,c.1028_1029del,p.Gly343AlafsTer10,FRAMESHIFT_VARIANT
2,5_33951674_33951674_C_A,c.1036G>T,p.Val346Leu,MISSENSE_VARIANT
2,5_33984325_33984326_CG_C,c.258del,p.Val87TrpfsTer26,FRAMESHIFT_VARIANT

Disease Name,Disease ID,Annotation Count
"Albinism, oculocutaneous, type IV",OMIM:606574,30

Variant effect,Annotation Count,Percent
FRAMESHIFT_VARIANT,26,48%
MISSENSE_VARIANT,21,39%
SYNONYMOUS_VARIANT,2,4%
SPLICE_REGION_VARIANT,1,2%
SPLICE_POLYPYRIMIDINE_TRACT_VARIANT,1,2%
INTRON_VARIANT,1,2%
TRANSCRIPT_ABLATION,1,2%
STOP_GAINED,1,2%


In [7]:
# Note: we do not show the structure because no domains/motifs are shown in UniProt (Q9UMX9).

In [8]:
from gpsea.view import CohortVariantViewer

# Tabulate the cohort's variants as described on the MANE transcript;
# the result of `process` is the cell's displayed output.
viewer = CohortVariantViewer(tx_id=mane_tx_id)
viewer.process(cohort)

Variant key,Variant (cDNA),Variant (protein),Overlapping Exons,Effects,Count
5_33954406_33954407_TG_T,c.986del,p.Thr329LysfsTer69,4.0,frameshift,12
5_33944770_33944770_C_T,c.1471G>A,p.Gly491Arg,7.0,missense,4
5_33947363_33947365_CTT_C,c.1166_1167del,p.Lys389SerfsTer55,6.0,frameshift,3
5_33947257_33947258_AG_A,c.1273del,p.Leu425TrpfsTer9,6.0,frameshift,2
5_33944709_33944709_G_T,c.1532C>A,p.Ala511Glu,7.0,missense,2
5_33984325_33984326_CG_C,c.258del,p.Val87TrpfsTer26,1.0,frameshift,2
5_33944723_33944723_G_A,c.1518C>T,p.Val506=,7.0,synonymous,2
5_33954443_33954443_T_C,c.950A>G,p.Tyr317Cys,4.0,missense,2
5_33954363_33954365_GGC_G,c.1028_1029del,p.Gly343AlafsTer10,4.0,frameshift,2
5_33951674_33951674_C_A,c.1036G>T,p.Val346Leu,5.0,missense,2


In [9]:
from gpsea.analysis.mtc_filter import HpoMtcFilter
from gpsea.analysis.pcats import HpoTermAnalysis
from gpsea.analysis.pcats.stats import FisherExactTest
from gpsea.analysis.predicate.phenotype import prepare_predicates_for_terms_of_interest

# Phenotype predicates for the HPO terms of interest in this cohort.
pheno_predicates = prepare_predicates_for_terms_of_interest(
    cohort=cohort,
    hpo=hpo,
)

# Multiple-testing configuration: default HPO term filter, then the
# 'fdr_bh' correction applied at alpha = 0.05.
mtc_filter = HpoMtcFilter.default_filter(hpo=hpo)
mtc_correction = 'fdr_bh'
mtc_alpha = 0.05

# Fisher's exact test is the count statistic used for each tested term.
count_statistic = FisherExactTest()

analysis = HpoTermAnalysis(
    count_statistic=count_statistic,
    mtc_filter=mtc_filter,
    mtc_correction=mtc_correction,
    mtc_alpha=mtc_alpha,
)

In [10]:
from gpsea.analysis.predicate.genotype import VariantPredicates, biallelic_predicate
from gpsea.model import VariantEffect
from gpsea.view import MtcStatsViewer

# Variant predicate: missense effect on the MANE transcript.
missense = VariantPredicates.variant_effect(
    VariantEffect.MISSENSE_VARIANT,
    tx_id=mane_tx_id,
)

# Biallelic genotype predicate. The partitions merge the first two allele
# groups, so the comparison is
# "missense/missense OR missense/other" versus "other/other".
gt_predicate = biallelic_predicate(
    a_predicate=missense,
    b_predicate=~missense,
    a_label="missense",
    b_label="other",
    partitions=((0, 1), (2,)),
)
print(gt_predicate.display_question())

# Test each phenotype predicate against the genotype groups.
result = analysis.compare_genotype_vs_phenotypes(
    cohort=cohort,
    gt_predicate=gt_predicate,
    pheno_predicates=pheno_predicates,
)

# Report which HPO terms the multiple-testing filter skipped, and why.
viewer = MtcStatsViewer()
viewer.process(result)

Allele group: missense/missense OR missense/other, other/other


Code,Reason,Count
HMF01,Skipping term with maximum frequency that was less than threshold 0.4,2
HMF03,Skipping term because of a child term with the same individual counts,13
HMF08,Skipping general term,19
HMF09,Skipping term with maximum annotation frequency that was less than threshold 0.4,5


In [11]:
from gpsea.view import summarize_hpo_analysis

# Show per-term counts, percentages and p values for the two genotype groups.
summarize_hpo_analysis(
    hpo=hpo,
    result=result,
)

Allele group,missense/missense OR missense/other,missense/missense OR missense/other,other/other,other/other,Unnamed: 5_level_0,Unnamed: 6_level_0
Unnamed: 0_level_1,Count,Percent,Count,Percent,Corrected p values,p values
Iris transillumination defect [HP:0012805],13/17,76%,11/11,100%,1.0,0.132357
Esotropia [HP:0000565],4/16,25%,5/10,50%,1.0,0.234117
Heterotropia [HP:0032012],6/18,33%,7/12,58%,1.0,0.264122
Strabismus [HP:0000486],6/18,33%,7/12,58%,1.0,0.264122
Nystagmus [HP:0000639],16/18,89%,12/12,100%,1.0,0.503448
Iris hypopigmentation [HP:0007730],16/18,89%,12/12,100%,1.0,0.503448
Melanocytic nevus [HP:0000995],9/14,64%,3/6,50%,1.0,0.642415
Nevus [HP:0003764],13/18,72%,9/12,75%,1.0,1.0
Localized skin lesion [HP:0011355],13/13,100%,9/9,100%,1.0,1.0
Abnormal iris pigmentation [HP:0008034],17/17,100%,12/12,100%,1.0,1.0
