# KnownCancer Annotation Test

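Simple test of pyMut's `knownCancer` annotation function: the TCGA LAML example MAF is annotated with the COSMIC Cancer Gene Census and OncoKB cancer gene list tables, and only the rows where `Is_Oncogene_any` is `True` are displayed.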


In [1]:
import sys
import pandas as pd
from pathlib import Path
import logging

# Put the in-repo `src` directory first on the import path. This has to run
# before the pyMut import below. The entry is a relative path, so it is
# resolved against the kernel's current working directory.
sys.path.insert(0, '../../src')

from pyMut.annotate.cosmic_cancer_annotate import knownCancer

# Set the root logger's level to WARNING; loggers that inherit their level
# from the root will then drop DEBUG/INFO messages, keeping cell output short.
logging.getLogger().setLevel(logging.WARNING)


In [2]:
# Input files, given as relative paths (resolved against the working directory):
#   maf_file    - gzipped example MAF (tcga_laml)
#   cosmic_file - gzipped COSMIC Cancer Gene Census TSV (v102, GRCh38)
#   oncokb_file - OncoKB cancer gene list TSV
maf_file, cosmic_file, oncokb_file = map(
    Path,
    (
        "../../src/pyMut/data/examples/tcga_laml.maf.gz",
        "../../src/pyMut/data/resources/Cosmic_CancerGeneCensus_Tsv_v102_GRCh38/Cosmic_CancerGeneCensus_v102_GRCh38.tsv.gz",
        "../../src/pyMut/data/resources/OncoKb/cancerGeneList.tsv",
    ),
)


In [3]:
# Annotate the MAF with the COSMIC and OncoKB tables. The call's result is
# unpacked into two values: result_df (used as a DataFrame in the display
# cell) and output_path (presumably where the annotated file was written —
# confirm against the knownCancer documentation).
annotation_outputs = knownCancer(
    maf_file=maf_file, annotation_table=cosmic_file, oncokb_table=oncokb_file
)
result_df, output_path = annotation_outputs


In [4]:
# Annotation columns to show next to Hugo_Symbol. The names are matched
# against result_df.columns below, so a column that is absent from the
# annotation result is skipped instead of raising.
knowncancer_columns = [
    "COSMIC_ROLE_IN_CANCER",
    "COSMIC_TIER",
    "OncoKB_Is Oncogene",
    "OncoKB_Is Tumor Suppressor Gene",
    "OncoKB_OncoKB Annotated",
    "OncoKB_MSK-IMPACT",
    "OncoKB_MSK-HEME",
    "OncoKB_FOUNDATION ONE",
    "OncoKB_FOUNDATION ONE HEME",
    "OncoKB_Vogelstein",
    "Is_Oncogene_any"
]

# Hugo_Symbol plus whichever of the annotation columns are actually present.
display_columns = ["Hugo_Symbol"] + [col for col in knowncancer_columns if col in result_df.columns]

# Select the rows flagged Is_Oncogene_any == True into a NEW frame rather than
# rebinding result_df: the full annotation result stays available, and
# re-running this cell never starts from already-filtered data.
# .eq(True) is the element-wise form of `== True` (missing values compare as
# False), and a single .loc call replaces the chained df[mask][cols] lookup.
oncogene_df = result_df.loc[result_df["Is_Oncogene_any"].eq(True), display_columns]
oncogene_df


Unnamed: 0,Hugo_Symbol,COSMIC_ROLE_IN_CANCER,COSMIC_TIER,OncoKB_Is Oncogene,OncoKB_Is Tumor Suppressor Gene,OncoKB_OncoKB Annotated,OncoKB_MSK-IMPACT,OncoKB_MSK-HEME,OncoKB_FOUNDATION ONE,OncoKB_FOUNDATION ONE HEME,OncoKB_Vogelstein,Is_Oncogene_any
8,ABL1,"oncogene, fusion",1.0,Yes,No,Yes,Yes,Yes,Yes,Yes,Yes,True
40,AFF4,"oncogene, fusion",1.0,Yes,No,Yes,No,No,No,Yes,No,True
58,ALOX5,,,Yes,Yes,Yes,No,No,No,No,No,True
70,ANKRD26,,,Yes,No,Yes,No,No,No,No,No,True
91,ARHGAP5,oncogene,2.0,,,,,,,,,True
...,...,...,...,...,...,...,...,...,...,...,...,...
2145,WT1,"oncogene, TSG, fusion",1.0,Yes,Yes,Yes,Yes,Yes,Yes,Yes,Yes,True
2146,WT1,"oncogene, TSG, fusion",1.0,Yes,Yes,Yes,Yes,Yes,Yes,Yes,Yes,True
2147,WT1,"oncogene, TSG, fusion",1.0,Yes,Yes,Yes,Yes,Yes,Yes,Yes,Yes,True
2148,WT1,"oncogene, TSG, fusion",1.0,Yes,Yes,Yes,Yes,Yes,Yes,Yes,Yes,True
