# This notebook checks whether the KANSL1 gene and the other genes in our mechanistic model are present in, or absent from, the KEGG, Reactome, and WikiPathways databases.

In [1]:
import os
import sys

import pybel
from pybel.constants import GENE, PROTEIN, RNA
from pybel_jupyter import to_jupyter

  # NOTE(review): the four indented assignments below rely on names (`oneOf`,
  # `language`, `pmod_legacy_labels`, `_handle_pmod_legacy_ns`) that nothing
  # visible in this notebook imports or defines, and none of the later cells
  # shown here use their results. Presumably pasted in by mistake -- confirm
  # and remove, otherwise this cell cannot run on a fresh kernel.
  reference_seq = oneOf(['r', 'p', 'c'])
  dna_nucleotide = oneOf(list(language.dna_nucleotide_labels.keys()))
  aa_single = oneOf(list(language.amino_acid_dict.keys()))
  pmod_legacy_ns = oneOf(list(pmod_legacy_labels)).setParseAction(_handle_pmod_legacy_ns)


In [2]:
# Display the Python interpreter version used for this run (provenance).
sys.version

'3.6.8 (default, Aug  7 2019, 19:55:42) \n[GCC 4.8.5 20150623 (Red Hat 4.8.5-39)]'

In [3]:
# Display the installed PyBEL version used for this run (provenance).
pybel.get_version()

'0.13.2'

In [4]:
# Root directory holding the exported pathway pickles. `os.path.expanduser`
# is used instead of `os.getenv("HOME")` because the latter returns None when
# HOME is unset (e.g. on Windows), which makes `os.path.join` raise TypeError.
pathme_directory = os.path.join(os.path.expanduser('~'), '.pathme')

# One `bel` sub-directory of pickled graphs per pathway database.
kegg_path = os.path.join(pathme_directory, 'kegg', 'bel')
reactome_path = os.path.join(pathme_directory, 'reactome', 'bel')
wikipathways_path = os.path.join(pathme_directory, 'wikipathways', 'bel')

In [5]:
def get_pathway_from_pickles(path):
    """Load every pickled BEL graph stored directly inside a directory.

    Sub-directories and hidden files (names starting with ``.``, such as
    ``.DS_Store``) are skipped so that they are not handed to
    ``pybel.from_pickle``, which would abort the whole load.

    :param str path: path to the directory that holds the pathway pickles
    :return: the objects returned by ``pybel.from_pickle``, one per file
    :rtype: set
    """
    pathways = set()

    # Sorted so the files are always read in the same order.
    for file_name in sorted(os.listdir(path)):
        file_path = os.path.join(path, file_name)

        # Only regular, non-hidden files are treated as pathway pickles.
        if file_name.startswith('.') or not os.path.isfile(file_path):
            continue

        # NOTE(review): unpickling can execute arbitrary code -- only point
        # this function at directories whose contents are trusted.
        pathways.add(pybel.from_pickle(file_path))

    return pathways

In [6]:
# Load the pickled BEL graphs of each database from its pickle directory.
kegg_pathways = get_pathway_from_pickles(path=kegg_path)
reactome_pathways = get_pathway_from_pickles(path=reactome_path)
wp_pathways = get_pathway_from_pickles(path=wikipathways_path)

In [7]:
def get_pathway_containing_node(pathway, query_node):
    """Return the pathway when it holds a gene, RNA or protein node with the queried name.

    :param pathway: iterable of nodes exposing ``function`` and ``name`` (a BEL graph)
    :param query_node: node name to look for
    :return: ``pathway`` itself on a match, otherwise ``None``
    """
    # `name` is only read on nodes whose function is one of the three kinds.
    found = any(
        node.function in (PROTEIN, GENE, RNA) and query_node == node.name
        for node in pathway
    )
    return pathway if found else None
            

def check_pathways_for_query_node(pathway_set, query_node):
    """Collect the names of all pathways in a collection that contain the query node.

    :param pathway_set: iterable of pathways (BEL graphs) to search
    :param query_node: node name to look for
    :return: set with the ``name`` of every pathway in which the node was found
    """
    # Lazily look the node up in each pathway; misses come back falsy.
    lookups = (
        get_pathway_containing_node(candidate, query_node)
        for candidate in pathway_set
    )
    return {matched.name for matched in lookups if matched}


#### Querying genes from our mechanistic model in pathway databases 

Query KANSL1 in the 3 databases

In [8]:
# Names of the pathways in each database that contain a KANSL1 node.
kansl1_in_kegg_pathways = check_pathways_for_query_node(pathway_set=kegg_pathways, query_node='KANSL1')
kansl1_in_reactome_pathways = check_pathways_for_query_node(pathway_set=reactome_pathways, query_node='KANSL1')
kansl1_in_wp_pathways = check_pathways_for_query_node(pathway_set=wp_pathways, query_node='KANSL1')

|Gene|KEGG Pathway|Reactome Pathway|WikiPathways Pathway|
|----|------------|----------------|--------------------|
|KANSL1|NA|NA|NA|

Query BDNF in the 3 databases

In [9]:
# Names of the pathways in each database that contain a BDNF node.
BDNF_in_kegg_pathways = check_pathways_for_query_node(pathway_set=kegg_pathways, query_node='BDNF')
BDNF_in_reactome_pathways = check_pathways_for_query_node(pathway_set=reactome_pathways, query_node='BDNF')
BDNF_in_wp_pathways = check_pathways_for_query_node(pathway_set=wp_pathways, query_node='BDNF')

|Gene|KEGG Pathway|Reactome Pathway|WikiPathways Pathway|
|----|------------|----------------|--------------------|
|BDNF|Alcoholism|Activated NTRK2 signals through CDK5|BDNF-TrkB Signaling|
|BDNF|Cocaine addiction|Activated NTRK2 signals through FYN|Brain-Derived Neurotrophic Factor (BDNF) signaling pathway|
|BDNF|Huntington disease|BDNF activates NTRK2 (TRKB) signaling|ERK Pathway in Huntington's Disease|
|BDNF|MAPK signaling pathway|MECP2 regulates transcription of neuronal ligands|MECP2 and Associated Rett Syndrome|
|BDNF|Neurotrophin signaling pathway|NTRK2 activates RAC1|Prader-Willi and Angelman Syndrome|
|BDNF|PI3K-Akt signaling pathway|NA|Spinal Cord Injury|
|BDNF|Ras signaling pathway|NA|Sudden Infant Death Syndrome (SIDS) Susceptibility Pathways|
|BDNF|cAMP signaling pathway|NA|Synaptic signaling pathways associated with autism spectrum disorder|

Query the BTG2 gene in the 3 databases

In [10]:
# Names of the pathways in each database that contain a BTG2 node.
BTG2_in_kegg_pathways = check_pathways_for_query_node(pathway_set=kegg_pathways, query_node='BTG2')
BTG2_in_reactome_pathways = check_pathways_for_query_node(pathway_set=reactome_pathways, query_node='BTG2')
BTG2_in_wp_pathways = check_pathways_for_query_node(pathway_set=wp_pathways, query_node='BTG2')

|Gene|KEGG Pathway|Reactome Pathway|WikiPathways Pathway|
|----|------------|----------------|--------------------|
|BTG2|RNA degradation|NA|NA|

Query KAT8 in the 3 databases

In [11]:
# Names of the pathways in each database that contain a KAT8 node.
KAT8_in_kegg_pathways = check_pathways_for_query_node(pathway_set=kegg_pathways, query_node='KAT8')
KAT8_in_reactome_pathways = check_pathways_for_query_node(pathway_set=reactome_pathways, query_node='KAT8')
KAT8_in_wp_pathways = check_pathways_for_query_node(pathway_set=wp_pathways, query_node='KAT8')

|Gene|KEGG Pathway|Reactome Pathway|WikiPathways Pathway|
|----|------------|----------------|--------------------|
|KAT8|NA|NA|NA|

Query the MAPT gene in the 3 databases

In [12]:
# Names of the pathways in each database that contain a MAPT node.
MAPT_in_kegg_pathways = check_pathways_for_query_node(pathway_set=kegg_pathways, query_node='MAPT')
MAPT_in_reactome_pathways = check_pathways_for_query_node(pathway_set=reactome_pathways, query_node='MAPT')
MAPT_in_wp_pathways = check_pathways_for_query_node(pathway_set=wp_pathways, query_node='MAPT')

|Gene|KEGG Pathway|Reactome Pathway|WikiPathways Pathway|
|----|------------|----------------|--------------------|
|MAPT|Alzheimer disease|NA|Alzheimers Disease|
|MAPT|MAPK signaling pathway|NA|Brain-Derived Neurotrophic Factor (BDNF) signaling pathway|
|MAPT|NA|NA|Copper homeostasis|
|MAPT|NA|NA|IL-2 Signaling Pathway|
|MAPT|NA|NA|IL-5 Signaling Pathway|
|MAPT|NA|NA|Kit receptor signaling pathway|
|MAPT|NA|NA|Notch Signaling Pathway|
|MAPT|NA|NA|Regulation of Microtubule Cytoskeleton|

Query TP53 in the 3 databases

In [13]:
# Names of the pathways in each database that contain a TP53 node.
TP53_in_kegg_pathways = check_pathways_for_query_node(pathway_set=kegg_pathways, query_node='TP53')
TP53_in_reactome_pathways = check_pathways_for_query_node(pathway_set=reactome_pathways, query_node='TP53')
TP53_in_wp_pathways = check_pathways_for_query_node(pathway_set=wp_pathways, query_node='TP53')

|Gene|KEGG Pathway|Reactome Pathway|WikiPathways Pathway|
|----|------------|----------------|--------------------|
|TP53|Amyotrophic lateral sclerosis (ALS)|DNA Damage/Telomere Stress Induced Senescence|ATM Signaling Pathway|
|TP53|Apoptosis|Factors involved in megakaryocyte development and platelet production|Alzheimers Disease|
|TP53|Basal cell carcinoma|G2/M DNA damage checkpoint|Apoptosis|
|TP53|Bladder cancer|Oncogene Induced Senescence|Cell Cycle|
|TP53|Breast cancer|Oxidative Stress Induced Senescence|Copper homeostasis|
|TP53|Cell cycle|Pre-NOTCH Transcription and Translation|DNA Damage Response|
|TP53|Cellular senescence|RUNX3 regulates CDKN1A transcription|DNA Damage Response (only ATM dependent)|
|TP53|Central carbon metabolism in cancer|Recruitment and ATM-mediated phosphorylation of repair and signaling proteins at DNA double strand breaks|DNA IR-Double Strand Breaks (DSBs) and cellular response via ATM|
|TP53|Chronic myeloid leukemia|Regulation of PTEN gene transcription|DNA IR-damage and cellular response via ATR|
|TP53|Colorectal cancer|Regulation of TP53 Activity through Association with Co-factors|Endometrial cancer|
|TP53|Endocrine resistance|Regulation of TP53 Activity through Methylation|ErbB Signaling Pathway|
|TP53|Endometrial cancer|Regulation of TP53 Activity through Phosphorylation|G1 to S cell cycle control|
|TP53|Epstein-Barr virus infection|Regulation of TP53 Degradation|Gastric Cancer Network 2|
|TP53|Ferroptosis|Regulation of TP53 Expression|Hepatitis C and Hepatocellular Carcinoma|
|TP53|Fluid shear stress and atherosclerosis|SUMOylation of transcription factors|Hereditary leiomyomatosis and renal cell carcinoma pathway|
|TP53|Gastric cancer|Stabilization of p53|Integrated Breast Cancer Pathway|
|TP53|Glioma|TP53 Regulates Metabolic Genes|Integrated Cancer Pathway|
|TP53|Hepatitis B|Ub-specific processing proteases|Mammary gland development pathway - Involution (Stage 4 of 4)|
|TP53|Hepatitis C|NA|Metastatic brain tumor|
|TP53|Hepatocellular carcinoma|NA|PI3K-Akt Signaling Pathway|
|TP53|Herpes simplex virus 1 infection|NA|Pathways Affected in Adenoid Cystic Carcinoma|
|TP53|Human T-cell leukemia virus 1 infection|NA|Prader-Willi and Angelman Syndrome|
|TP53|Human cytomegalovirus infection|NA|Retinoblastoma Gene in Cancer|
|TP53|Human papillomavirus infection|NA|Senescence and Autophagy in Cancer|
|TP53|Huntington disease|NA|Signaling Pathways in Glioblastoma|
|TP53|Kaposi sarcoma-associated herpesvirus infection|NA|Spinal Cord Injury|
|TP53|Longevity regulating pathway|NA|TP53 Network|
|TP53|MAPK signaling pathway|NA|The effect of progerin on the involved genes in Hutchinson-Gilford Progeria Syndrome|
|TP53|Measles|NA|Wnt Signaling Pathway and Pluripotency|
|TP53|Melanoma|NA|miRNA Regulation of DNA Damage Response|
|TP53|MicroRNAs in cancer|NA|miRNA regulation of p53 pathway in prostate cancer|
|TP53|Mitophagy - animal|NA|miRNA regulation of prostate cancer signaling pathways|
|TP53|Neurotrophin signaling pathway|NA|NA|
|TP53|Non-small cell lung cancer|NA|NA|
|TP53|PI3K-Akt signaling pathway|NA|NA|
|TP53|Pancreatic cancer|NA|NA|
|TP53|Pathways in cancer|NA|NA|
|TP53|Platinum drug resistance|NA|NA|
|TP53|Prostate cancer|NA|NA|
|TP53|Proteoglycans in cancer|NA|NA|
|TP53|Shigellosis|NA|NA|
|TP53|Small cell lung cancer|NA|NA|
|TP53|Sphingolipid signaling pathway|NA|NA|
|TP53|Thyroid cancer|NA|NA|
|TP53|Thyroid hormone signaling pathway|NA|NA|
|TP53|Transcriptional misregulation in cancer|NA|NA|
|TP53|Viral carcinogenesis|NA|NA|
|TP53|Wnt signaling pathway|NA|NA|
|TP53|p53 signaling pathway|NA|NA|