# Trans effects enrichment - Enrichr

This notebook will use Enrichr to look for pathways enriched for proteins that came up across multiple cancers in the trans effects analysis.

## Setup

In [1]:
import pandas as pd
import numpy as np
import gprofiler
import gseapy as gp
import os
import IPython.display

In [2]:
def run_enrichr_reactome(input_file, cancer_type=None):
    """Run Enrichr on the proteins in a summary table against the local Reactome library.

    Parameters
    ----------
    input_file : str or path-like
        Tab-separated file with a "protein" column and, when `cancer_type`
        is given, a "cancers" column.
    cancer_type : str, optional
        If given, only rows whose "cancers" value contains this pattern are
        used. The pattern is handed to `Series.str.contains`, which treats it
        as a regular expression by default. Rows whose "cancers" value is
        missing are treated as non-matching. If None, every row is used.

    Returns
    -------
    The `res2d` table of the Enrichr result, sorted in ascending order of
    "Adjusted P-value".
    """
    input_df = pd.read_csv(input_file, sep="\t")

    if cancer_type is not None:
        # na=False keeps the mask strictly boolean: without it a missing
        # "cancers" entry produces NaN in the mask and the row selection
        # raises ValueError instead of simply skipping that row.
        in_cancer = input_df["cancers"].str.contains(cancer_type, na=False)
        protein_list = input_df.loc[in_cancer, "protein"].tolist()
    else:
        protein_list = input_df["protein"].tolist()

    enr = gp.enrichr(
        gene_list=protein_list,
        # Local GMT file rather than a hosted Enrichr library name.
        gene_sets=os.path.join("gene_set_libraries", "ReactomePathways.gmt"),
        background="hsapiens_gene_ensembl",
        organism='Human',
        description='test_name',
        outdir=None,
        cutoff=0.05
    )

    return enr.res2d.sort_values(by="Adjusted P-value")

In [3]:
def run_enrichr_go(input_file, cancer_type=None):
    """Run Enrichr on the proteins in a summary table against GO_Biological_Process_2018.

    Parameters
    ----------
    input_file : str or path-like
        Tab-separated file with a "protein" column and, when `cancer_type`
        is given, a "cancers" column.
    cancer_type : str, optional
        If given, only rows whose "cancers" value contains this pattern are
        used. The pattern is handed to `Series.str.contains`, which treats it
        as a regular expression by default. Rows whose "cancers" value is
        missing are treated as non-matching. If None, every row is used.

    Returns
    -------
    The `res2d` table of the Enrichr result, sorted in ascending order of
    "Adjusted P-value".
    """
    input_df = pd.read_csv(input_file, sep="\t")

    if cancer_type is not None:
        # na=False keeps the mask strictly boolean: without it a missing
        # "cancers" entry produces NaN in the mask and the row selection
        # raises ValueError instead of simply skipping that row.
        in_cancer = input_df["cancers"].str.contains(cancer_type, na=False)
        protein_list = input_df.loc[in_cancer, "protein"].tolist()
    else:
        protein_list = input_df["protein"].tolist()

    enr = gp.enrichr(
        gene_list=protein_list,
        gene_sets=["GO_Biological_Process_2018"],
        organism='Human',
        description='test_name',
        outdir=None,
        cutoff=0.05
    )

    return enr.res2d.sort_values(by="Adjusted P-value")

### 8q trans effects in BRCA

In [4]:
# Reactome enrichment for the 8q trans-effects table, restricted to rows
# whose "cancers" entry matches "brca"; the sorted result table is displayed.
run_enrichr_reactome("pancancer_summary_8q_trans.tsv", cancer_type="brca")

Unnamed: 0,Gene_set,Term,Overlap,P-value,Adjusted P-value,Genes
726,CUSTOM140132511690416,Mitochondrial translation elongation (R-HSA-53...,66/91,1.421481e-52,2.039825e-49,MRPS27;MRPL57;MRPL2;MRPL12;MRPS5;MRPS22;MRPS31...
727,CUSTOM140132511690416,Mitochondrial translation initiation (R-HSA-53...,65/91,4.376071e-51,2.178603e-48,MRPS27;MRPL57;MRPL2;MRPL12;MRPS5;MRPS22;MRPS31...
725,CUSTOM140132511690416,Mitochondrial translation (R-HSA-5368287),67/97,4.554572e-51,2.178603e-48,MRPS27;MRPL57;MRPL2;MRPL12;MRPS5;MRPS22;MRPS31...
728,CUSTOM140132511690416,Mitochondrial translation termination (R-HSA-5...,64/91,1.276756e-49,4.580361e-47,MRPS27;MRPL57;MRPL2;MRPL12;MRPS5;MRPS22;MRPS31...
687,CUSTOM140132511690416,Membrane Trafficking (R-HSA-199991),120/611,5.350261e-21,1.535525e-18,ARCN1;RIN2;EXOC2;TMF1;AKT1;KIF13B;SCFD1;SBF2;T...
171,CUSTOM140132511690416,"Cell Cycle, Mitotic (R-HSA-69278)",105/530,8.934073e-19,2.136733e-16,MCM2;NCAPH2;CDCA8;AKT1;CDC20;CEP250;KIF20A;CHM...
1382,CUSTOM140132511690416,Vesicle-mediated transport (R-HSA-5653656),127/730,1.370555e-17,2.809639e-15,COL3A1;COL1A1;ARCN1;RIN2;EXOC2;TMF1;AKT1;KIF13...
1335,CUSTOM140132511690416,Translation (R-HSA-72766),71/303,5.101881e-17,9.151499e-15,MRPS27;MRPL57;MRPL2;MRPL12;MRPS5;MRPS22;MRPS31...
169,CUSTOM140132511690416,Cell Cycle (R-HSA-1640170),117/662,8.392076e-17,1.338070e-14,MCM2;NCAPH2;CDCA8;AKT1;CDC20;BABAM1;CEP250;CHT...
258,CUSTOM140132511690416,DNA strand elongation (R-HSA-69190),21/32,3.756979e-16,5.391265e-14,MCM3;MCM6;POLA1;MCM2;GINS1;RFC5;MCM5;GINS4;POL...


In [5]:
# GO Biological Process (2018) enrichment for the same 8q trans-effects table,
# restricted to rows whose "cancers" entry matches "brca".
run_enrichr_go("pancancer_summary_8q_trans.tsv", cancer_type="brca")

Unnamed: 0,Gene_set,Term,Overlap,P-value,Adjusted P-value,Old P-value,Old Adjusted P-value,Odds Ratio,Combined Score,Genes
0,GO_Biological_Process_2018,mitochondrial translational elongation (GO:007...,66/87,3.844220e-56,1.379306e-52,0,0,40.167672,5.125322e+03,MRPS17;MRPS15;GFM1;MRPS16;MRPS11;MRPS12;MRPL38...
1,GO_Biological_Process_2018,mitochondrial translation (GO:0032543),70/107,3.187238e-52,5.717905e-49,0,0,24.225669,2.872565e+03,MRPS17;MRPS15;GFM1;MRPS16;MRPS11;MRPS12;MRPL38...
2,GO_Biological_Process_2018,mitochondrial translational termination (GO:00...,64/89,6.004530e-52,7.181417e-49,0,0,32.666095,3.852702e+03,MRPS17;MRPS15;MRPS16;MRPS11;MRPS12;MRPL38;MRPL...
3,GO_Biological_Process_2018,translational elongation (GO:0006414),68/105,2.586287e-50,2.319900e-47,0,0,23.500890,2.683309e+03,MRPS17;MRPS15;GFM1;MRPS16;MRPS11;MRPS12;MRPL38...
4,GO_Biological_Process_2018,translational termination (GO:0006415),65/96,4.874575e-50,3.497995e-47,0,0,26.765047,3.039043e+03,MRPS17;MRPS15;MRPS16;MRPS11;MRPS12;MRPL38;MRPL...
5,GO_Biological_Process_2018,Golgi vesicle transport (GO:0048193),71/271,4.685156e-21,2.801723e-18,0,0,4.508747,2.110539e+02,SNAP23;GCC2;MIA3;KIF11;KIF15;ACTR1A;GOLGA5;TME...
6,GO_Biological_Process_2018,mitochondrial gene expression (GO:0140053),26/45,3.321637e-18,1.702576e-15,0,0,17.020025,6.849892e+02,MRPS17;MRPS15;MRPS16;MRPS11;MRPS12;MRPS34;MRPL...
7,GO_Biological_Process_2018,endosomal transport (GO:0016197),58/229,1.057750e-16,4.744011e-14,0,0,4.276065,1.572960e+02,DENND1A;ARHGAP1;DPY30;GCC2;AP2A1;PTPN23;EEA1;A...
8,GO_Biological_Process_2018,ER to Golgi vesicle-mediated transport (GO:000...,50/180,2.402432e-16,9.577695e-14,0,0,4.833096,1.738217e+02,MIA3;ACTR1A;TMED5;CTSC;NSF;COG8;COG7;COG6;COG5...
9,GO_Biological_Process_2018,ribosome biogenesis (GO:0042254),55/226,4.215815e-15,1.512634e-12,0,0,4.046535,1.339400e+02,DDX47;PAK1IP1;RPP30;WDR3;MRPS12;WDR43;RRP9;FBL...
