# Trans effects enrichment - Enrichr

This notebook uses Enrichr (through the `gseapy` package) to look for Reactome pathways and GO biological processes that are enriched among the proteins that came up across multiple cancers in the trans effects analysis.

## Setup

In [1]:
import pandas as pd
import numpy as np
import gprofiler
import gseapy as gp
import os
import IPython.display

In [2]:
def run_enrichr_reactome(input_file, cancer_type=None):
    """Run Enrichr on the proteins in a summary table, using the local Reactome library.

    Parameters
    ----------
    input_file : str
        Path to a tab-separated file. It must contain a "protein" column and,
        when `cancer_type` is given, a "cancers" column.
    cancer_type : str, optional
        Pattern matched against the "cancers" column with
        `Series.str.contains`; only matching rows contribute proteins.
        If None, the proteins from every row are used.

    Returns
    -------
    pandas.DataFrame
        The `res2d` table of the Enrichr result, sorted by ascending
        "Adjusted P-value".
    """
    input_df = pd.read_csv(input_file, sep="\t")

    if cancer_type is not None:
        # na=False: a row with no "cancers" entry counts as "no match".
        # Without it the mask contains NaN and boolean indexing raises.
        in_cancer = input_df["cancers"].str.contains(cancer_type, na=False)
        selected_df = input_df[in_cancer]
    else:
        selected_df = input_df

    # Skip rows with a missing protein name so only real identifiers are submitted.
    protein_list = selected_df["protein"].dropna().tolist()

    enr = gp.enrichr(
        gene_list=protein_list,
        # Custom gene set file, resolved relative to the working directory.
        gene_sets=os.path.join("gene_set_libraries", "ReactomePathways.gmt"),
        # NOTE(review): presumably a Biomart dataset name used as the background
        # gene set for the custom library -- confirm against the gseapy version in use.
        background="hsapiens_gene_ensembl",
        organism='Human',
        description='test_name',
        outdir=None,
        cutoff=0.05
    )

    return enr.res2d.sort_values(by="Adjusted P-value")

In [3]:
def run_enrichr_go(input_file, cancer_type=None):
    """Run Enrichr on the proteins in a summary table, using GO Biological Process 2018.

    Parameters
    ----------
    input_file : str
        Path to a tab-separated file. It must contain a "protein" column and,
        when `cancer_type` is given, a "cancers" column.
    cancer_type : str, optional
        Pattern matched against the "cancers" column with
        `Series.str.contains`; only matching rows contribute proteins.
        If None, the proteins from every row are used.

    Returns
    -------
    pandas.DataFrame
        The `res2d` table of the Enrichr result, sorted by ascending
        "Adjusted P-value".
    """
    input_df = pd.read_csv(input_file, sep="\t")

    if cancer_type is not None:
        # na=False: a row with no "cancers" entry counts as "no match".
        # Without it the mask contains NaN and boolean indexing raises.
        in_cancer = input_df["cancers"].str.contains(cancer_type, na=False)
        selected_df = input_df[in_cancer]
    else:
        selected_df = input_df

    # Skip rows with a missing protein name so only real identifiers are submitted.
    protein_list = selected_df["protein"].dropna().tolist()

    enr = gp.enrichr(
        gene_list=protein_list,
        gene_sets=["GO_Biological_Process_2018"],
        organism='Human',
        description='test_name',
        outdir=None,
        cutoff=0.05
    )

    return enr.res2d.sort_values(by="Adjusted P-value")

### 8q trans effects in BRCA

In [4]:
# Reactome enrichment for rows of the 8q trans summary whose "cancers" entry matches "brca".
run_enrichr_reactome(
    input_file="pancancer_summary_8q_trans.tsv",
    cancer_type="brca",
)

Unnamed: 0,Gene_set,Term,Overlap,P-value,Adjusted P-value,Genes
721,CUSTOM139897129435040,Mitochondrial translation elongation (R-HSA-53...,66/91,2.317373e-55,3.318478e-52,MRPL53;MRPL3;MRPS25;MRPL32;MRPL49;MRPL14;MRPL4...
722,CUSTOM139897129435040,Mitochondrial translation initiation (R-HSA-53...,65/91,7.967065e-54,3.802946e-51,MRPL53;MRPL3;MRPS25;MRPL32;MRPL49;MRPL14;MRPL4...
720,CUSTOM139897129435040,Mitochondrial translation (R-HSA-5368287),67/97,6.970485e-54,3.802946e-51,MRPL53;MRPL3;MRPS25;MRPL32;MRPL49;MRPL14;MRPL4...
723,CUSTOM139897129435040,Mitochondrial translation termination (R-HSA-5...,64/91,2.595649e-52,9.292422e-50,MRPL53;MRPL3;MRPS25;MRPL32;MRPL49;MRPL14;MRPL4...
1334,CUSTOM139897129435040,Translation (R-HSA-72766),70/303,1.050871e-18,3.009695e-16,MRPL53;MRPL3;MRPS25;MRPL32;YARS2;MRPL49;MRPL14...
683,CUSTOM139897129435040,Membrane Trafficking (R-HSA-199991),108/611,1.280923e-18,3.057136e-16,YKT6;EXOC8;KIF13B;TRAPPC6B;MIA3;CHMP2A;RAB3GAP...
168,CUSTOM139897129435040,"Cell Cycle, Mitotic (R-HSA-69278)",98/530,2.347198e-18,4.801697e-16,PPP2R2A;KNTC1;NUP153;CHMP2A;SMC3;TK1;NEK9;RFC5...
166,CUSTOM139897129435040,Cell Cycle (R-HSA-1640170),108/662,4.734794e-16,8.475281e-14,PPP2R2A;KNTC1;NUP153;CHMP2A;SMC3;TK1;NEK9;RFC5...
1379,CUSTOM139897129435040,Vesicle-mediated transport (R-HSA-5653656),115/730,6.872895e-16,1.093554e-13,YKT6;EXOC8;KIF13B;TRAPPC6B;MIA3;CHMP2A;RAB3GAP...
702,CUSTOM139897129435040,Metabolism of proteins (R-HSA-392499),239/2017,1.059699e-15,1.517490e-13,YKT6;EXOC8;CEBPG;TRAPPC6B;MIA3;NUP153;DAP3;MRP...


In [5]:
# GO Biological Process enrichment for rows of the 8q trans summary whose "cancers" entry matches "brca".
run_enrichr_go(
    input_file="pancancer_summary_8q_trans.tsv",
    cancer_type="brca",
)

Unnamed: 0,Gene_set,Term,Overlap,P-value,Adjusted P-value,Old P-value,Old Adjusted P-value,Odds Ratio,Combined Score,Genes
0,GO_Biological_Process_2018,mitochondrial translational elongation (GO:007...,66/87,6.015934e-59,3.069931e-55,0,0,11.074755,1.484661e+03,MRPS17;MRPS15;GFM1;MRPS16;MRPS11;MRPS12;MRPL38...
1,GO_Biological_Process_2018,mitochondrial translation (GO:0032543),70/107,3.727789e-55,9.511453e-52,0,0,9.550447,1.196923e+03,MRPS17;MRPS15;GFM1;MRPS16;MRPS11;MRPS12;MRPL38...
2,GO_Biological_Process_2018,mitochondrial translational termination (GO:00...,64/89,1.188620e-54,2.021843e-51,0,0,10.497827,1.303482e+03,MRPS17;MRPS15;MRPS16;MRPS11;MRPS12;MRPL38;MRPL...
3,GO_Biological_Process_2018,translational termination (GO:0006415),65/96,9.109382e-53,1.162129e-49,0,0,9.884428,1.184428e+03,MRPS17;MRPS15;MRPS16;MRPS11;MRPS12;MRPL38;MRPL...
4,GO_Biological_Process_2018,translational elongation (GO:0006414),67/105,9.506891e-52,9.702733e-49,0,0,9.315259,1.094379e+03,MRPS17;MRPS15;GFM1;MRPS16;MRPS11;MRPS12;MRPL38...
5,GO_Biological_Process_2018,mitochondrial gene expression (GO:0140053),26/45,2.921079e-19,2.484378e-16,0,0,8.434712,3.599696e+02,MRPS17;MRPS15;MRPS16;MRPS11;MRPS12;MRPS34;MRPL...
6,GO_Biological_Process_2018,Golgi vesicle transport (GO:0048193),64/271,8.995753e-19,6.557904e-16,0,0,3.447626,1.432570e+02,SNAP23;GCC2;MIA3;KIF11;KIF15;ACTR1A;CTSC;SCYL1...
7,GO_Biological_Process_2018,mitotic sister chromatid segregation (GO:0000070),29/82,4.680762e-14,2.985741e-11,0,0,5.162898,1.584634e+02,CDCA5;AKAP8L;KIF14;NCAPG;CDCA8;PDS5A;SMC4;NCAP...
8,GO_Biological_Process_2018,ribosome biogenesis (GO:0042254),50/226,9.081594e-14,5.149264e-11,0,0,3.229766,9.698967e+01,DDX47;PAK1IP1;RPP30;WDR3;MRPS12;WDR43;RRP9;FBL...
9,GO_Biological_Process_2018,rRNA processing (GO:0006364),46/202,2.953424e-13,1.507132e-10,0,0,3.324420,9.591165e+01,DDX27;DDX47;RPP30;WDR3;MRPS12;ISG20L2;NAT10;TF...
