# Trans effects enrichment - Enrichr

This notebook uses Enrichr (through the `gseapy` package) to look for pathways that are enriched among the proteins that came up across multiple cancers in the trans effects analysis.

## Setup

In [1]:
import pandas as pd
import numpy as np
import gprofiler
import gseapy as gp
import os
import IPython.display

In [2]:
def run_enrichr_reactome(input_file, cancer_type=None):
    """Run Enrichr on a protein list against the local Reactome gene set file.

    Parameters
    ----------
    input_file : str or path-like
        Tab-separated file with a "protein" column and, when `cancer_type`
        is given, a "cancers" column.
    cancer_type : str, optional
        If given, only rows whose "cancers" value contains this pattern are
        used. The pattern is handed to `Series.str.contains` with its default
        settings, so it is matched case-sensitively as a regular expression
        anywhere in the value. Rows with a missing "cancers" value never
        match. If None, every row is used.

    Returns
    -------
    pandas.DataFrame
        The `res2d` table of the Enrichr result, sorted by ascending
        "Adjusted P-value".
    """
    input_df = pd.read_csv(input_file, sep="\t")

    if cancer_type is not None:
        # na=False: a missing "cancers" value would otherwise put NaN in the
        # mask, and pandas refuses to index with a mask that contains NaN.
        in_cancer = input_df["cancers"].str.contains(cancer_type, na=False)
        input_df = input_df[in_cancer]

    # Drop missing protein names so NaN is never submitted as a gene.
    protein_list = input_df["protein"].dropna().tolist()

    enr = gp.enrichr(
        gene_list=protein_list,
        gene_sets=os.path.join("gene_set_libraries", "ReactomePathways.gmt"),
        background="hsapiens_gene_ensembl",
        organism='Human',
        description='test_name',
        outdir=None,  # do not write result files to disk
        # NOTE(review): per the gseapy docs `cutoff` appears to affect only
        # plotting, not which rows end up in res2d -- confirm.
        cutoff=0.05
    )

    return enr.res2d.sort_values(by="Adjusted P-value")

In [3]:
def run_enrichr_go(input_file, cancer_type=None):
    """Run Enrichr on a protein list against the "GO_Biological_Process_2018" library.

    Parameters
    ----------
    input_file : str or path-like
        Tab-separated file with a "protein" column and, when `cancer_type`
        is given, a "cancers" column.
    cancer_type : str, optional
        If given, only rows whose "cancers" value contains this pattern are
        used. The pattern is handed to `Series.str.contains` with its default
        settings, so it is matched case-sensitively as a regular expression
        anywhere in the value. Rows with a missing "cancers" value never
        match. If None, every row is used.

    Returns
    -------
    pandas.DataFrame
        The `res2d` table of the Enrichr result, sorted by ascending
        "Adjusted P-value".
    """
    input_df = pd.read_csv(input_file, sep="\t")

    if cancer_type is not None:
        # na=False: a missing "cancers" value would otherwise put NaN in the
        # mask, and pandas refuses to index with a mask that contains NaN.
        in_cancer = input_df["cancers"].str.contains(cancer_type, na=False)
        input_df = input_df[in_cancer]

    # Drop missing protein names so NaN is never submitted as a gene.
    protein_list = input_df["protein"].dropna().tolist()

    enr = gp.enrichr(
        gene_list=protein_list,
        gene_sets=["GO_Biological_Process_2018"],
        organism='Human',
        description='test_name',
        outdir=None,  # do not write result files to disk
        # NOTE(review): per the gseapy docs `cutoff` appears to affect only
        # plotting, not which rows end up in res2d -- confirm.
        cutoff=0.05
    )

    return enr.res2d.sort_values(by="Adjusted P-value")

### 8q trans effects in BRCA

In [4]:
# Reactome enrichment for the proteins in the 8q trans summary whose
# "cancers" entry matches "brca".
run_enrichr_reactome(
    "pancancer_summary_8q_trans.tsv",
    cancer_type="brca",
)

Unnamed: 0,Gene_set,Term,Overlap,P-value,Adjusted P-value,Genes
694,CUSTOM140134296622896,Mitochondrial translation elongation (R-HSA-53...,57/91,1.493286e-43,2.077161e-40,MRPS15;MRPL40;MRPS23;MRPL14;MRPL11;DAP3;MRPS27...
695,CUSTOM140134296622896,Mitochondrial translation initiation (R-HSA-53...,56/91,3.459842e-42,1.604213e-39,MRPS15;MRPL40;MRPS23;MRPL14;MRPL11;DAP3;MRPS27...
696,CUSTOM140134296622896,Mitochondrial translation termination (R-HSA-5...,56/91,3.459842e-42,1.604213e-39,MRPS15;MRPL40;MRPS23;MRPL14;MRPL11;DAP3;MRPS27...
693,CUSTOM140134296622896,Mitochondrial translation (R-HSA-5368287),57/97,2.575635e-41,8.956769e-39,MRPS15;MRPL40;MRPS23;MRPL14;MRPL11;DAP3;MRPS27...
657,CUSTOM140134296622896,Membrane Trafficking (R-HSA-199991),113/611,8.802457e-23,2.448843e-20,COPG1;COG6;EXOC3;SAR1B;LMAN2;KIF2C;BET1L;CHMP3...
586,CUSTOM140134296622896,Intra-Golgi and retrograde Golgi-to-ER traffic...,53/186,1.124774e-19,2.607601e-17,KIF19;COPE;MAN2A1;GCC2;COPG1;COG2;COPG2;COG4;R...
165,CUSTOM140134296622896,"Cell Cycle, Mitotic (R-HSA-69278)",97/530,2.380267e-19,4.729931e-17,NEK9;CDK1;MCM2;CENPU;NDC80;BIRC5;HMMR;PTK6;HAU...
1340,CUSTOM140134296622896,Vesicle-mediated transport (R-HSA-5653656),117/730,2.259471e-18,3.928655e-16,COPG1;COG6;EXOC3;SAR1B;LMAN2;KIF2C;BET1L;CHMP3...
163,CUSTOM140134296622896,Cell Cycle (R-HSA-1640170),109/662,4.789423e-18,7.402319e-16,NEK9;CDK1;MCM2;CENPU;NDC80;BIRC5;HMMR;PTK6;HAU...
344,CUSTOM140134296622896,ER to Golgi Anterograde Transport (R-HSA-199977),41/136,1.761880e-16,2.450775e-14,COPE;COPG1;SEC13;COG2;COPG2;COG4;ARFGAP3;DCTN6...


In [5]:
# GO Biological Process enrichment for the proteins in the 8q trans summary
# whose "cancers" entry matches "brca".
run_enrichr_go(
    "pancancer_summary_8q_trans.tsv",
    cancer_type="brca",
)

Unnamed: 0,Gene_set,Term,Overlap,P-value,Adjusted P-value,Old P-value,Old Adjusted P-value,Odds Ratio,Combined Score,Genes
0,GO_Biological_Process_2018,mitochondrial translational elongation (GO:007...,57/87,2.249898e-46,1.148123e-42,0,0,10.056369,1.057005e+03,MRPS17;MRPS15;GFM1;MRPS16;MRPS14;MRPS11;MRPS12...
1,GO_Biological_Process_2018,mitochondrial translational termination (GO:00...,56/89,4.055167e-44,1.034676e-40,0,0,9.657920,9.649590e+02,MRPS17;MRPS15;MRPS16;MRPS14;MRPS11;MRPS12;MRPL...
2,GO_Biological_Process_2018,translational termination (GO:0006415),57/96,7.783892e-43,1.324040e-39,0,0,9.113584,8.836449e+02,MRPS17;MRPS15;MRPS16;MRPS14;MRPS11;MRPS12;MRPL...
3,GO_Biological_Process_2018,translational elongation (GO:0006414),58/105,4.348452e-41,5.547538e-38,0,0,8.478602,7.879688e+02,MRPS17;MRPS15;GFM1;MRPS16;MRPS14;MRPS11;MRPS12...
4,GO_Biological_Process_2018,mitochondrial translation (GO:0032543),58/107,1.847348e-40,1.885404e-37,0,0,8.320124,7.612052e+02,MRPS17;MRPS15;GFM1;MRPS16;MRPS14;MRPS11;MRPS12...
5,GO_Biological_Process_2018,Golgi vesicle transport (GO:0048193),70/271,4.686345e-24,3.985736e-21,0,0,3.964737,2.129753e+02,SNAP23;GCC2;MIA3;KIF11;KIF15;ACTR1A;GOLGA5;TME...
6,GO_Biological_Process_2018,"retrograde vesicle-mediated transport, Golgi t...",31/80,7.687475e-17,5.604169e-14,0,0,5.947813,2.206898e+02,COPB2;NBAS;COPA;RAB1B;COPB1;STX18;KIF11;KIF15;...
7,GO_Biological_Process_2018,ER to Golgi vesicle-mediated transport (GO:000...,45/180,2.362762e-15,1.507147e-12,0,0,3.837299,1.292362e+02,DCTN6;COPB2;SPTBN4;DCTN5;COPA;LMAN2L;PEF1;SAR1...
8,GO_Biological_Process_2018,rRNA processing (GO:0006364),47/202,1.089461e-14,6.177243e-12,0,0,3.571347,1.148206e+02,DDX27;DDX47;WDR3;MRPS12;ISG20L2;NAT10;NOL8;TFB...
9,GO_Biological_Process_2018,ribosome biogenesis (GO:0042254),49/226,5.506732e-14,2.810085e-11,0,0,3.327923,1.016022e+02,DDX47;PAK1IP1;WDR3;MRPS12;WDR43;RRP9;FBL;MTG1;...
