# Cis effects enrichment - Enrichr

This notebook uses Enrichr (through the `gseapy` client) to look for pathways (GO Biological Process terms) enriched among the proteins that came up across multiple cancers in the cis effects analysis.

## Setup

In [1]:
import pandas as pd
import numpy as np
import gprofiler
import cptac.utils as ut
import gseapy as gp

In [2]:
def run_enrichr(
    input_file,
    gene_sets=("GO_Biological_Process_2018",),
    column="protein",
    cutoff=0.05,
):
    """Query Enrichr for terms over-represented among the symbols in a TSV file.

    Parameters
    ----------
    input_file : str or path-like
        Tab-separated file that contains a column of gene/protein symbols.
    gene_sets : sequence of str, optional
        Enrichr library names to test against. Defaults to the single
        library "GO_Biological_Process_2018".
    column : str, optional
        Name of the column holding the symbols. Defaults to "protein".
    cutoff : float, optional
        Forwarded unchanged to ``gp.enrichr``. This function does NOT use it
        to filter the returned table.
        NOTE(review): in gseapy this looks like it only governs the generated
        plot -- confirm against the installed version.

    Returns
    -------
    pandas.DataFrame
        The ``res2d`` table of the gseapy result, sorted ascending by
        "Adjusted P-value". Every term returned is kept, including
        non-significant ones; filter on "Adjusted P-value" downstream if only
        significant terms are wanted.

    Raises
    ------
    KeyError
        If ``column`` is not present in the file (raised by pandas).
    ValueError
        If the column holds no non-missing symbols.
    """
    input_df = pd.read_csv(input_file, sep="\t")

    # Missing values would otherwise be sent to Enrichr as bogus "nan" symbols.
    protein_list = input_df[column].dropna().astype(str).tolist()
    if not protein_list:
        raise ValueError(
            f"No symbols found in column {column!r} of {input_file!r}"
        )

    # NOTE(review): the former description='test_name' label is dropped here;
    # it only named output artefacts and newer gseapy releases appear to reject
    # the keyword -- confirm against the installed version.
    enr = gp.enrichr(
        gene_list=protein_list,
        gene_sets=list(gene_sets),
        organism="Human",
        outdir=None,  # do not write result files into a named output directory
        cutoff=cutoff,
    )

    return enr.res2d.sort_values(by="Adjusted P-value")

### 8p cis effects

In [3]:
# Enrichment table for the chromosome 8p cis-effect summary file (displayed as the cell output).
run_enrichr(input_file="pancancer_summary_8p_cis.tsv")

Unnamed: 0,Gene_set,Term,Overlap,P-value,Adjusted P-value,Old P-value,Old Adjusted P-value,Odds Ratio,Combined Score,Genes
0,GO_Biological_Process_2018,nuclear envelope reassembly (GO:0031468),3/18,0.000012,0.059619,0,0,66.666667,757.157764,REEP4;PPP2R2A;CHMP7
2,GO_Biological_Process_2018,mitotic nuclear envelope reassembly (GO:0007084),2/10,0.000272,0.462881,0,0,80.000000,656.740484,REEP4;PPP2R2A
1,GO_Biological_Process_2018,peptidyl-serine dephosphorylation (GO:0070262),2/10,0.000272,0.694322,0,0,80.000000,656.740484,PPP2CB;PPP2R2A
3,GO_Biological_Process_2018,glycerophospholipid biosynthetic process (GO:0...,4/164,0.000748,0.954581,0,0,9.756098,70.222173,AGPAT5;PLEKHA2;DDHD2;MTMR9
5,GO_Biological_Process_2018,viral budding via host ESCRT complex (GO:0039702),2/20,0.001131,0.961711,0,0,40.000000,271.394647,VPS37A;CHMP7
299,GO_Biological_Process_2018,peptidyl-threonine modification (GO:0018210),1/89,0.200101,1.000000,0,0,4.494382,7.231152,TNKS
298,GO_Biological_Process_2018,regulation of proteasomal ubiquitin-dependent ...,1/88,0.198088,1.000000,0,0,4.545455,7.359297,CCAR2
297,GO_Biological_Process_2018,T cell activation (GO:0042110),1/88,0.198088,1.000000,0,0,4.545455,7.359297,KIF13B
296,GO_Biological_Process_2018,regulation of protein targeting to mitochondri...,1/88,0.198088,1.000000,0,0,4.545455,7.359297,BAG4
295,GO_Biological_Process_2018,activation of GTPase activity (GO:0090630),1/84,0.189983,1.000000,0,0,4.761905,7.908661,ARHGEF10


### 8q cis effects

In [4]:
# Enrichment table for the chromosome 8q cis-effect summary file (displayed as the cell output).
run_enrichr(input_file="pancancer_summary_8q_cis.tsv")

Unnamed: 0,Gene_set,Term,Overlap,P-value,Adjusted P-value,Old P-value,Old Adjusted P-value,Odds Ratio,Combined Score,Genes
1,GO_Biological_Process_2018,ncRNA processing (GO:0034470),8/227,0.000114,0.291567,0,0,5.463921,49.595588,BOP1;EXOSC4;POP1;AGO2;RPS20;RPL8;DCAF13;RPL7
0,GO_Biological_Process_2018,ribosome biogenesis (GO:0042254),8/226,0.000111,0.565605,0,0,5.488098,49.982538,BOP1;EXOSC4;MTERF3;RRS1;RPS20;RPL8;DCAF13;RPL7
18,GO_Biological_Process_2018,cellular macromolecule biosynthetic process (G...,8/367,0.002649,0.711576,0,0,3.379591,20.052531,COPS5;AGO2;MCM4;RPS20;RPL8;MRPL13;POLR2K;RPL7
15,GO_Biological_Process_2018,mitochondrial ATP synthesis coupled electron t...,4/85,0.002235,0.712740,0,0,7.295942,44.531752,NDUFB9;UQCRB;CYC1;COX6C
17,GO_Biological_Process_2018,"regulation of protein import into nucleus, tra...",2/12,0.002612,0.740399,0,0,25.839793,153.689353,PARP10;UBR5
14,GO_Biological_Process_2018,double-strand break repair (GO:0006302),5/141,0.002218,0.754723,0,0,5.497828,33.596886,PRKDC;RAD21;NSMCE2;TONSL;UBE2V2
16,GO_Biological_Process_2018,retinol metabolic process (GO:0042572),2/12,0.002612,0.783952,0,0,25.839793,153.689353,SDR16C5;RDH10
20,GO_Biological_Process_2018,regulation of DNA metabolic process (GO:0051052),3/46,0.003250,0.789794,0,0,10.111223,57.927647,DSCC1;UBE2V2;GRHL2
22,GO_Biological_Process_2018,"mitochondrial electron transport, ubiquinol to...",2/14,0.003571,0.792215,0,0,22.148394,124.806482,UQCRB;CYC1
13,GO_Biological_Process_2018,regulation of nuclear-transcribed mRNA poly(A)...,2/11,0.002186,0.796642,0,0,28.188865,172.681515,AGO2;PABPC1
