# Cis effects enrichment - Enrichr

This notebook will use Enrichr to look for pathways enriched for proteins that came up across multiple cancers in the cis effects analysis.

## Setup

In [1]:
import pandas as pd
import numpy as np
import gprofiler
import cptac.utils as ut
import gseapy as gp

In [2]:
def run_enrichr(input_file):

    input_df = pd.read_csv(input_file, sep="\t")
    protein_list = input_df["protein"].tolist()

    enr = gp.enrichr(
        gene_list=protein_list,
        gene_sets=["GO_Biological_Process_2018"],
        organism='Human',
        description='test_name',
        outdir=None,
        cutoff=0.05
    )
    
    return enr.res2d.sort_values(by="Adjusted P-value")

### 8p cis effects

In [3]:
run_enrichr("pancancer_summary_8p_cis.tsv")

Unnamed: 0,Gene_set,Term,Overlap,P-value,Adjusted P-value,Old P-value,Old Adjusted P-value,Odds Ratio,Combined Score,Genes
0,GO_Biological_Process_2018,protein localization to chromosome (GO:0034502),3/27,0.000058,0.295892,0,0,39.682540,387.116807,TNKS;PINX1;CHMP7
5,GO_Biological_Process_2018,protein dephosphorylation (GO:0006470),4/125,0.000415,0.353305,0,0,11.428571,88.985703,PPP2CB;PPP3CC;PPP2R2A;MTMR7
4,GO_Biological_Process_2018,dephosphorylation (GO:0016311),4/124,0.000403,0.411249,0,0,11.520737,90.054170,PPP2CB;PPP3CC;PPP2R2A;MTMR7
11,GO_Biological_Process_2018,nuclear envelope reassembly (GO:0031468),2/18,0.001145,0.486784,0,0,39.682540,268.754478,PPP2R2A;CHMP7
10,GO_Biological_Process_2018,lipid biosynthetic process (GO:0008610),3/72,0.001081,0.501702,0,0,14.880952,101.628542,AGPAT5;LPL;FDFT1
3,GO_Biological_Process_2018,regulation of telomere maintenance via telomer...,3/51,0.000394,0.502192,0,0,21.008403,164.707201,HMBOX1;TNKS;PINX1
9,GO_Biological_Process_2018,negative regulation of telomere maintenance (G...,2/17,0.001019,0.520169,0,0,42.016807,289.436971,TNKS;PINX1
12,GO_Biological_Process_2018,viral budding via host ESCRT complex (GO:0039702),2/20,0.001416,0.556002,0,0,35.714286,234.272062,VPS37A;CHMP7
1,GO_Biological_Process_2018,regulation of telomerase activity (GO:0051972),3/42,0.000221,0.563638,0,0,25.510204,214.739281,HMBOX1;TNKS;PINX1
6,GO_Biological_Process_2018,"protein localization to chromosome, telomeric ...",2/15,0.000790,0.575781,0,0,47.619048,340.176271,TNKS;PINX1


### 8q cis effects

In [4]:
run_enrichr("pancancer_summary_8q_cis.tsv")

Unnamed: 0,Gene_set,Term,Overlap,P-value,Adjusted P-value,Old P-value,Old Adjusted P-value,Odds Ratio,Combined Score,Genes
0,GO_Biological_Process_2018,positive regulation of protein ubiquitination ...,4/83,0.000254,1.0,0,0,13.025073,107.804811,RNF139;RIPK2;DERL1;TSPYL5
375,GO_Biological_Process_2018,positive regulation of autophagy (GO:0010508),1/67,0.220241,1.0,0,0,4.033885,6.103396,MTDH
374,GO_Biological_Process_2018,insulin receptor signaling pathway (GO:0008286),1/67,0.220241,1.0,0,0,4.033885,6.103396,ATP6V1C1
373,GO_Biological_Process_2018,"RNA splicing, via transesterification reaction...",2/236,0.217352,1.0,0,0,2.290426,3.495736,PABPC1;POLR2K
372,GO_Biological_Process_2018,negative regulation of epithelial cell prolife...,1/66,0.217336,1.0,0,0,4.095004,6.250253,MTSS1
371,GO_Biological_Process_2018,JNK cascade (GO:0007254),1/66,0.217336,1.0,0,0,4.095004,6.250253,RIPK2
370,GO_Biological_Process_2018,intracellular steroid hormone receptor signali...,1/66,0.217336,1.0,0,0,4.095004,6.250253,UBR5
369,GO_Biological_Process_2018,fatty acid catabolic process (GO:0009062),1/65,0.214420,1.0,0,0,4.158004,6.402579,DECR1
368,GO_Biological_Process_2018,activation of protein kinase activity (GO:0032...,2/233,0.213280,1.0,0,0,2.319916,3.584613,RIPK2;STK3
367,GO_Biological_Process_2018,translation (GO:0006412),2/232,0.211925,1.0,0,0,2.329916,3.614917,MTERF3;MRPL13
