# Cis effects enrichment - Enrichr

This notebook will use Enrichr to look for pathways enriched for proteins that came up across multiple cancers in the cis effects analysis.

## Setup

In [1]:
import pandas as pd
import numpy as np
import gprofiler
import cptac.utils as ut
import gseapy as gp



In [2]:
def run_enrichr(input_file):

    input_df = pd.read_csv(input_file, sep="\t")
    protein_list = input_df["protein"].tolist()

    enr = gp.enrichr(
        gene_list=protein_list,
        gene_sets=["GO_Biological_Process_2018"],
        organism='Human',
        description='test_name',
        outdir=None,
        cutoff=0.05
    )
    
    return enr.res2d.sort_values(by="Adjusted P-value")

### 8p cis effects

In [3]:
run_enrichr("pancancer_summary_8p_cis.tsv")

Unnamed: 0,Gene_set,Term,Overlap,P-value,Adjusted P-value,Old P-value,Old Adjusted P-value,Odds Ratio,Combined Score,Genes
0,GO_Biological_Process_2018,protein localization to chromosome (GO:0034502),3/27,0.000061,0.312050,0,0,38.986355,378.252452,TNKS;PINX1;CHMP7
5,GO_Biological_Process_2018,protein dephosphorylation (GO:0006470),4/125,0.000445,0.378146,0,0,11.228070,86.661608,PPP2CB;PPP3CC;PPP2R2A;MTMR7
4,GO_Biological_Process_2018,dephosphorylation (GO:0016311),4/124,0.000431,0.440182,0,0,11.318619,87.704732,PPP2CB;PPP3CC;PPP2R2A;MTMR7
12,GO_Biological_Process_2018,nuclear envelope reassembly (GO:0031468),2/18,0.001186,0.465430,0,0,38.986355,262.667728,PPP2R2A;CHMP7
11,GO_Biological_Process_2018,lipid biosynthetic process (GO:0008610),3/72,0.001139,0.484196,0,0,14.619883,99.092734,AGPAT5;LPL;FDFT1
10,GO_Biological_Process_2018,negative regulation of telomere maintenance (G...,2/17,0.001056,0.489832,0,0,41.279670,282.905308,TNKS;PINX1
7,GO_Biological_Process_2018,"protein localization to chromosome, telomeric ...",2/15,0.000818,0.521903,0,0,46.783626,332.557495,TNKS;PINX1
3,GO_Biological_Process_2018,regulation of telomere maintenance via telomer...,3/51,0.000415,0.529141,0,0,20.639835,160.738684,HMBOX1;TNKS;PINX1
13,GO_Biological_Process_2018,viral budding via host ESCRT complex (GO:0039702),2/20,0.001467,0.534741,0,0,35.087719,228.929770,VPS37A;CHMP7
9,GO_Biological_Process_2018,regulation of telomere maintenance via telomer...,2/17,0.001056,0.538815,0,0,41.279670,282.905308,TNKS;PINX1


### 8q cis effects

In [4]:
run_enrichr("pancancer_summary_8q_cis.tsv")

Unnamed: 0,Gene_set,Term,Overlap,P-value,Adjusted P-value,Old P-value,Old Adjusted P-value,Odds Ratio,Combined Score,Genes
0,GO_Biological_Process_2018,positive regulation of protein ubiquitination ...,4/83,0.000205,1.0,0,0,13.769363,116.918454,RNF139;RIPK2;DERL1;TSPYL5
385,GO_Biological_Process_2018,mitochondrial respiratory chain complex I asse...,1/64,0.201282,1.0,0,0,4.464286,7.156469,NDUFAF6
384,GO_Biological_Process_2018,mitochondrial respiratory chain complex I biog...,1/64,0.201282,1.0,0,0,4.464286,7.156469,NDUFAF6
383,GO_Biological_Process_2018,glycerophospholipid metabolic process (GO:0006...,1/64,0.201282,1.0,0,0,4.464286,7.156469,CPNE3
382,GO_Biological_Process_2018,NADH dehydrogenase complex assembly (GO:0010257),1/64,0.201282,1.0,0,0,4.464286,7.156469,NDUFAF6
381,GO_Biological_Process_2018,"RNA splicing, via transesterification reaction...",2/236,0.200084,1.0,0,0,2.421308,3.895933,PABPC1;POLR2K
380,GO_Biological_Process_2018,"nuclear-transcribed mRNA catabolic process, de...",1/63,0.198468,1.0,0,0,4.535147,7.333919,PABPC1
379,GO_Biological_Process_2018,negative regulation of dephosphorylation (GO:0...,1/63,0.198468,1.0,0,0,4.535147,7.333919,PLEKHF2
378,GO_Biological_Process_2018,regulation of proteolysis (GO:0030162),1/63,0.198468,1.0,0,0,4.535147,7.333919,RNF139
377,GO_Biological_Process_2018,regulation of viral genome replication (GO:004...,1/63,0.198468,1.0,0,0,4.535147,7.333919,PABPC1
