# Cis effects enrichment - Enrichr

This notebook will use Enrichr to look for pathways enriched for proteins that came up across multiple cancers in the cis effects analysis.

## Setup

In [1]:
import pandas as pd
import numpy as np
import gprofiler
import cptac.utils as ut
import gseapy as gp

In [2]:
def run_enrichr(input_file):

    input_df = pd.read_csv(input_file, sep="\t")
    protein_list = input_df["protein"].tolist()

    enr = gp.enrichr(
        gene_list=protein_list,
        gene_sets=["GO_Biological_Process_2018"],
        organism='Human',
        description='test_name',
        outdir=None,
        cutoff=0.05
    )
    
    return enr.res2d.sort_values(by="Adjusted P-value")

### 8p cis effects

In [3]:
run_enrichr("pancancer_summary_8p_cis.tsv")

Unnamed: 0,Gene_set,Term,Overlap,P-value,Adjusted P-value,Old P-value,Old Adjusted P-value,Odds Ratio,Combined Score,Genes
0,GO_Biological_Process_2018,protein localization to chromosome (GO:0034502),3/27,0.000058,0.295892,0,0,39.682540,387.116807,TNKS;PINX1;CHMP7
5,GO_Biological_Process_2018,protein dephosphorylation (GO:0006470),4/125,0.000415,0.353305,0,0,11.428571,88.985703,PPP2CB;PPP3CC;PPP2R2A;MTMR7
4,GO_Biological_Process_2018,dephosphorylation (GO:0016311),4/124,0.000403,0.411249,0,0,11.520737,90.054170,PPP2CB;PPP3CC;PPP2R2A;MTMR7
12,GO_Biological_Process_2018,nuclear envelope reassembly (GO:0031468),2/18,0.001145,0.449339,0,0,39.682540,268.754478,PPP2R2A;CHMP7
11,GO_Biological_Process_2018,lipid biosynthetic process (GO:0008610),3/72,0.001081,0.459893,0,0,14.880952,101.628542,AGPAT5;LPL;FDFT1
10,GO_Biological_Process_2018,negative regulation of telomere maintenance (G...,2/17,0.001019,0.472881,0,0,42.016807,289.436971,TNKS;PINX1
3,GO_Biological_Process_2018,regulation of telomere maintenance via telomer...,3/51,0.000394,0.502192,0,0,21.008403,164.707201,HMBOX1;TNKS;PINX1
7,GO_Biological_Process_2018,"protein localization to chromosome, telomeric ...",2/15,0.000790,0.503808,0,0,47.619048,340.176271,TNKS;PINX1
13,GO_Biological_Process_2018,viral budding via host ESCRT complex (GO:0039702),2/20,0.001416,0.516288,0,0,35.714286,234.272062,VPS37A;CHMP7
9,GO_Biological_Process_2018,regulation of telomere maintenance via telomer...,2/17,0.001019,0.520169,0,0,42.016807,289.436971,TNKS;PINX1


### 8q cis effects

In [4]:
run_enrichr("pancancer_summary_8q_cis.tsv")

Unnamed: 0,Gene_set,Term,Overlap,P-value,Adjusted P-value,Old P-value,Old Adjusted P-value,Odds Ratio,Combined Score,Genes
0,GO_Biological_Process_2018,positive regulation of protein ubiquitination ...,4/83,0.000311,1.0,0,0,12.357121,99.776638,RNF139;RIPK2;DERL1;TSPYL5
381,GO_Biological_Process_2018,endosomal transport (GO:0016197),2/229,0.224677,1.0,0,0,2.239391,3.343611,SNX16;CHMP4C
380,GO_Biological_Process_2018,fatty acid catabolic process (GO:0009062),1/65,0.224621,1.0,0,0,3.944773,5.890894,DECR1
379,GO_Biological_Process_2018,glycerophospholipid metabolic process (GO:0006...,1/64,0.221575,1.0,0,0,4.006410,6.037633,CPNE3
378,GO_Biological_Process_2018,ribosome biogenesis (GO:0042254),2/226,0.220374,1.0,0,0,2.269117,3.431883,MTERF3;DCAF13
377,GO_Biological_Process_2018,"nuclear-transcribed mRNA catabolic process, de...",1/63,0.218518,1.0,0,0,4.070004,6.190019,PABPC1
376,GO_Biological_Process_2018,negative regulation of dephosphorylation (GO:0...,1/63,0.218518,1.0,0,0,4.070004,6.190019,PLEKHF2
375,GO_Biological_Process_2018,regulation of proteolysis (GO:0030162),1/63,0.218518,1.0,0,0,4.070004,6.190019,RNF139
374,GO_Biological_Process_2018,regulation of viral genome replication (GO:004...,1/63,0.218518,1.0,0,0,4.070004,6.190019,PABPC1
373,GO_Biological_Process_2018,positive regulation of catabolic process (GO:0...,1/62,0.215449,1.0,0,0,4.135649,6.348359,WWP1
