# Cis effects enrichment - Enrichr

This notebook uses Enrichr to look for pathways that are enriched among the proteins identified in multiple cancer types by the cis effects analysis.

## Setup

In [1]:
import pandas as pd
import numpy as np
import gprofiler
import cptac.utils as ut
import gseapy as gp

In [2]:
def run_enrichr(input_file, gene_sets=None):
    """Query Enrichr with the proteins listed in a tab-separated file.

    Parameters
    ----------
    input_file : str or path-like
        Tab-separated file containing a "protein" column. The values of that
        column are submitted to Enrichr as the gene list.
    gene_sets : str or list of str, optional
        Name(s) of the Enrichr libraries to query. Defaults to
        ["GO_Biological_Process_2018"].

    Returns
    -------
    pandas.DataFrame
        The ``res2d`` table produced by ``gp.enrichr``, sorted by ascending
        "Adjusted P-value". Rows with equal adjusted p-values keep the order
        in which Enrichr returned them.

    Raises
    ------
    KeyError
        If the input file has no "protein" column.
    """
    if gene_sets is None:
        gene_sets = ["GO_Biological_Process_2018"]
    elif isinstance(gene_sets, str):
        # A bare string would otherwise be split into characters by list().
        gene_sets = [gene_sets]

    input_df = pd.read_csv(input_file, sep="\t")
    # Rows without a protein value would otherwise be sent to Enrichr as NaN
    # entries in the gene list.
    protein_list = input_df["protein"].dropna().tolist()

    enr = gp.enrichr(
        gene_list=protein_list,
        gene_sets=list(gene_sets),
        organism='Human',
        description='test_name',
        outdir=None,
        # NOTE(review): the returned table is NOT filtered by this cutoff (the
        # outputs in this notebook include rows with adjusted p > 0.05); it
        # presumably only affects gseapy's own reporting/plots -- confirm.
        cutoff=0.05
    )

    # A stable sort keeps Enrichr's original ranking among tied adjusted
    # p-values; the default sort algorithm may shuffle tied rows.
    return enr.res2d.sort_values(by="Adjusted P-value", kind="mergesort")

### 8p cis effects

In [3]:
# Enrichment for the proteins listed in the 8p cis effects summary table;
# the returned DataFrame is displayed as the cell output.
run_enrichr("pancancer_summary_8p_cis.tsv")

Unnamed: 0,Gene_set,Term,Overlap,P-value,Adjusted P-value,Old P-value,Old Adjusted P-value,Odds Ratio,Combined Score,Genes
0,GO_Biological_Process_2018,protein localization to chromosome (GO:0034502),3/27,0.000064,0.034598,0,0,45.268182,436.836353,TNKS;PINX1;CHMP7
1,GO_Biological_Process_2018,regulation of telomerase activity (GO:0051972),3/42,0.000245,0.042536,0,0,27.836364,231.418175,HMBOX1;TNKS;PINX1
2,GO_Biological_Process_2018,peptidyl-serine dephosphorylation (GO:0070262),2/10,0.000366,0.042536,0,0,88.991071,704.073961,PPP2CB;PPP2R2A
3,GO_Biological_Process_2018,regulation of telomere maintenance via telomer...,3/51,0.000437,0.042536,0,0,22.606818,174.897037,HMBOX1;TNKS;PINX1
4,GO_Biological_Process_2018,dephosphorylation (GO:0016311),4/124,0.000461,0.042536,0,0,12.235802,93.995725,PPP2CB;PPP3CC;PPP2R2A;MTMR7
5,GO_Biological_Process_2018,protein dephosphorylation (GO:0006470),4/125,0.000475,0.042536,0,0,12.134068,92.845636,PPP2CB;PPP3CC;PPP2R2A;MTMR7
12,GO_Biological_Process_2018,nuclear envelope reassembly (GO:0031468),2/18,0.001227,0.050700,0,0,44.477679,298.128023,PPP2R2A;CHMP7
10,GO_Biological_Process_2018,phospholipid metabolic process (GO:0006644),3/70,0.001104,0.050700,0,0,16.180461,110.173335,AGPAT5;LPL;FDFT1
9,GO_Biological_Process_2018,negative regulation of telomere maintenance (G...,2/17,0.001093,0.050700,0,0,47.445238,323.519069,TNKS;PINX1
11,GO_Biological_Process_2018,lipid biosynthetic process (GO:0008610),3/72,0.001198,0.050700,0,0,15.709881,105.686734,AGPAT5;LPL;FDFT1


### 8q cis effects

In [4]:
# Enrichment for the proteins listed in the 8q cis effects summary table;
# the returned DataFrame is displayed as the cell output.
run_enrichr("pancancer_summary_8q_cis.tsv")

Unnamed: 0,Gene_set,Term,Overlap,P-value,Adjusted P-value,Old P-value,Old Adjusted P-value,Odds Ratio,Combined Score,Genes
0,GO_Biological_Process_2018,positive regulation of protein ubiquitination ...,4/83,0.000205,0.113717,0,0,15.228999,129.312516,RNF139;RIPK2;DERL1;TSPYL5
1,GO_Biological_Process_2018,regulation of protein ubiquitination (GO:0031396),4/101,0.000435,0.120497,0,0,12.391753,95.913968,RNF139;RIPK2;DERL1;TSPYL5
2,GO_Biological_Process_2018,organonitrogen compound catabolic process (GO:...,3/56,0.000997,0.164517,0,0,16.792734,116.058223,RIDA;CPQ;ENPP2
3,GO_Biological_Process_2018,positive regulation of protein binding (GO:003...,3/60,0.001218,0.164517,0,0,15.611155,104.759453,RIPK2;DERL1;STK3
4,GO_Biological_Process_2018,positive regulation of protein modification by...,3/65,0.001535,0.164517,0,0,14.348580,92.963760,RIPK2;DERL1;TSPYL5
5,GO_Biological_Process_2018,mitotic recombination (GO:0006312),2/18,0.001782,0.164517,0,0,36.606618,231.725354,NSMCE2;RAD54B
93,GO_Biological_Process_2018,regulation of translation (GO:0006417),3/213,0.038734,0.212913,0,0,4.204691,13.669633,RIDA;RNF139;POLR2K
94,GO_Biological_Process_2018,negative regulation of cellular protein metabo...,2/89,0.038898,0.212913,0,0,6.708249,21.780407,RIDA;RNF139
95,GO_Biological_Process_2018,positive regulation of sequence-specific DNA b...,3/215,0.039646,0.212913,0,0,4.164602,13.442318,RIPK2;STK3;MTDH
96,GO_Biological_Process_2018,protein tetramerization (GO:0051262),2/90,0.039694,0.212913,0,0,6.631684,21.397502,DPYS;DECR1
