# Cis effects enrichment - Enrichr

This notebook will use Enrichr to look for pathways enriched for proteins that came up across multiple cancers in the cis effects analysis.

## Setup

In [1]:
import pandas as pd
import numpy as np
import gprofiler
import cptac.utils as ut
import gseapy as gp

In [2]:
def run_enrichr(input_file):

    input_df = pd.read_csv(input_file, sep="\t")
    protein_list = input_df["protein"].tolist()

    enr = gp.enrichr(
        gene_list=protein_list,
        gene_sets=["GO_Biological_Process_2018"],
        organism='Human',
        description='test_name',
        outdir=None,
        cutoff=0.05
    )
    
    return enr.res2d.sort_values(by="Adjusted P-value")

## Now with all data sources

### 8p cis effects

In [3]:
run_enrichr("pancancer_summary_8p.tsv")

Unnamed: 0,Gene_set,Term,Overlap,P-value,Adjusted P-value,Old P-value,Old Adjusted P-value,Odds Ratio,Combined Score,Genes
0,GO_Biological_Process_2018,nuclear envelope reassembly (GO:0031468),3/18,0.000014,0.071137,0,0,62.893082,703.190947,REEP4;PPP2R2A;CHMP7
2,GO_Biological_Process_2018,mitotic nuclear envelope reassembly (GO:0007084),2/10,0.000306,0.520278,0,0,75.471698,610.744390,REEP4;PPP2R2A
1,GO_Biological_Process_2018,peptidyl-serine dephosphorylation (GO:0070262),2/10,0.000306,0.780417,0,0,75.471698,610.744390,PPP2CB;PPP2R2A
290,GO_Biological_Process_2018,regulation of protein targeting to mitochondri...,1/88,0.208653,1.000000,0,0,4.288165,6.719904,BAG4
289,GO_Biological_Process_2018,regulation of peptidyl-tyrosine phosphorylatio...,1/85,0.202301,1.000000,0,0,4.439512,7.094331,CNOT7
288,GO_Biological_Process_2018,activation of GTPase activity (GO:0090630),1/84,0.200173,1.000000,0,0,4.492363,7.226304,ARHGEF10
287,GO_Biological_Process_2018,cellular response to molecule of bacterial ori...,1/84,0.200173,1.000000,0,0,4.492363,7.226304,DEFA4
286,GO_Biological_Process_2018,protein modification process (GO:0036211),1/84,0.200173,1.000000,0,0,4.492363,7.226304,MSRA
285,GO_Biological_Process_2018,positive regulation of cell cycle arrest (GO:0...,1/82,0.195899,1.000000,0,0,4.601933,7.501870,CNOT7
284,GO_Biological_Process_2018,positive regulation of transmembrane receptor ...,1/82,0.195899,1.000000,0,0,4.601933,7.501870,RBPMS


### 8q cis effects

In [4]:
run_enrichr("pancancer_summary_8q.tsv")

Unnamed: 0,Gene_set,Term,Overlap,P-value,Adjusted P-value,Old P-value,Old Adjusted P-value,Odds Ratio,Combined Score,Genes
10,GO_Biological_Process_2018,retinal metabolic process (GO:0042574),2/11,0.001429,0.662714,0,0,34.965035,229.059456,SDR16C5;RDH10
12,GO_Biological_Process_2018,"regulation of protein import into nucleus, tra...",2/12,0.001708,0.670630,0,0,32.051282,204.236281,PARP10;UBR5
2,GO_Biological_Process_2018,RNA phosphodiester bond hydrolysis (GO:0090501),3/28,0.000407,0.692438,0,0,20.604396,160.848368,CPSF1;POP1;LACTB2
11,GO_Biological_Process_2018,retinol metabolic process (GO:0042572),2/12,0.001708,0.726516,0,0,32.051282,204.236281,SDR16C5;RDH10
9,GO_Biological_Process_2018,regulation of nuclear-transcribed mRNA poly(A)...,2/11,0.001429,0.728985,0,0,34.965035,229.059456,AGO2;PABPC1
1,GO_Biological_Process_2018,peptide biosynthetic process (GO:0043043),6/174,0.000298,0.761311,0,0,6.631300,53.827255,COPS5;AGO2;RPS20;RPL8;MRPL13;RPL7
17,GO_Biological_Process_2018,cytoplasmic translation (GO:0002181),3/54,0.002795,0.792337,0,0,10.683761,62.820301,RPS20;RPL8;RPL7
14,GO_Biological_Process_2018,"mitochondrial electron transport, ubiquinol to...",2/14,0.002340,0.795952,0,0,27.472527,166.421694,UQCRB;CYC1
8,GO_Biological_Process_2018,positive regulation of nuclear-transcribed mRN...,2/11,0.001429,0.809984,0,0,34.965035,229.059456,AGO2;PABPC1
18,GO_Biological_Process_2018,positive regulation of nuclear-transcribed mRN...,2/16,0.003064,0.823040,0,0,24.038462,139.132089,AGO2;PABPC1
