# Trans effects enrichment - Enrichr

This notebook uses Enrichr (through the `gseapy` package) to look for Reactome pathways and GO biological process terms that are enriched among the proteins that appeared across multiple cancers in the trans effects analysis.

## Setup

In [1]:
import pandas as pd
import numpy as np
import gprofiler
import gseapy as gp
import os
import IPython.display

In [2]:
def run_enrichr_reactome(input_file, cancer_type=None):
    """Run Enrichr against the local Reactome gene set file.

    Parameters
    ----------
    input_file : str or path-like
        Tab-separated table with a "protein" column and, when
        `cancer_type` is given, a "cancers" column.
    cancer_type : str, optional
        Pattern handed to `Series.str.contains` to pick the rows whose
        "cancers" value matches. Rows with a missing "cancers" value are
        treated as non-matching. When None, every row is used.

    Returns
    -------
    pandas.DataFrame
        The `res2d` table of the Enrichr result, sorted in ascending
        order of "Adjusted P-value".
    """
    input_df = pd.read_csv(input_file, sep="\t")

    if cancer_type is not None:
        # na=False keeps the mask strictly boolean; without it a missing
        # "cancers" value puts NaN in the mask and the indexing below raises.
        matches_cancer = input_df["cancers"].str.contains(cancer_type, na=False)
        selected_df = input_df[matches_cancer]
    else:
        selected_df = input_df

    # Missing protein names would otherwise reach the gene list as float NaN.
    protein_list = selected_df["protein"].dropna().tolist()

    enr = gp.enrichr(
        gene_list=protein_list,
        gene_sets=os.path.join("gene_set_libraries", "ReactomePathways.gmt"),
        background="hsapiens_gene_ensembl",
        organism='Human',
        description='test_name',
        outdir=None,
        cutoff=0.05
    )

    return enr.res2d.sort_values(by="Adjusted P-value")

In [3]:
def run_enrichr_go(input_file, cancer_type=None):
    """Run Enrichr against the "GO_Biological_Process_2018" library.

    Parameters
    ----------
    input_file : str or path-like
        Tab-separated table with a "protein" column and, when
        `cancer_type` is given, a "cancers" column.
    cancer_type : str, optional
        Pattern handed to `Series.str.contains` to pick the rows whose
        "cancers" value matches. Rows with a missing "cancers" value are
        treated as non-matching. When None, every row is used.

    Returns
    -------
    pandas.DataFrame
        The `res2d` table of the Enrichr result, sorted in ascending
        order of "Adjusted P-value".
    """
    input_df = pd.read_csv(input_file, sep="\t")

    if cancer_type is not None:
        # na=False keeps the mask strictly boolean; without it a missing
        # "cancers" value puts NaN in the mask and the indexing below raises.
        matches_cancer = input_df["cancers"].str.contains(cancer_type, na=False)
        selected_df = input_df[matches_cancer]
    else:
        selected_df = input_df

    # Missing protein names would otherwise reach the gene list as float NaN.
    protein_list = selected_df["protein"].dropna().tolist()

    enr = gp.enrichr(
        gene_list=protein_list,
        gene_sets=["GO_Biological_Process_2018"],
        organism='Human',
        description='test_name',
        outdir=None,
        cutoff=0.05
    )

    return enr.res2d.sort_values(by="Adjusted P-value")

### 8q trans effects in BRCA

In [4]:
# Reactome enrichment for the rows of the 8q trans summary whose "cancers" value matches "brca".
run_enrichr_reactome("pancancer_summary_8q_trans.tsv", cancer_type="brca")

Unnamed: 0,Gene_set,Term,Overlap,P-value,Adjusted P-value,Genes
721,CUSTOM140678194177440,Mitochondrial translation elongation (R-HSA-53...,66/91,2.317373e-55,3.318478e-52,MRPL47;MRPS15;MRPS34;DAP3;MRPL58;PTCD3;MRPS31;...
722,CUSTOM140678194177440,Mitochondrial translation initiation (R-HSA-53...,65/91,7.967065e-54,3.802946e-51,MRPL47;MRPS15;MRPS34;DAP3;MRPL58;PTCD3;MRPS31;...
720,CUSTOM140678194177440,Mitochondrial translation (R-HSA-5368287),67/97,6.970485e-54,3.802946e-51,MRPL47;MRPS15;MRPS34;DAP3;MRPL58;PTCD3;MRPS31;...
723,CUSTOM140678194177440,Mitochondrial translation termination (R-HSA-5...,64/91,2.595649e-52,9.292422e-50,MRPL47;MRPS15;MRPS34;DAP3;MRPL58;PTCD3;MRPS31;...
1334,CUSTOM140678194177440,Translation (R-HSA-72766),70/303,1.050871e-18,3.009695e-16,MRPL47;MRPS15;MRPS34;DAP3;MRPL58;PTCD3;MRPS31;...
683,CUSTOM140678194177440,Membrane Trafficking (R-HSA-199991),108/611,1.280923e-18,3.057136e-16,PPP6C;RAB33B;TRAPPC1;COG6;COPE;SEC24D;AP2M1;SN...
168,CUSTOM140678194177440,"Cell Cycle, Mitotic (R-HSA-69278)",98/530,2.347198e-18,4.801697e-16,SMC1A;PPP2CB;CDCA5;PSME3;CDC20;NCAPG;NUP50;POL...
166,CUSTOM140678194177440,Cell Cycle (R-HSA-1640170),108/662,4.734794e-16,8.475281e-14,PPP6C;SMC1A;PPP2CB;CDCA5;PSME3;CDC20;NCAPG;CHT...
1379,CUSTOM140678194177440,Vesicle-mediated transport (R-HSA-5653656),115/730,6.872895e-16,1.093554e-13,PPP6C;RAB33B;TRAPPC1;COG6;COPE;SEC24D;AP2M1;SN...
702,CUSTOM140678194177440,Metabolism of proteins (R-HSA-392499),239/2017,1.059699e-15,1.517490e-13,PPP6C;MRPS34;MRPS15;SMC1A;CPA3;MRPL58;PSME3;RA...


In [5]:
# GO biological process enrichment for the rows of the 8q trans summary whose "cancers" value matches "brca".
run_enrichr_go("pancancer_summary_8q_trans.tsv", cancer_type="brca")

Unnamed: 0,Gene_set,Term,Overlap,P-value,Adjusted P-value,Old P-value,Old Adjusted P-value,Odds Ratio,Combined Score,Genes
0,GO_Biological_Process_2018,mitochondrial translational elongation (GO:007...,66/87,6.015934e-59,3.069931e-55,0,0,11.074755,1.484661e+03,MRPS17;MRPS15;GFM1;MRPS16;MRPS11;MRPS12;MRPL38...
1,GO_Biological_Process_2018,mitochondrial translation (GO:0032543),70/107,3.727789e-55,9.511453e-52,0,0,9.550447,1.196923e+03,MRPS17;MRPS15;GFM1;MRPS16;MRPS11;MRPS12;MRPL38...
2,GO_Biological_Process_2018,mitochondrial translational termination (GO:00...,64/89,1.188620e-54,2.021843e-51,0,0,10.497827,1.303482e+03,MRPS17;MRPS15;MRPS16;MRPS11;MRPS12;MRPL38;MRPL...
3,GO_Biological_Process_2018,translational termination (GO:0006415),65/96,9.109382e-53,1.162129e-49,0,0,9.884428,1.184428e+03,MRPS17;MRPS15;MRPS16;MRPS11;MRPS12;MRPL38;MRPL...
4,GO_Biological_Process_2018,translational elongation (GO:0006414),67/105,9.506891e-52,9.702733e-49,0,0,9.315259,1.094379e+03,MRPS17;MRPS15;GFM1;MRPS16;MRPS11;MRPS12;MRPL38...
5,GO_Biological_Process_2018,mitochondrial gene expression (GO:0140053),26/45,2.921079e-19,2.484378e-16,0,0,8.434712,3.599696e+02,MRPS17;MRPS15;MRPS16;MRPS11;MRPS12;MRPS34;MRPL...
6,GO_Biological_Process_2018,Golgi vesicle transport (GO:0048193),64/271,8.995753e-19,6.557904e-16,0,0,3.447626,1.432570e+02,SNAP23;GCC2;MIA3;KIF11;KIF15;ACTR1A;CTSC;SCYL1...
7,GO_Biological_Process_2018,mitotic sister chromatid segregation (GO:0000070),29/82,4.680762e-14,2.985741e-11,0,0,5.162898,1.584634e+02,CDCA5;AKAP8L;KIF14;NCAPG;CDCA8;PDS5A;SMC4;NCAP...
8,GO_Biological_Process_2018,ribosome biogenesis (GO:0042254),50/226,9.081594e-14,5.149264e-11,0,0,3.229766,9.698967e+01,DDX47;PAK1IP1;RPP30;WDR3;MRPS12;WDR43;RRP9;FBL...
9,GO_Biological_Process_2018,rRNA processing (GO:0006364),46/202,2.953424e-13,1.507132e-10,0,0,3.324420,9.591165e+01,DDX27;DDX47;RPP30;WDR3;MRPS12;ISG20L2;NAT10;TF...


### 8q trans effects in LSCC

In [6]:
# Reactome enrichment for the rows of the 8q trans summary whose "cancers" value matches "lscc".
run_enrichr_reactome("pancancer_summary_8q_trans.tsv", cancer_type="lscc")

Unnamed: 0,Gene_set,Term,Overlap,P-value,Adjusted P-value,Genes
391,CUSTOM140678188855376,Immune System (R-HSA-168256),167/2225,1.535807e-26,1.649457e-23,ICAM1;ELMO1;FCGR1A;ELMO2;NUP50;F13A1;MYO9B;TAP...
67,CUSTOM140678188855376,Asparagine N-linked glycosylation (R-HSA-446203),42/286,1.976548e-16,1.061406e-13,GMPPB;EDEM3;NAGK;DCTN6;MCFD2;DCTN5;COPG1;COPE;...
41,CUSTOM140678188855376,Adaptive Immune System (R-HSA-1280218),75/828,5.699210e-16,2.040317e-13,PSMB6;RBCK1;PPP3R1;ICAM1;RNF130;PIK3CD;DCTN6;F...
494,CUSTOM140678188855376,Membrane Trafficking (R-HSA-199991),59/611,6.062932e-14,1.627897e-11,DENND1C;KIF13B;DENND1B;CYTH4;DCTN6;AGPAT3;MCFD...
405,CUSTOM140678188855376,Innate Immune System (R-HSA-168249),86/1141,1.614778e-13,3.468544e-11,ELMO1;FCGR1A;ELMO2;MYO9B;CAPZA1;SURF4;LIMK1;IQ...
1034,CUSTOM140678188855376,Vesicle-mediated transport (R-HSA-5653656),64/730,4.195528e-13,7.509996e-11,HYOU1;DENND1C;KIF13B;DENND1B;CYTH4;DCTN6;AGPAT...
926,CUSTOM140678188855376,TCR signaling (R-HSA-202403),21/126,6.719059e-10,1.030896e-07,PSMB6;PSMB5;PRKCQ;PSMB10;CD4;PSMB9;INPP5D;CSK;...
167,CUSTOM140678188855376,Cytokine Signaling in Immune system (R-HSA-128...,64/875,9.492464e-10,1.274363e-07,PSMB6;ICAM1;TRIM26;PIK3CD;SOD2;FCGR1A;IRF8;PSM...
871,CUSTOM140678188855376,Signaling by Rho GTPases (R-HSA-194315),39/405,1.404010e-09,1.675452e-07,FGD2;ARHGAP18;PPP1R12A;ARHGAP25;ABR;ACTR3;PPP2...
242,CUSTOM140678188855376,ER to Golgi Anterograde Transport (R-HSA-199977),21/136,2.830379e-09,3.039827e-07,DCTN6;MCFD2;DCTN5;COPG1;COPE;CAPZA2;CAPZA1;LMA...


In [7]:
# GO biological process enrichment for the rows of the 8q trans summary whose "cancers" value matches "lscc".
run_enrichr_go("pancancer_summary_8q_trans.tsv", cancer_type="lscc")

Unnamed: 0,Gene_set,Term,Overlap,P-value,Adjusted P-value,Old P-value,Old Adjusted P-value,Odds Ratio,Combined Score,Genes
0,GO_Biological_Process_2018,T cell receptor signaling pathway (GO:0050852),28/163,1.349705e-13,6.887546e-10,0,0,5.568206,165.006644,DENND1B;WAS;PIK3CD;CD3E;PSMB10;PSMB6;PSMB7;PSM...
1,GO_Biological_Process_2018,antigen receptor-mediated signaling pathway (G...,31/257,9.603486e-11,2.450329e-07,0,0,3.909970,90.188575,DENND1B;WAS;PIK3CD;CD3E;PSMB10;PSMB6;CD79A;PSM...
2,GO_Biological_Process_2018,Golgi vesicle transport (GO:0048193),31/271,3.670415e-10,6.243375e-07,0,0,3.707979,80.557864,DCTN6;ARF4;DCTN5;COPA;MCFD2;SAR1B;COPB1;KIF15;...
3,GO_Biological_Process_2018,vesicle-mediated transport (GO:0016192),39/410,5.069210e-10,6.467045e-07,0,0,3.083370,65.992329,DENND1C;VPS29;DENND1B;STX12;RAB5C;WIPF1;TGFBRA...
4,GO_Biological_Process_2018,positive regulation of T cell activation (GO:0...,15/68,1.800822e-09,1.837919e-06,0,0,7.150348,143.972418,TFRC;DOCK8;CD3E;AIF1;ZAP70;HLA-DMB;PTPRC;CD6;L...
5,GO_Biological_Process_2018,T cell activation (GO:0042110),16/88,1.023948e-08,8.708676e-06,0,0,5.893620,108.425019,PIK3CD;RHOH;MSN;CD3E;PIK3CG;DDOST;CD2;ZAP70;PP...
6,GO_Biological_Process_2018,transmembrane receptor protein tyrosine kinase...,35/396,2.618776e-08,1.909088e-05,0,0,2.864954,50.016296,ATP6V1A;ARPC1B;CD3E;GRAP2;BLNK;ATP6V1H;NCKAP1L...
7,GO_Biological_Process_2018,ER to Golgi vesicle-mediated transport (GO:000...,22/180,4.051468e-08,2.584330e-05,0,0,3.961822,67.436563,NSF;DCTN6;ARF4;DCTN5;COPA;MCFD2;SAR1B;COPB1;CO...
8,GO_Biological_Process_2018,protein transport (GO:0015031),30/326,1.083905e-07,6.145739e-05,0,0,2.982967,47.839414,ATP6V1A;VPS29;STX12;COPA;TBC1D9B;RAB5C;TFRC;HS...
9,GO_Biological_Process_2018,"retrograde vesicle-mediated transport, Golgi t...",14/80,1.409860e-07,7.194514e-05,0,0,5.672609,89.483175,NSF;ARF4;COPA;COPB1;SURF4;COPZ1;KIF15;TAPBP;AR...
