In [1]:
import pandas as pd
from gprofiler import GProfiler

In [2]:
# Load the delta-correlation table from a CSV in the working directory.
# The displayed output shows the columns Gene, Delta_Correlation, P_Value,
# FDR and Cancer.
delta_correlation_df = pd.read_csv('delta_correlation_df.csv')
# Bare last expression: render the frame as the cell output.
delta_correlation_df

Unnamed: 0,Gene,Delta_Correlation,P_Value,FDR,Cancer
0,A1BG,-0.388745,5.489179e-02,1.428712e-01,CCRCC
1,A1CF,0.146993,1.086323e-03,5.807113e-03,CCRCC
2,A2M,-0.277035,2.970512e-02,8.941116e-02,CCRCC
3,AAAS,-0.044291,7.083291e-01,8.292938e-01,CCRCC
4,AACS,-0.128218,6.542873e-02,1.627560e-01,CCRCC
...,...,...,...,...,...
50299,ZXDC,0.087794,5.862270e-01,6.491477e-01,LUAD
50300,ZYG11B,0.707991,8.084098e-11,5.520566e-10,LUAD
50301,ZYX,0.472139,3.818601e-08,1.866439e-07,LUAD
50302,ZZEF1,0.418589,2.609770e-15,2.744540e-14,LUAD


In [3]:
# Distinct gene symbols from the full table, in order of first appearance;
# passed later as the custom background for the enrichment query.
background_genes = delta_correlation_df['Gene'].unique().tolist()

In [4]:
# g:Profiler client used for the enrichment query in a later cell.
# return_dataframe=True: presumably makes profile() return a pandas DataFrame
# (the result is later written with .to_csv) -- confirm against gprofiler docs.
gp = GProfiler(return_dataframe=True)

In [5]:
# Pick genes whose delta correlation is significant in several rows of
# delta_correlation_df, rank them by the magnitude of their mean delta
# correlation, and run an ordered GO:BP enrichment against the custom
# background gene list. The result is also written to CSV.
FDR_CUTOFF = 0.05          # rows with FDR below this count as significant
MIN_SIGNIFICANT_ROWS = 3   # a gene needs at least this many significant rows

sig_delta_corr = delta_correlation_df[delta_correlation_df.FDR < FDR_CUTOFF]

# Number of significant rows per gene; the single count column is labelled 0.
num_genes = pd.DataFrame(sig_delta_corr.groupby('Gene').size())
sig_genes = num_genes[num_genes[0] >= MIN_SIGNIFICANT_ROWS].index
sig_delta_corr = sig_delta_corr[sig_delta_corr.Gene.isin(sig_genes)]

# Average the numeric columns per gene. numeric_only=True is needed because
# the frame still carries the string 'Cancer' column: pandas >= 2.0 raises
# TypeError on it by default, while older versions silently dropped it.
sig_delta_corr = sig_delta_corr.groupby('Gene').mean(numeric_only=True)

# NOTE(review): the absolute value is taken AFTER averaging, so opposite-sign
# delta correlations across rows cancel out -- confirm this is intended
# rather than the mean of absolute values.
sig_delta_corr['Delta_Correlation'] = sig_delta_corr.Delta_Correlation.abs()
sig_delta_corr = (
    sig_delta_corr
    .sort_values('Delta_Correlation', ascending=False)
    .reset_index()
)

# Gene symbols in ranked order (largest |mean delta correlation| first).
genes = list(sig_delta_corr.Gene)
pathway_enrichment = gp.profile(
    organism='hsapiens',
    query=genes,
    no_iea=True,
    ordered=True,  # the query is passed in the ranked order built above
    no_evidences=False,
    background=background_genes,
    sources=['GO:BP'],
)
# NOTE(review): 'combinded' looks like a typo for 'combined'; the name is left
# unchanged so anything that already reads this file keeps working.
pathway_enrichment.to_csv('combinded_GO_pathway_enrichment_df.csv', index=False)

In [6]:
# Display the enrichment result table returned by gp.profile().
pathway_enrichment

Unnamed: 0,source,native,name,p_value,significant,description,term_size,query_size,intersection_size,effective_domain_size,precision,recall,query,parents,intersections,evidences
0,GO:BP,GO:0000278,mitotic cell cycle,2.537652e-10,True,"""Progression through the phases of the mitotic...",792,223,56,12414,0.251121,0.070707,query_1,[GO:0007049],"[TRIP13, ZWINT, PBK, MAPRE1, KIF11, CHEK1, NCA...","[[IMP], [IDA, IBA, TAS], [NAS], [TAS], [IDA, I..."
1,GO:BP,GO:1903047,mitotic cell cycle process,5.17429e-08,True,"""A process that is part of the mitotic cell cy...",702,743,106,12414,0.142665,0.150997,query_1,"[GO:0000278, GO:0022402]","[TRIP13, ZWINT, MAPRE1, KIF11, CHEK1, NCAPD3, ...","[[IMP], [IDA, IBA, TAS], [TAS], [IDA, IMP, IBA..."
2,GO:BP,GO:0007049,cell cycle,1.03282e-06,True,"""The progression of biochemical and morphologi...",1143,223,64,12414,0.286996,0.055993,query_1,[GO:0009987],"[TRIP13, ZWINT, PBK, MAPRE1, KIF11, CHEK1, NCA...","[[IMP, ISS, IBA], [IDA, IBA, TAS], [NAS], [IBA..."
3,GO:BP,GO:0022402,cell cycle process,1.700306e-06,True,"""The cellular process that ensures successive ...",969,746,134,12414,0.179625,0.138287,query_1,"[GO:0007049, GO:0009987]","[TRIP13, ZWINT, MAPRE1, KIF11, CHEK1, NCAPD3, ...","[[IMP, ISS, IBA], [IDA, IBA, TAS], [IBA, TAS],..."
4,GO:BP,GO:0006271,DNA strand elongation involved in DNA replication,3.932273e-06,True,"""The process in which an existing DNA strand i...",18,1575,15,12414,0.009524,0.833333,query_1,"[GO:0006261, GO:0022616]","[GINS3, PCNA, GINS1, MCM3, MCM7, MCM4, GINS2, ...","[[TAS], [IBA], [IBA, TAS], [IBA], [IBA], [IBA]..."
5,GO:BP,GO:0007052,mitotic spindle organization,8.815392e-06,True,"""A process that is carried out at the cellular...",172,223,20,12414,0.089686,0.116279,query_1,"[GO:0007051, GO:1902850]","[ZWINT, MAPRE1, KIF11, TPX2, KIFC1, PRC1, NDC8...","[[TAS], [TAS], [IDA, IMP, IBA, TAS], [IDA, ISS..."
6,GO:BP,GO:0140014,mitotic nuclear division,2.101378e-05,True,"""A mitotic cell cycle process comprising the s...",269,487,39,12414,0.080082,0.144981,query_1,"[GO:0000280, GO:1903047]","[TRIP13, ZWINT, KIF11, CHEK1, NCAPD3, TPX2, KI...","[[IMP], [IDA, IBA], [IDA, IMP, IBA], [IDA], [I..."
7,GO:BP,GO:0051276,chromosome organization,2.257688e-05,True,"""A process that is carried out at the cellular...",823,770,116,12414,0.150649,0.140948,query_1,[GO:0006996],"[DHX36, TRIP13, ZWINT, NSD3, RIOX1, CHEK1, NCA...","[[IDA, IMP], [IMP, ISS], [IDA, IBA], [IDA, IMP..."
8,GO:BP,GO:1902850,microtubule cytoskeleton organization involved...,3.176894e-05,True,"""Any microtubule cytoskeleton organization tha...",183,223,20,12414,0.089686,0.10929,query_1,"[GO:0000226, GO:1903047]","[ZWINT, MAPRE1, KIF11, TPX2, KIFC1, PRC1, NDC8...","[[TAS], [TAS], [IDA, IMP, IBA, TAS], [IDA, ISS..."
9,GO:BP,GO:0000075,cell cycle checkpoint signaling,3.743448e-05,True,"""A signaling process that controls cell cycle ...",146,230,19,12414,0.082609,0.130137,query_1,"[GO:0035556, GO:1901988]","[TRIP13, ZWINT, CHEK1, NDC80, USP28, BLM, TP53...","[[IMP, IBA], [IDA], [IDA, IMP], [IMP], [IMP, I..."
