# Mine DepMap data set for Cell Cycle Regulators (n=4,672)
### Aim:
Search the GO terms in the GSEA results for communities that are enriched in specific cell cycle terms.
<br>
### Output:
A DataFrame of genes whose communities are enriched in cell cycle terms, exported as a CSV file.

In [1]:
# Import packages and DepMap tools
import os
from DepMapTools.DataImport import SaveLoad
from DepMapTools.GeneOntology import OntologyAnalysis
from DepMapTools.Networks import Permutations
from DepMapTools.Mine import MineData

In [2]:
# Create one instance of each DepMapTools helper class.
# Constructors run left to right: SaveLoad, MineData, OntologyAnalysis, Permutations.
sl, md, oa, pm = SaveLoad(), MineData(), OntologyAnalysis(), Permutations()

In [3]:
# Build the paths to the two community-analysis pickle files, relative to the
# parent directory (PRD).
# NOTE: at this point k_emp holds a *path string*, not loaded data.
PRD = ".."
k_path, k_emp = (
    os.path.join(PRD, rel_path)
    for rel_path in (
        '2_Community_Analysis/pickle_files/chronos_k_community_funk.pickle',
        '2_Community_Analysis/pickle_files/chronos_k_permute_funk.pickle',
    )
)

In [4]:
# Load both pickled community-analysis objects (community file first, then
# permutation file).
# NOTE: k_emp is rebound here from its path string to the loaded object, so
# re-running this cell without first re-running the path cell would pass the
# loaded object to load_dict_pickle instead of a path.
k_dict, k_emp = map(sl.load_dict_pickle, (k_path, k_emp))

In [5]:
# Make final dict
# Combines the loaded community object (k_dict) with the loaded permutation
# object (k_emp) through Permutations.make_sig_dict; the result (funk) is the
# input that mine_terms searches further down.
# NOTE(review): presumably keeps only communities that are significant
# relative to the permutation results — confirm against make_sig_dict.
funk = pm.make_sig_dict(k_dict, k_emp)

In [6]:
# Map each cell cycle search term to the score associated with it.
# NOTE(review): how the scores are used is decided by mine_terms — confirm there.
term_dict = {
    'G1/S': 7,
    'G2/M': 8,
    'metaphase/anaphase': 4,
}

In [7]:
# Mine the dataset using the term dictionary
# Passes the term -> score mapping and the funk dictionary to
# MineData.mine_terms; the returned object is exported with .to_csv() below.
# NOTE(review): p_val=1 presumably disables p-value filtering (every result
# passes a <= 1 cutoff) — confirm against mine_terms.
mine_df = md.mine_terms(term_dict, funk, p_val=1)

Searching Terms
--------------------
G1/S : 2 genes
G2/M : 2 genes
metaphase/anaphase : 2 genes
--------------------
Compiling DF
--------------------
Complete


In [8]:
# Export df to CSV
# PRD is re-declared with the same value used for the input paths.
PRD = ".."
export_path = os.path.join(PRD, '4_Mine_CellCycle/identified_genes_final.csv')
# Pass the path directly: wrapping it in fr'{...}' only re-formatted the same
# string. index=False leaves the DataFrame index out of the written file.
mine_df.to_csv(export_path, index=False)