# Regenerate Dynamic Features Using Python

## FGFR4 Dataset

### Data Init

In [1]:
import os

import numpy as np
import pandas as pd

# Move the kernel's working directory up to the project root.
# NOTE(review): presumably needed so the project-local modules and the relative
# config file names used in later cells resolve — confirm.
path = os.getcwd()
project_marker = 'project'
# position of the first occurrence of the marker in the current path
index_project = path.find(project_marker)
# str.find returns -1 when the marker is absent; slicing with that value would
# silently yield a meaningless prefix of the path, so fail loudly instead.
if index_project == -1:
    raise FileNotFoundError(
        f"Cannot locate the project root: {project_marker!r} does not occur in {path!r}"
    )
# keep the path from its start through the end of the marker
project_path = path[:index_project + len(project_marker)]
# set the working directory
os.chdir(project_path)
print(f'Project path set to: {os.getcwd()}')

Project path set to: c:\Github\ode-biomarker-project


In [2]:
# Project-local helpers used to bring in the CCLE data.
from PathLoader import PathLoader
from DataLink import DataLink

# PathLoader is built from the two .env file names; DataLink receives that
# loader together with the 'data_codes.csv' file name.
path_loader = PathLoader(
    'data_config.env',
    'current_user.env',
)
data_link = DataLink(
    path_loader,
    'data_codes.csv',
)

In [3]:
# Load the original CCLE data through its loading code.
# Code layout:
#   generic-gdsc-{number}-{drug_name}-{target_label}-{dataset_name}-{replace_index}-{row_index}
loading_code = 'generic-gdsc-1-FGFR_0939-LN_IC50-fgfr4_ccle_dynamic_features-true-Row'
# The call result is unpacked into two parts: features first, labels second.
loaded_pair = data_link.get_data_using_code(loading_code)
feature_data, label_data = loaded_pair

In [5]:
# Load the data registered under the 'fgfr4_model_raw_simulation' code.
# NOTE(review): this cell calls get_data_from_code, whereas the CCLE load uses
# get_data_using_code — confirm that both methods exist on DataLink.
loading_code = 'fgfr4_model_raw_simulation'
simulation_data = data_link.get_data_from_code(
    loading_code,
)

In [6]:
from get_dynamic_features import get_dynamic_features

### Run Program

In [7]:
# Distinct cell-line identifiers found in the 'Cellline' column.
cellline_column = simulation_data['Cellline']
all_celllines = cellline_column.unique()
# Species names: every column label from the third column onward.
# NOTE(review): assumes the first two columns are not species — confirm
# against the simulation table layout.
all_species = simulation_data.columns[2:]

In [9]:
# Show the species names and the cell-line identifiers, one labelled line each.
for label, values in (
    ('all species:', all_species),
    ('all celllines:', all_celllines),
):
    print(label, values)

all species: Index(['pIGFR', 'pFGFR4', 'pERBB', 'pIRS', 'aPI3K', 'PIP3', 'pFRS2', 'aGrb2',
       'pAkt', 'aPDK1', 'amTORC1', 'pS6K', 'aSos', 'aShp2', 'aRas', 'aRaf',
       'pMEK', 'pERK', 'aGAB1', 'aGAB2', 'SPRY2', 'pSPRY2', 'PTP', 'aCbl',
       'FOXO', 'amTORC2'],
      dtype='object')
all celllines: ['ACH-001113' 'ACH-001289' 'ACH-001339' ... 'ACH-001858' 'ACH-001997'
 'ACH-000052']


In [14]:
# Boolean mask marking the rows that belong to cell line 'ACH-001113'.
is_selected_cellline = simulation_data['Cellline'] == 'ACH-001113'
# Keep only those rows, then take the 'pAkt' column from them.
selected_data = simulation_data.loc[is_selected_cellline]
specie_data = selected_data['pAkt']

In [15]:
# Plain-text dump of the series selected in the previous cell.
print(specie_data)

0     5.692853
1     1.515733
2     4.342809
3     5.469497
4     6.159255
5     6.736439
6     7.201853
7     7.569843
8     7.863404
9     8.102042
10    8.299919
11    8.466945
12    8.610290
13    8.734981
14    8.844819
15    8.942670
16    9.030716
17    9.110656
18    9.183834
19    9.251323
20    9.314000
21    9.372586
22    9.427645
23    9.479653
24    9.529036
Name: pAkt, dtype: float64


## CDK4/6 Dataset