In [1]:
# Jupyter notebook in Jupytext format

## Initialisation

In [2]:
import os

# Locate the project root: the part of the current working directory that runs
# from its start through the first occurrence of the marker "project".
project_marker = "project"
path = os.getcwd()
# index of the first occurrence of the marker, or -1 when it is absent
index_project = path.find(project_marker)
if index_project == -1:
    # Slicing with -1 would silently keep an arbitrary prefix of the path and
    # chdir into the wrong directory, so fail loudly instead.
    raise RuntimeError(
        f"Cannot locate the project root: {project_marker!r} does not occur in {path!r}"
    )
# keep everything from the start of the path through the end of the marker
project_path = path[: index_project + len(project_marker)]
# set the working directory; later cells pass relative file names to project helpers
os.chdir(project_path)
print(f"Project path set to: {os.getcwd()}")

Project path set to: c:\Github\ode-biomarker-project


In [3]:
from PathLoader import PathLoader #noqa: E402

# Configure the project's PathLoader from two env files. Its get_data_path()
# is what later cells use as the prefix for result paths.
# NOTE(review): presumably the first file holds shared data locations and the
# second selects the active user — confirm against PathLoader.
path_loader = PathLoader(
    "data_config.env",
    "current_user.env",
)

In [4]:
from DataLink import DataLink #noqa: E402

# Build the DataLink on top of the path loader and the data-code table.
# Every dataset in this notebook is fetched through
# data_link.get_data_using_code(<code>), which is unpacked as a
# (features, labels) pair.
data_link = DataLink(
    path_loader,
    "data_codes.csv",
)

In [5]:
# Output location for this experiment's results.
folder_name = "ThesisResult2-1-DynamicFeatures"
exp_id = "v1"

# Build the results directory once instead of repeating the same f-string.
# The data path is concatenated directly with "data/...", so it presumably
# already ends with a path separator (TODO confirm in PathLoader).
results_dir = f"{path_loader.get_data_path()}data/results/{folder_name}/{exp_id}"

# exist_ok=True creates any missing parents and does nothing when the directory
# already exists, so no separate existence check (and no check-then-create
# race) is needed. It raises if the path exists but is not a directory.
os.makedirs(results_dir, exist_ok=True)

# Same directory with a trailing slash, presumably so later cells can append
# file names directly.
file_save_path = f"{results_dir}/"

### Loading CDK4/6 RNASeq data and Dynamic Features

In [6]:
# CDK4/6 section: transcriptomics (RNASeq) features and Palbociclib labels,
# fetched as a (features, labels) pair through the data-code lookup.
loading_code = "ccle-gdsc-2-Palbociclib-LN_IC50"
(
    cdk46_rnaseq_feature_data,
    cdk46_rnaseq_label_data,
) = data_link.get_data_using_code(loading_code)

# Report both shapes, one per line, as a quick check that rows line up.
print(
    f"RNASeq feature data shape: {cdk46_rnaseq_feature_data.shape}",
    f"RNASeq label data shape: {cdk46_rnaseq_label_data.shape}",
    sep="\n",
)

RNASeq feature data shape: (584, 19221)
RNASeq label data shape: (584,)


In [7]:

# Dynamic features for the CDK4/6 RNASeq section. They get section-specific
# names because the generic names below are reassigned by every later
# dynamic-feature cell in this notebook, which would otherwise make this
# dataset unreachable.
cdk46_rnaseq_dynamic_feature_data, cdk46_rnaseq_dynamic_label_data = (
    data_link.get_data_using_code(
        "generic-gdsc-2-Palbociclib-LN_IC50-cdk46_ccle_dynamic_features_v4_ccle-true-Unnamed: 0"
    )
)
# Generic aliases kept for code that still reads them; they always refer to the
# most recently loaded dynamic dataset.
feature_data_dynamic, label_data_dynamic = (
    cdk46_rnaseq_dynamic_feature_data,
    cdk46_rnaseq_dynamic_label_data,
)
print(f"Dynamic dataset shape: {feature_data_dynamic.shape}")
print(f"Dynamic label shape: {label_data_dynamic.shape}")

Dynamic dataset shape: (584, 590)
Dynamic label shape: (584,)


### Loading CDK4/6 Proteomics data and Dynamic Features

In [8]:
# CDK4/6 section: proteomics features and Palbociclib labels, fetched as a
# (features, labels) pair through the data-code lookup.
loading_code = "goncalves-gdsc-2-Palbociclib-LN_IC50-sin"
(
    proteomic_feature_data,
    proteomic_label_data,
) = data_link.get_data_using_code(loading_code)

# Report both shapes, one per line, as a quick check that rows line up.
print(
    f"Proteomic feature data shape: {proteomic_feature_data.shape}",
    f"Proteomic label data shape: {proteomic_label_data.shape}",
    sep="\n",
)

Proteomic feature data shape: (737, 6692)
Proteomic label data shape: (737,)


In [9]:

# Dynamic features for the CDK4/6 proteomics section. They get section-specific
# names because the generic names below are shared with the other
# dynamic-feature cells in this notebook and are overwritten each time one of
# them runs.
cdk46_proteomic_dynamic_feature_data, cdk46_proteomic_dynamic_label_data = (
    data_link.get_data_using_code(
        "generic-gdsc-2-Palbociclib-LN_IC50-cdk46_ccle_dynamic_features_v4_ccle_proteomics-true-Unnamed: 0"
    )
)
# Generic aliases kept for code that still reads them; they always refer to the
# most recently loaded dynamic dataset.
feature_data_dynamic, label_data_dynamic = (
    cdk46_proteomic_dynamic_feature_data,
    cdk46_proteomic_dynamic_label_data,
)
print(f"Proteomic Dynamic dataset shape: {feature_data_dynamic.shape}")
print(f"Proteomic Dynamic label shape: {label_data_dynamic.shape}")

Proteomic Dynamic dataset shape: (255, 590)
Proteomic Dynamic label shape: (255,)


### Loading FGFR4 RNASeq data and Dynamic Features

In [10]:
# FGFR4 section: RNASeq features and FGFR_0939 labels, fetched as a
# (features, labels) pair through the data-code lookup.
loading_code = "ccle-gdsc-1-FGFR_0939-LN_IC50"
(
    fgfr4_RNASeq_feature_data,
    fgfr4_RNASeq_label_data,
) = data_link.get_data_using_code(loading_code)

# Report both shapes, one per line, as a quick check that rows line up.
print(
    f"feature data shape: {fgfr4_RNASeq_feature_data.shape}",
    f"label data shape: {fgfr4_RNASeq_label_data.shape}",
    sep="\n",
)

feature data shape: (667, 19221)
label data shape: (667,)


In [12]:

# Dynamic features for the FGFR4 RNASeq section. They get section-specific
# names because the generic names below are shared with the other
# dynamic-feature cells in this notebook and are overwritten each time one of
# them runs.
fgfr4_RNASeq_dynamic_feature_data, fgfr4_RNASeq_dynamic_label_data = (
    data_link.get_data_using_code(
        "generic-gdsc-1-FGFR_0939-LN_IC50-fgfr4_ccle_dynamic_features_v2-true-Unnamed: 0"
    )
)
# Generic aliases kept for code that still reads them; they always refer to the
# most recently loaded dynamic dataset.
feature_data_dynamic, label_data_dynamic = (
    fgfr4_RNASeq_dynamic_feature_data,
    fgfr4_RNASeq_dynamic_label_data,
)
print(f"Dynamic dataset shape: {feature_data_dynamic.shape}")
print(f"Dynamic label shape: {label_data_dynamic.shape}")

Dynamic dataset shape: (665, 260)
Dynamic label shape: (665,)


### Loading FGFR4 Proteomics data and Dynamic Features

In [13]:
# Load FGFR4 Proteomics dataset
loading_code = "goncalves-gdsc-1-FGFR_0939-LN_IC50-sin"
# Stored under proteomic-specific names so the RNASeq data held in
# fgfr4_RNASeq_feature_data / fgfr4_RNASeq_label_data is not overwritten by
# this load. Any cell that needs the FGFR4 proteomics data must read these names.
fgfr4_proteomic_feature_data, fgfr4_proteomic_label_data = data_link.get_data_using_code(
    loading_code
)

print(f"feature data shape: {fgfr4_proteomic_feature_data.shape}")
print(f"label data shape: {fgfr4_proteomic_label_data.shape}")

feature data shape: (891, 6692)
label data shape: (891,)


In [14]:

# Dynamic features for the FGFR4 proteomics section. They get section-specific
# names because the generic names below are shared with the other
# dynamic-feature cells in this notebook and are overwritten each time one of
# them runs.
fgfr4_proteomic_dynamic_feature_data, fgfr4_proteomic_dynamic_label_data = (
    data_link.get_data_using_code(
        "generic-gdsc-1-FGFR_0939-LN_IC50-fgfr4_dynamic_features_v3_proteomic-true-Row"
    )
)
# Generic aliases kept for code that still reads them; they always refer to the
# most recently loaded dynamic dataset.
feature_data_dynamic, label_data_dynamic = (
    fgfr4_proteomic_dynamic_feature_data,
    fgfr4_proteomic_dynamic_label_data,
)
print(f"Dynamic dataset shape: {feature_data_dynamic.shape}")
print(f"Dynamic label shape: {label_data_dynamic.shape}")

Dynamic dataset shape: (203, 260)
Dynamic label shape: (203,)


## Functions