In [1]:
# --- SETUP GITHUB AND GCP ENVIRONMENT VARIABLES ---
# Ensure the following environmental variables are set in Colab user data:
# - GITHUB_PAT: GitHub Personal Access Token
# - GITHUB_EMAIL: GitHub email for commits
# - GITHUB_USER_NAME: GitHub username
# - GCP_EEG_PROJECT_ID: Google Cloud Project ID
# - GCP_EEG_BUCKET_NAME: (Optional) GCP bucket for EEG data

# Select environment
ENVIRONMENT = 'colab'   # Choose 'local' or 'colab'
BRANCH_NAME = 'main'
REPOSITORY_OWNER = 'tristan-day-research'
REPOSITORY = 'CIBMTR_cancer_outcome_predictions'
GOOGLE_DRIVE_DIR = 'CIBMTR_data'

if ENVIRONMENT == 'colab':
    from google.colab import userdata

    # Retrieve GitHub credentials from Colab user data
    token = userdata.get('GITHUB_PAT')
    github_email = userdata.get('GITHUB_EMAIL')
    github_username = userdata.get('GITHUB_USER_NAME')

    # Clone the repository (done here as the helper file isn't available yet)
    !git clone -b {BRANCH_NAME} https://{token}@github.com/{REPOSITORY_OWNER}/{REPOSITORY}.git

    # Change to correct directory
    %cd /content/{REPOSITORY}/

    # Load the helper file now that the repo is cloned
    # from src.setup import configure_environment
    from src import setup

    # Run full environment setup
    gcp_bucket_name, gcp_file_prefix, project_id, DATA_DIR = setup.configure_environment(environment=ENVIRONMENT, GOOGLE_DRIVE_DIR)


Cloning into 'CIBMTR_cancer_outcome_predictions'...
remote: Enumerating objects: 10, done.
remote: Counting objects: 100% (10/10), done.
remote: Compressing objects: 100% (8/8), done.
remote: Total 10 (delta 1), reused 0 (delta 0), pack-reused 0 (from 0)
Receiving objects: 100% (10/10), done.
Resolving deltas: 100% (1/1), done.
/content/CIBMTR_cancer_outcome_predictions
GCP Project Set
Git configured with your user data.


In [4]:
from google.colab import drive
import os

def setup_data_directory(
    data_dir='/content/drive/MyDrive/your_project_folder/CIBMTR_data',
    mount_point='/content/drive',
    mount_drive=True,
):
    """Optionally mount Google Drive and make sure the data directory exists.

    Args:
        data_dir: Directory that should hold the project data. The default is
            the original placeholder path; replace ``your_project_folder``
            with the real Drive folder.
        mount_point: Where Google Drive is mounted when ``mount_drive`` is true.
        mount_drive: Mount Google Drive before creating the directory. Pass
            ``False`` when not running on Colab, or when Drive is already
            mounted by other code.

    Returns:
        ``data_dir`` unchanged, after ensuring the directory exists.

    Raises:
        FileExistsError: If ``data_dir`` exists but is not a directory.
    """
    if mount_drive:
        # Mount Google Drive
        drive.mount(mount_point)

    # exist_ok=True creates missing parents and is a no-op when the directory
    # is already there, without a separate existence check.
    os.makedirs(data_dir, exist_ok=True)

    return data_dir

# Usage: mount Drive and resolve the data directory for this session.
# NOTE(review): this rebinds DATA_DIR, which the first cell also unpacks from
# setup.configure_environment() -- confirm which value later cells should use.
DATA_DIR = setup_data_directory()

# Example: list contents. os.listdir() returns entries in arbitrary order, so
# sort them to keep the printed output stable across runs.
files = sorted(os.listdir(DATA_DIR))
print(f"Files in data directory: {files}")

Mounted at /content/drive
Files in data directory: []
