In [2]:
import kagglehub
import shutil
import os
import pickle
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
from pathlib import Path


  from .autonotebook import tqdm as notebook_tqdm


In [7]:
def download_wesad_dataset():
    """Fetch the WESAD dataset through kagglehub.

    Returns:
        Whatever ``kagglehub.dataset_download`` returns for the WESAD
        dataset handle (printed as the path to the dataset files), or
        ``None`` when any exception is raised along the way. Failures are
        reported with ``print`` instead of being propagated.
    """
    dataset_handle = "orvile/wesad-wearable-stress-affect-detection-dataset"
    try:
        dataset_dir = kagglehub.dataset_download(dataset_handle)
        print("Path to dataset files:", dataset_dir)
    except Exception as exc:
        # Best-effort: report the problem and signal failure with None.
        print(f"Error downloading dataset: {exc}")
        return None
    return dataset_dir

# Run the download and keep the returned path (None if the download failed).
download_path = download_wesad_dataset()

Path to dataset files: C:\Users\Joseph\.cache\kagglehub\datasets\orvile\wesad-wearable-stress-affect-detection-dataset\versions\1


In [4]:
def setup_project_structure(project_root=r"C:\Users\Joseph\generative-health-models"):
    """Create the organized project directory structure.

    Args:
        project_root: Directory under which the tree is created. The default
            is the location this notebook originally hard-coded, so a call
            with no arguments behaves as before; pass another path (str or
            path-like) to build the tree elsewhere.

    Returns:
        The project root that was used, as a string.
    """
    project_root = os.fspath(project_root)

    # Sub-directories, relative to the root, that make up the project layout.
    directories = [
        "data/raw/wesad",
        "data/processed",
        "data/synthetic",
        "models/tc_multigan",
        "models/diffusion",
        "notebooks",
        "src/data",
        "src/models",
        "src/evaluation",
        "results/figures",
        "results/metrics",
        "dashboard/backend",
        "dashboard/frontend",
    ]

    for directory in directories:
        # normpath turns the "/" inside the relative names into the platform
        # separator, so the reported paths do not mix "\" and "/" on Windows.
        dir_path = os.path.normpath(os.path.join(project_root, directory))
        # Check before creating so the message says what actually happened.
        already_present = os.path.isdir(dir_path)
        os.makedirs(dir_path, exist_ok=True)
        status = "Exists" if already_present else "Created"
        print(f"{status}: {dir_path}")

    return project_root

# Create the project directory tree and keep its root path; copy_wesad_data
# reads this module-level project_root to build its target directory.
project_root = setup_project_structure()

Created: C:\Users\Joseph\generative-health-models\data/raw/wesad
Created: C:\Users\Joseph\generative-health-models\data/processed
Created: C:\Users\Joseph\generative-health-models\data/synthetic
Created: C:\Users\Joseph\generative-health-models\models/tc_multigan
Created: C:\Users\Joseph\generative-health-models\models/diffusion
Created: C:\Users\Joseph\generative-health-models\notebooks
Created: C:\Users\Joseph\generative-health-models\src/data
Created: C:\Users\Joseph\generative-health-models\src/models
Created: C:\Users\Joseph\generative-health-models\src/evaluation
Created: C:\Users\Joseph\generative-health-models\results/figures
Created: C:\Users\Joseph\generative-health-models\results/metrics
Created: C:\Users\Joseph\generative-health-models\dashboard/backend
Created: C:\Users\Joseph\generative-health-models\dashboard/frontend


In [5]:
def copy_wesad_data(source_path=None, target_path=None):
    """Copy WESAD data from the kagglehub cache into the project directory.

    Args:
        source_path: Directory to copy from. When omitted, the notebook-level
            ``download_path`` (set by the download cell) is used if it exists
            and is not empty/None; otherwise the originally hard-coded
            kagglehub cache location is used.
        target_path: Directory to copy into. When omitted, it is built as
            ``<project_root>/data/raw/wesad`` from the notebook-level
            ``project_root``.

    Returns:
        None. Progress and problems are reported with ``print``; exceptions
        raised while copying or listing are caught and printed, not raised.
    """
    if source_path is None:
        # Prefer the path kagglehub actually returned on this machine; the
        # literal below is only the legacy fallback from the original cell.
        source_path = globals().get("download_path") or (
            r"C:\Users\Joseph\.cache\kagglehub\datasets\orvile\wesad-wearable-stress-affect-detection-dataset\versions\1"
        )

    if target_path is None:
        target_path = os.path.join(project_root, "data", "raw", "wesad")

    try:
        if not os.path.exists(source_path):
            print(f"Source path not found: {source_path}")
            return

        # dirs_exist_ok lets the cell be re-run over an existing copy.
        shutil.copytree(source_path, target_path, dirs_exist_ok=True)
        print(f"Dataset copied to: {target_path}")

        # List the top-level contents to verify the copy (sorted so the
        # output is the same on every run and platform).
        print("\nDataset contents:")
        for item in sorted(os.listdir(target_path)):
            item_path = os.path.join(target_path, item)
            if os.path.isfile(item_path):
                size_mb = os.path.getsize(item_path) / (1024 * 1024)
                print(f"  📄 {item} ({size_mb:.1f} MB)")
            else:
                print(f"  📁 {item}/")

    except Exception as e:
        print(f"Error copying dataset: {e}")

# Copy the dataset into the project's data/raw/wesad directory
# (requires project_root from the project-structure cell).
copy_wesad_data()

Dataset copied to: C:\Users\Joseph\generative-health-models\data\raw\wesad

Dataset contents:
  📁 WESAD/
