In [1]:
# Load the dataset archive; later cells read its arrays by key.
from numpy import load
import numpy as np

# For an .npz archive, `load` returns a lazy NpzFile: member arrays are read
# from disk when indexed (data['key']), and `data.files` lists the stored keys.
# The file path is relative to the notebook's working directory.
data = load('integrated_eeg_dataset.npz')

In [2]:
# Summarize the raw EEG array: shape, dtype, and per-axis sizes.
print("--- X_raw (Raw EEG signals) ---")

# Each `data[key]` lookup on the NpzFile reads the array from the archive
# again, so fetch X_raw once and keep only the metadata this report needs.
x_raw = data['X_raw']
x_raw_shape, x_raw_dtype = x_raw.shape, x_raw.dtype
del x_raw  # do not keep the large array alive just to print its metadata

# Derive the axis sizes from the actual shape instead of hard-coding them, so
# the report cannot drift from the data. The axis order follows the
# (samples, time_points, channels) layout stated in the shape line below.
_, n_time_points, n_channels = x_raw_shape

print(f"  Shape: {x_raw_shape} = (samples, time_points, channels)")
print(f"  dtype: {x_raw_dtype}")
print(f"  Channels: {n_channels} EEG electrodes")
print(f"  Time points: {n_time_points} per sample")

--- X_raw (Raw EEG signals) ---
  Shape: (101916, 128, 19) = (samples, time_points, channels)
  dtype: float64
  Channels: 19 EEG electrodes
  Time points: 128 per sample


In [3]:
# Top-level overview: how many samples there are and which arrays the archive holds.
print("=== EEG Alzheimer Dataset Overview ===\n")

# The first axis of X_raw is the sample axis.
n_samples, *_ = data['X_raw'].shape
print(f"Total samples: {n_samples}")

# `files` lists the array names stored in the archive.
archive_keys = list(data.files)
print(f"Keys: {archive_keys}\n")

=== EEG Alzheimer Dataset Overview ===

Total samples: 101916
Keys: ['X_raw', 'y_labels', 'X_features']



In [4]:
# Summarize the per-sample metadata array.
print("\n--- y_labels (Sample metadata) ---")

# Fetch y_labels once: every `data[key]` lookup re-reads the array from the
# archive, and the original cell did that three times.
y_labels = data['y_labels']

print(f"  Shape: {y_labels.shape}")
# NOTE(review): this prints the first row of y_labels as an example record;
# the archive does not carry column names, so "Columns" here means "the
# values found in each column of one sample".
print(f"  Columns: {y_labels[0]}")
# Column index 2 is the one this notebook treats as the diagnosis label.
print(f"  Unique diagnoses: {np.unique(y_labels[:, 2])}")


--- y_labels (Sample metadata) ---
  Shape: (101916, 3)
  Columns: ['0' '10' 'AD-Auditory']
  Unique diagnoses: ['AD-Auditory' 'ADFSU' 'ADFTD' 'ADSZ' 'APAVA-19']


In [5]:
# Summarize the extracted-feature matrix.
print("\n--- X_features (Extracted features) ---")

# Fetch X_features once: each `data[key]` lookup re-reads the array from the
# archive, so indexing twice doubles the I/O for no benefit.
x_features = data['X_features']

print(f"  Shape: {x_features.shape} = (samples, features)")
print(f"  dtype: {x_features.dtype}")


--- X_features (Extracted features) ---
  Shape: (101916, 76) = (samples, features)
  dtype: float64


In [6]:
# Report how many samples carry each diagnosis label, with percentages.
print("\n--- Sample breakdown ---")

# Read the label column once. The original loop indexed `data['y_labels']`
# on every iteration, re-reading the array from the archive each time, and
# rescanned the whole column per label.
diagnoses = data['y_labels'][:, 2]
n_total = len(diagnoses)

# A single pass yields the sorted unique labels and their counts together.
unique_labels, label_counts = np.unique(diagnoses, return_counts=True)
for label, count in zip(unique_labels, label_counts):
    print(f"  {label}: {count} samples ({100*count/n_total:.1f}%)")


--- Sample breakdown ---
  AD-Auditory: 30654 samples (30.1%)
  ADFSU: 2490 samples (2.4%)
  ADFTD: 63783 samples (62.6%)
  ADSZ: 633 samples (0.6%)
  APAVA-19: 4356 samples (4.3%)
