In [1]:
import numpy as np
import torch
import copy
from metabci.brainda.algorithms.deep_learning import EEGNet_Sparse
from metabci.brainda.algorithms.utils.model_selection import (
    set_random_seeds,
    generate_kfold_indices, match_kfold_indices)
from metabci.brainda.datasets import Wang2016, BETA
# 三个SSVEP Datasets：Nakanishi2015、Wang2016、BETA
from metabci.brainda.paradigms import SSVEP
from skorch.helper import predefined_split

In [2]:
#**************************************************
# BETA dataset: fetch the recordings, epoch them and pick the pre-training data
#**************************************************

BETA_dataset = BETA()
subject_list = [*range(1, 71)]  # subject IDs 1..70
for s in subject_list:
    # Per the original note this sets the data path of every subject in turn.
    BETA_dataset.data_path(subject=s, path="E:\\MetaBCI-master\\mne_data")
BETA_subjects_2S = [*range(1, 16)]   # S1-S15 (the "2 s" group of the paper, see note below)
BETA_subjects_3S = [*range(16, 36)]  # S16-S35, i.e. only part of the "3 s" group S16-S70
events = BETA_dataset.events.keys()
freq_list = [str(BETA_dataset.get_freq(name)) for name in events]  # frequency of every stimulus, as strings
BETA_freq_map = dict(enumerate(freq_list))  # label -> frequency lookup
print(freq_list)  # show the frequencies

# Note from the BETA paper, section 2.6 "Data Preprocessing" (as recorded by the
# original author):
#   - S1-S15:  2 s stimulation window
#   - S16-S70: 3 s stimulation window, 4 s total trial length
# Each trial additionally holds 0.5 s before and 0.5 s after the stimulation
# window, so the longest usable interval is -0.5..2.5 s resp. -0.5..3.5 s.
# NOTE(review): despite their names, both paradigms below are configured with
# the same 1 s analysis window (0.14 s - 1.14 s).


def _make_beta_paradigm():
    """Return a new SSVEP paradigm with the settings shared by both BETA groups.

    A fresh channel list and interval list is created on every call, so the
    returned paradigm objects do not share those argument objects.
    """
    return SSVEP(
        # "In order to validate the data quality by visual inspection, nine
        # parietal and occipital channels (Pz, PO3, PO5, PO4, PO6, POz, O1, Oz
        # and O2) were selected."
        channels=['POZ', 'PZ', 'PO3', 'PO5', 'PO4', 'PO6', 'O1', 'OZ', 'O2'],
        intervals=[(0.14, 1.14)],  # analysis window in seconds
        events=freq_list,          # use every stimulus frequency
        srate=250,                 # sampling rate
    )


paradigm_2s = _make_beta_paradigm()
paradigm_3s = _make_beta_paradigm()

# Per the original note, the BETA recordings are already band-pass filtered
# (3-90 Hz, done in MATLAB), so no additional filter is applied here.
# The BETA_wof variant is unfiltered; to use it, change BETA_URL in tsinghua.py to
# BETA_URL = "https://bci.med.tsinghua.edu.cn/upload/liubingchuan_BETA_wof/"


# Original note on the stored layout: a 4-D tensor [channel, time point, block, condition]
#                                                  [   64,       750,      4,      40    ]


# Options shared by both loading calls
_beta_load_options = {"return_concat": True, "n_jobs": None, "verbose": False}

# Load the S1-S15 group
X_2s, y_2s, meta_2s = paradigm_2s.get_data(
    BETA_dataset,
    subjects=BETA_subjects_2S,
    **_beta_load_options,
)

# Load the S16-S35 group
X_3s, y_3s, meta_3s = paradigm_3s.get_data(
    BETA_dataset,
    subjects=BETA_subjects_3S,
    **_beta_load_options,
)

# Choose which BETA data is used downstream.
# Original open question: the 2 s and 3 s data have different shapes and cannot
# be concatenated directly - zero-pad them to a common size?
# NOTE(review): with the identical 1 s window configured above the two arrays
# presumably have matching trailing dimensions - TODO confirm.
X_BETA, y_BETA, meta_BETA = X_3s, y_3s, meta_3s



--------ssssss, /upload/liubingchuan/S1-S10.tar.gz
--------ssssss, /upload/liubingchuan/S1-S10.tar.gz
--------ssssss, /upload/liubingchuan/S1-S10.tar.gz
--------ssssss, /upload/liubingchuan/S1-S10.tar.gz
--------ssssss, /upload/liubingchuan/S1-S10.tar.gz
--------ssssss, /upload/liubingchuan/S1-S10.tar.gz
--------ssssss, /upload/liubingchuan/S1-S10.tar.gz
--------ssssss, /upload/liubingchuan/S1-S10.tar.gz
--------ssssss, /upload/liubingchuan/S1-S10.tar.gz
--------ssssss, /upload/liubingchuan/S1-S10.tar.gz
--------ssssss, /upload/liubingchuan/S11-S20.tar.gz
--------ssssss, /upload/liubingchuan/S11-S20.tar.gz
--------ssssss, /upload/liubingchuan/S11-S20.tar.gz
--------ssssss, /upload/liubingchuan/S11-S20.tar.gz
--------ssssss, /upload/liubingchuan/S11-S20.tar.gz
--------ssssss, /upload/liubingchuan/S11-S20.tar.gz
--------ssssss, /upload/liubingchuan/S11-S20.tar.gz
--------ssssss, /upload/liubingchuan/S11-S20.tar.gz
--------ssssss, /upload/liubingchuan/S11-S20.tar.gz
--------ssssss, /uploa

In [3]:
#**************************************************
# BETA dataset: k-fold training of the EEGNet_Sparse network.
# Results recorded by the original author for a run whose settings differ from the code below:
#!python3.8 BETA_freezing.py #BETA frozen, learning rate 1e-4, S16~S36  F1=40,D=2,F2=80,Epsilon=20,shared_ratio=0.3,alpha=1.0
# per-fold accuracy: [0.38, 0.44, 0.4375, 0.41875]
# mean accuracy: 0.4190625
#**************************************************

# Select the device (GPU when available, otherwise CPU)
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
print(device)

# Fix the random seed
set_random_seeds(42)
kfold = 4
print(X_BETA.shape)  # original note: (8800, 9, 750), 8800 = 40 stimuli x 4 trials x 55 subjects; the recorded output of this cell shows (3200, 9, 250)
indices = generate_kfold_indices(meta_BETA, kfold=kfold)

# Pre-training stage: network hyper-parameters
F1 = 20
D = 2
F2 = 40
n_channels = X_BETA.shape[1] # number of channels of the input signal
n_samples = X_BETA.shape[2] # number of samples of the input signal (duration * sampling rate)
n_classes = 40
time_kernel_length = 50
shared_ratio = 0
alpha = 1.0
epsilon = 30
BETA_save_path = "BETA_eegnet_Sparse_dropout_1s_0.0.pth"

pre_accs = []  # accuracy of every fold, in fold order
best_test_acc = -1  # best fold accuracy seen so far
best_state_dict = None  # module weights of the best fold

for k in range(kfold):
    # Build a fresh model for this fold
    estimator = EEGNet_Sparse(F1,D,F2,n_channels,n_samples,n_classes,time_kernel_length,shared_ratio,alpha,epsilon)
    estimator.set_params(optimizer__lr=1e-3,device=device)  # alternative value noted: optimizer__lr=3e-3; default noted as 1e-2
    train_ind, validate_ind, test_ind = match_kfold_indices(k, meta_BETA, indices)
    # Merge train_ind and validate_ind into the new training indices
    new_train_ind = np.concatenate([train_ind, validate_ind])
    new_valid_ind = test_ind  # test_ind is used as the validation set
    new_test_ind = test_ind   # test_ind is used as the test set
    # NOTE(review): validation and test indices are the same fold, so any
    # validation-driven model selection inside fit() (the training log shows a
    # checkpoint column) sees the data the accuracy below is computed on; the
    # per-fold accuracy is therefore not a strictly held-out estimate - confirm
    # this is intended.

    print(f"train_ind数量: {len(new_train_ind)}, validate_ind数量: {len(new_valid_ind)}, test_ind数量: {len(new_test_ind)}")
    # Fixed validation dataset handed to skorch through predefined_split
    valid_ds = torch.utils.data.TensorDataset(
        torch.tensor(X_BETA[new_valid_ind], dtype=torch.float64),
        torch.tensor(y_BETA[new_valid_ind], dtype=torch.long)
    )
    estimator.set_params(train_split=predefined_split(valid_ds))
    estimator.fit(X_BETA[new_train_ind], y_BETA[new_train_ind])
    # Evaluate on the test indices
    p_labels = estimator.predict(X_BETA[new_test_ind])
    # Map predicted and true labels to frequency strings for the printout
    p_freqs = [BETA_freq_map [label] for label in p_labels]
    y_freqs = [BETA_freq_map [label] for label in y_BETA[new_test_ind]]
    print("预测频率：", p_freqs)
    print("真实频率：", y_freqs)
    pre_accs.append(np.mean(p_labels == y_BETA[new_test_ind]))
    print(f"第{k+1}折准确率: {pre_accs[-1]}")
    print(f"所有折准确率: {pre_accs}")
    # Keep a copy of the weights of the best-scoring fold
    if pre_accs[-1] > best_test_acc:
        best_test_acc = pre_accs[-1]
        best_state_dict = copy.deepcopy(estimator.module.state_dict())
print("平均准确率：", np.mean(pre_accs))
# Save the weights of the fold with the highest test accuracy
if best_state_dict is not None:
    torch.save(best_state_dict, BETA_save_path)


cuda
(3200, 9, 250)
train_ind数量: 2400, validate_ind数量: 800, test_ind数量: 800
  epoch    train_acc    train_loss    valid_acc    valid_loss    cp      lr     dur
-------  -----------  ------------  -----------  ------------  ----  ------  ------
      1       [36m0.0267[0m        [32m3.8976[0m       [35m0.0250[0m        [31m3.6864[0m     +  0.0010  1.2966
      2       [36m0.0300[0m        [32m3.7997[0m       [35m0.0350[0m        [31m3.6783[0m     +  0.0010  0.4765
      3       [36m0.0304[0m        [32m3.7375[0m       [35m0.0425[0m        [31m3.6646[0m     +  0.0010  0.4740
      4       [36m0.0338[0m        [32m3.7213[0m       [35m0.0563[0m        [31m3.6518[0m     +  0.0010  0.4785
      5       [36m0.0371[0m        [32m3.6894[0m       [35m0.0750[0m        [31m3.6370[0m     +  0.0010  0.4836
      6       [36m0.0417[0m        [32m3.6747[0m       [35m0.0800[0m        [31m3.6197[0m     +  0.0010  0.4763
      7       [36m0.0512[0m       

In [5]:
# Evaluate the saved BETA model, without any further training, on subjects
# that are not part of BETA_subjects_3S.
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
print(device)
test_subjects = [36,37,49,62,66,67,70]  # subjects used for testing; alternative noted: list(range(36,71))
pre_save_path = "BETA_eegnet_Sparse_dropout_1s_0.0.pth"
# Rebuild the network with the same hyper-parameters as the training cell so
# that the saved state dict fits the module.
F1 = 20
D = 2
F2 = 40
n_channels = X_3s.shape[1]  # number of input channels
n_samples = X_3s.shape[2]   # number of samples per trial
n_classes = 40
time_kernel_length = 50
shared_ratio = 0
alpha = 1.0
epsilon = 30
estimator = EEGNet_Sparse(F1,D,F2,n_channels,n_samples,n_classes,time_kernel_length,shared_ratio,alpha,epsilon)
estimator.set_params(device=device)
estimator.initialize()
# map_location remaps the stored tensors onto the device selected above, so a
# checkpoint written on a CUDA machine also loads on a CPU-only one.
estimator.module.load_state_dict(torch.load(pre_save_path, map_location=device))
subject_accs = {}  # str(subject id) -> accuracy as a fraction in [0, 1]

# Evaluate every test subject separately
for test_subj in test_subjects:
    # Load the data of this subject only
    X, y, meta = paradigm_3s.get_data(
        BETA_dataset,
        subjects=[test_subj],
        return_concat=True,
        n_jobs=None,
        verbose=False
    )

    # Predict directly with the loaded model
    preds = estimator.predict(X)
    acc = np.mean(preds == y)
    subject_accs[str(test_subj)] = acc


# Convert every accuracy to a percentage rounded to one decimal
acc_list = [round(acc * 100, 1) for acc in subject_accs.values()]
# Print one line per subject. The keys of subject_accs are iterated (rather than
# test_subjects) so IDs and values stay aligned even if an ID was listed twice.
for subj, acc in zip(subject_accs, acc_list):
    print(f"subject {subj} 的准确率: {acc:.1f}%")

# Print all accuracies (the dict still holds the raw fractions)
print("所有被试的准确率：", subject_accs)

# The mean is deliberately computed from the rounded percentages
mean_acc = np.mean(acc_list)
print(f"所有被试的平均准确率: {mean_acc:.1f}%")

# Extra line: percentages only, comma separated
print("所有被试准确率（无名称）:", ",".join([f"{acc:.1f}" for acc in acc_list]))

cuda
--------ssssss, /upload/liubingchuan/S31-S40.tar.gz
--------ssssss, /upload/liubingchuan/S31-S40.tar.gz
--------ssssss, /upload/liubingchuan/S41-S50.tar.gz
--------ssssss, /upload/liubingchuan/S61-S70.tar.gz
--------ssssss, /upload/liubingchuan/S61-S70.tar.gz
--------ssssss, /upload/liubingchuan/S61-S70.tar.gz
--------ssssss, /upload/liubingchuan/S61-S70.tar.gz
subject 36 的准确率: 51.2%
subject 37 的准确率: 65.0%
subject 49 的准确率: 55.0%
subject 62 的准确率: 68.8%
subject 66 的准确率: 61.9%
subject 67 的准确率: 44.4%
subject 70 的准确率: 46.2%
所有被试的准确率： {'36': 0.5125, '37': 0.65, '49': 0.55, '62': 0.6875, '66': 0.61875, '67': 0.44375, '70': 0.4625}
所有被试的平均准确率: 56.1%
所有被试准确率（无名称）: 51.2,65.0,55.0,68.8,61.9,44.4,46.2


In [6]:
#**************************************************
# Benchmark dataset (Wang2016): dataset object, label map and paradigm
#**************************************************
Bench_dataset = Wang2016()
subject_list = [*range(1, 21)]  # subject IDs 1..20
for s in subject_list:
    # Per the original note this sets the data path of every subject in turn.
    Bench_dataset.data_path(subject=s, path="E:\\MetaBCI-master\\mne_data")
events = Bench_dataset.events.keys()
freq_list = [str(Bench_dataset.get_freq(name)) for name in events]  # frequency of every stimulus, as strings
freq_map = dict(enumerate(freq_list))  # label -> frequency lookup

Bench_subjects = [*range(1, 21)]  # S1-S20 are used for training

# Original note: the longest available analysis window is -0.5 s to 5.5 s,
# with 0.0 s marking stimulus onset; a 1 s window is selected here.
_bench_channels = ['POZ', 'PZ', 'PO3', 'PO5', 'PO4', 'PO6', 'O1', 'OZ', 'O2']  # selected electrodes
_bench_window = [(0.14, 1.14)]  # analysis window in seconds
Bench_paradigm = SSVEP(
    channels=_bench_channels,
    intervals=_bench_window,
    events=freq_list,  # use every stimulus frequency
    srate=250,         # sampling rate
)

# add 5-90Hz bandpass filter in raw hook
# 对原始EEG信号做5-90Hz带通滤波。
def raw_hook(raw, caches):
    """Band-pass filter a raw recording (5-90 Hz) and count the hook stage.

    Parameters
    ----------
    raw : object exposing ``filter(l_freq, h_freq, **kwargs)``
        The raw recording. The return value of ``filter`` is ignored, so the
        filter is presumably applied in place - TODO confirm against the
        library in use.
    caches : dict
        Bookkeeping dictionary. Its ``'raw_stage'`` entry is incremented by
        one; a missing entry counts as -1, so the first call stores 0.

    Returns
    -------
    tuple
        The same ``raw`` and ``caches`` objects that were passed in.
    """
    raw.filter(
        5,
        90,
        l_trans_bandwidth=2,
        h_trans_bandwidth=5,
        phase='zero-double',
    )
    previous_stage = caches.get('raw_stage', -1)
    caches['raw_stage'] = previous_stage + 1
    return raw, caches

# Register the band-pass hook on the paradigm (presumably invoked on each raw
# recording while get_data runs - TODO confirm).
Bench_paradigm.register_raw_hook(raw_hook)



# Load the data of the selected benchmark subjects
# (called "fine-tuning data" in the original note).
_bench_load_options = {"return_concat": True, "n_jobs": None, "verbose": False}
X_Bench, y_Bench, meta_Bench = Bench_paradigm.get_data(
    Bench_dataset,
    subjects=Bench_subjects,
    **_bench_load_options,
)

--------ssssss, /upload/yijun/S1.mat.7z
--------ssssss, /upload/yijun/S2.mat.7z
--------ssssss, /upload/yijun/S3.mat.7z
--------ssssss, /upload/yijun/S4.mat.7z
--------ssssss, /upload/yijun/S5.mat.7z
--------ssssss, /upload/yijun/S6.mat.7z
--------ssssss, /upload/yijun/S7.mat.7z
--------ssssss, /upload/yijun/S8.mat.7z
--------ssssss, /upload/yijun/S9.mat.7z
--------ssssss, /upload/yijun/S10.mat.7z
--------ssssss, /upload/yijun/S11.mat.7z
--------ssssss, /upload/yijun/S12.mat.7z
--------ssssss, /upload/yijun/S13.mat.7z
--------ssssss, /upload/yijun/S14.mat.7z
--------ssssss, /upload/yijun/S15.mat.7z
--------ssssss, /upload/yijun/S16.mat.7z
--------ssssss, /upload/yijun/S17.mat.7z
--------ssssss, /upload/yijun/S18.mat.7z
--------ssssss, /upload/yijun/S19.mat.7z
--------ssssss, /upload/yijun/S20.mat.7z
--------ssssss, /upload/yijun/S1.mat.7z
--------ssssss, /upload/yijun/S2.mat.7z
--------ssssss, /upload/yijun/S3.mat.7z
--------ssssss, /upload/yijun/S4.mat.7z
--------ssssss, /upload/yijun

In [7]:
#**************************************************
# Benchmark dataset: k-fold training of the EEGNet_Sparse network.
# Results recorded by the original author for a run whose settings differ from the code below:
# !python3.8 Bench_freezing.py # Bench, learning rate 1e-4, S1~S20  F1=40,D=2,F2=80,Epsilon=20,shared_ratio=0.3,alpha=1.0
# per-fold accuracy: [0.68125, 0.6325, 0.6075, 0.6575, 0.655, 0.64375]
# mean accuracy: 0.6462500000000001
#**************************************************
# Select the device (GPU when available, otherwise CPU)
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
print(device)
# Fix the random seed
set_random_seeds(42)
kfold = 6
print(X_Bench.shape)  # original note: (2160, 9, 1250); the recorded output of this cell shows (4800, 9, 250)
indices = generate_kfold_indices(meta_Bench, kfold=kfold)

# Pre-training stage: network hyper-parameters
F1 = 20
D = 2
F2 = 40
n_channels = X_Bench.shape[1] # number of channels of the input signal
n_samples = X_Bench.shape[2] # number of samples of the input signal (duration * sampling rate)
n_classes = 40
time_kernel_length = 50
shared_ratio = 0
alpha = 1.0
epsilon = 30

Bench_save_path = "Bench_eegnet_Sparse_dropout_1s_0.0.pth"

pre_accs = []  # accuracy of every fold, in fold order
best_test_acc = -1  # best fold accuracy seen so far
best_state_dict = None  # module weights of the best fold

for k in range(kfold):
    # Build a fresh model for this fold
    estimator = EEGNet_Sparse(F1,D,F2,n_channels,n_samples,n_classes,time_kernel_length,shared_ratio,alpha,epsilon)
    estimator.set_params(optimizer__lr=1e-3,device=device) # alternative value noted: optimizer__lr=3e-3
    train_ind, validate_ind, test_ind = match_kfold_indices(k, meta_Bench, indices)
    # Merge train_ind and validate_ind into the new training indices
    new_train_ind = np.concatenate([train_ind, validate_ind])
    new_valid_ind = test_ind  # test_ind is used as the validation set
    new_test_ind = test_ind   # test_ind is used as the test set
    # NOTE(review): validation and test indices are the same fold, so any
    # validation-driven model selection inside fit() (the training log shows a
    # checkpoint column) sees the data the accuracy below is computed on; the
    # per-fold accuracy is therefore not a strictly held-out estimate - confirm
    # this is intended.

    print(f"train_ind数量: {len(new_train_ind)}, validate_ind数量: {len(new_valid_ind)}, test_ind数量: {len(new_test_ind)}")
    # Fixed validation dataset handed to skorch through predefined_split
    valid_ds = torch.utils.data.TensorDataset(
        torch.tensor(X_Bench[new_valid_ind], dtype=torch.float64),
        torch.tensor(y_Bench[new_valid_ind], dtype=torch.long)
    )
    estimator.set_params(train_split=predefined_split(valid_ds))
    estimator.fit(X_Bench[new_train_ind], y_Bench[new_train_ind])
    # Evaluate on the test indices
    p_labels = estimator.predict(X_Bench[new_test_ind])
    # Map predicted and true labels to frequency strings for the printout
    p_freqs = [freq_map[label] for label in p_labels]
    y_freqs = [freq_map[label] for label in y_Bench[new_test_ind]]
    print("预测频率：", p_freqs)
    print("真实频率：", y_freqs)
    pre_accs.append(np.mean(p_labels == y_Bench[new_test_ind]))
    print(f"第{k+1}折准确率: {pre_accs[-1]}")
    # Keep a copy of the weights of the best-scoring fold
    if pre_accs[-1] > best_test_acc:
        best_test_acc = pre_accs[-1]
        best_state_dict = copy.deepcopy(estimator.module.state_dict())
print(f"所有折准确率: {pre_accs}")
print("平均准确率：", np.mean(pre_accs))
# Save the weights of the fold with the highest test accuracy
if best_state_dict is not None:
    torch.save(best_state_dict, Bench_save_path)

cuda
(4800, 9, 250)
train_ind数量: 4000, validate_ind数量: 800, test_ind数量: 800
  epoch    train_acc    train_loss    valid_acc    valid_loss    cp      lr     dur
-------  -----------  ------------  -----------  ------------  ----  ------  ------
      1       [36m0.0267[0m        [32m3.8666[0m       [35m0.0338[0m        [31m3.6862[0m     +  0.0010  0.9993
      2       [36m0.0325[0m        [32m3.7452[0m       [35m0.0462[0m        [31m3.6678[0m     +  0.0010  0.7216
      3       [36m0.0355[0m        [32m3.7027[0m       [35m0.0612[0m        [31m3.6474[0m     +  0.0010  0.7108
      4       [36m0.0442[0m        [32m3.6699[0m       [35m0.0963[0m        [31m3.6202[0m     +  0.0010  0.7197
      5       [36m0.0563[0m        [32m3.6322[0m       [35m0.1138[0m        [31m3.5884[0m     +  0.0010  0.7239
      6       [36m0.0683[0m        [32m3.6005[0m       [35m0.1363[0m        [31m3.5438[0m     +  0.0010  0.7284
      7       [36m0.0862[0m       

In [9]:
# Evaluate the saved Benchmark model, without any further training, on
# subjects that are not part of Bench_subjects.
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
print(device)
test_subjects = [22,24,27,28,31,34,35]  # subjects used for testing
pre_save_path = "Bench_eegnet_Sparse_dropout_1s_0.0.pth"
# Rebuild the network with the same hyper-parameters as the training cell so
# that the saved state dict fits the module.
F1 = 20
D = 2
F2 = 40
n_channels = X_Bench.shape[1]  # number of channels of the input signal
n_samples = X_Bench.shape[2]   # number of samples of the input signal (duration * sampling rate)
n_classes = 40
time_kernel_length = 50
shared_ratio = 0
alpha = 1.0
epsilon = 30
estimator = EEGNet_Sparse(F1,D,F2,n_channels,n_samples,n_classes,time_kernel_length,shared_ratio,alpha,epsilon)
estimator.set_params(device=device)
estimator.initialize()
# map_location remaps the stored tensors onto the device selected above, so a
# checkpoint written on a CUDA machine also loads on a CPU-only one.
estimator.module.load_state_dict(torch.load(pre_save_path, map_location=device))
subject_accs = {}  # str(subject id) -> accuracy as a fraction in [0, 1]

# Evaluate every test subject separately
for test_subj in test_subjects:
    # Load the data of this subject only
    X, y, meta = Bench_paradigm.get_data(
        Bench_dataset,
        subjects=[test_subj],
        return_concat=True,
        n_jobs=None,
        verbose=False
    )

    # Predict directly with the loaded model
    preds = estimator.predict(X)
    acc = np.mean(preds == y)
    subject_accs[str(test_subj)] = acc

# Convert every accuracy to a percentage rounded to one decimal
acc_list = [round(acc * 100, 1) for acc in subject_accs.values()]
# Print one line per subject. The keys of subject_accs are iterated (rather than
# test_subjects) so IDs and values stay aligned even if an ID was listed twice.
for subj, acc in zip(subject_accs, acc_list):
    print(f"subject {subj} 的准确率: {acc:.1f}%")

# Print all accuracies (the dict still holds the raw fractions)
print("所有被试的准确率：", subject_accs)

# The mean is deliberately computed from the rounded percentages
mean_acc = np.mean(acc_list)
print(f"所有被试的平均准确率: {mean_acc:.1f}%")

# Extra line: percentages only, comma separated
print("所有被试准确率（无名称）:", ",".join([f"{acc:.1f}" for acc in acc_list]))

cuda
--------ssssss, /upload/yijun/S22.mat.7z
--------ssssss, /upload/yijun/S24.mat.7z
--------ssssss, /upload/yijun/S27.mat.7z
--------ssssss, /upload/yijun/S28.mat.7z
--------ssssss, /upload/yijun/S31.mat.7z
--------ssssss, /upload/yijun/S34.mat.7z
--------ssssss, /upload/yijun/S35.mat.7z
subject 22 的准确率: 77.1%
subject 24 的准确率: 77.9%
subject 27 的准确率: 83.8%
subject 28 的准确率: 69.6%
subject 31 的准确率: 77.5%
subject 34 的准确率: 67.1%
subject 35 的准确率: 80.4%
所有被试的准确率： {'22': 0.7708333333333334, '24': 0.7791666666666667, '27': 0.8375, '28': 0.6958333333333333, '31': 0.775, '34': 0.6708333333333333, '35': 0.8041666666666667}
所有被试的平均准确率: 76.2%
所有被试准确率（无名称）: 77.1,77.9,83.8,69.6,77.5,67.1,80.4
