# Set up environment

In [1]:
%load_ext autoreload
%autoreload 2
%matplotlib inline

In [2]:
# Test if GPU is available
# Note that CUDA below 12.1 can have bugs
import torch
print(torch.cuda.is_available())
# print(torch.cuda.get_device_name(0))
print(torch.version.cuda)
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

True
12.1


In [3]:
#%% import libraries
import os
from collections import defaultdict
import sys

import matplotlib.pyplot as plt
import pandas as pd
import seaborn as sns
import copy
import numpy as np
import numpy.random
from numpy.fft import fft as fft
from numpy.fft import ifft as ifft
import pickle
from sklearn.linear_model import PoissonRegressor
from sklearn.model_selection import KFold
from sklearn.manifold import TSNE
import scipy.stats
from scipy.stats import wilcoxon, chi2
import scipy.interpolate 
import scipy.signal
from scipy import linalg
from scipy.special import rel_entr
from tqdm import tqdm
import pandas as pd
import joblib
import logging

import statsmodels.api as sm
import statsmodels.genmod.generalized_linear_model as smm

import torch
from torch.autograd import Variable
from torch.nn import functional as F
import torch.nn as nn
import torch.optim as optim

In [4]:
# import my code
import utility_functions as utils
import GLM
from DataLoader import Allen_dataset, Allen_dataloader_multi_session, Simple_dataloader_from_spikes
from model_trainer import Trainer

utils.set_seed(0)

  from .autonotebook import tqdm as notebook_tqdm


# Load data

In [None]:
# Load GLM neuron dataset
file_name = '/home/qix/user_data/EIF_simulation_dataset/synthetic_data_GLM.npz'
data = np.load(file_name)
spikes = data['spikes'][:,:,:]
nneuron = spikes.shape[1]//2
synthetic_GLM_dataloader = Simple_dataloader_from_spikes(
    [spikes[:,:nneuron,:], spikes[:,nneuron:,:]],
    npadding=50,
    train_ratio=0.7,
    val_ratio=0.1,
    batch_size=64,
    verbose=True
)

# Load EIF neuron dataset
file_name = f'/home/qix/user_data/EIF_simulation_dataset/synthetic_data_EIF_connTrue.npz'
data = np.load(file_name, allow_pickle=True)
spikes = data['spikes'][:,:,:]
nneuron = spikes.shape[1]//2
synthetic_EIF_dataloader = Simple_dataloader_from_spikes(
    [spikes[:,:nneuron,:], spikes[:,nneuron:,:]],
    npadding=50,
    train_ratio=0.7,
    val_ratio=0.1,
    batch_size=64,
    verbose=True
)

# Load real dataset
if sys.platform == 'linux':
    data_path = '/home/qix/user_data/allen_spike_trains/single_sessions.joblib'
else:
    data_path = 'D:/ecephys_cache_dir/single_sessions.joblib'
real_dataloader = joblib.load(data_path)

In [90]:
spikes = np.zeros((250, 352, 38*64+35))
trial_idx = 0
for batch in real_dataloader.test_loader:
    spikes[:, :, trial_idx:trial_idx+batch['spike_trains'].shape[2]] = batch['spike_trains']
    trial_idx += batch['spike_trains'].shape[2]
acc_nneuron = [0] + list(np.cumsum(real_dataloader.sessions[757216464].nneuron_list))

real_dataloader_fast = Simple_dataloader_from_spikes(
    [spikes[:,acc_nneuron[i]:acc_nneuron[i+1],:] for i in range(len(acc_nneuron)-1)],
    npadding=50,
    train_ratio=0.7,
    val_ratio=0.1,
    batch_size=64,
    verbose=True
)

# Ablation experiments

In [93]:
# Settings for all ablation experiments
verbose = False
# datasets = [synthetic_GLM_dataloader, synthetic_EIF_dataloader]
datasets = [synthetic_GLM_dataloader, synthetic_EIF_dataloader, real_dataloader_fast]
nrep = 5
ckp_path = '/home/qix/user_data/VAETransformer_checkpoint_ablation'

params_set = {}
params_set[0] = {
    # B-spline basis
    'num_B_spline_basis': 10,
    # Transformer VAE's settings
    'downsample_factor': 10,
    'transformer_num_layers': 2,
    'transformer_d_model': 128,
    'transformer_dim_feedforward': 512,
    'transformer_vae_output_dim': 8,
    'transformer_dropout': 0.0,
    'transformer_nhead': 1,
    'stimulus_nfactor': 2,
    'stimulus_decoder_inter_dim_factor': 2,
    'beta': 1.0,
    'use_area_specific_decoder': True,
    'use_area_specific_encoder': True,
    'use_cls': False,
    # Coupling's settings
    'coupling_basis_peaks_max': 7,
    'coupling_basis_num': 3,
    'coupling_nsubspace': 1,
    'use_self_coupling': True,
    # Coupling strength latent's settings
    'K_sigma2': 1.0,
    'K_tau': 100,
    'coupling_strength_nlatent': 1,
    # Self-history's settings
    'self_history_basis_peaks_max': 2,
    'self_history_basis_num': 3,
    'self_history_basis_nonlinear': 0.7,
    # Penalty settings
    'penalty_smoothing_spline': 1e3,
    'penalty_coupling_subgroup': 1e-5,
    'penalty_diff_loading': None,
    'penalty_loading_similarity': None,
    # Training settings
    'batch_size': 64,
    'sample_latent': False,
    'lr': 1e-3,
    'epoch_warm_up': 0,
    'epoch_patience': 3,
    'epoch_max': 200,
    'tol': 1e-5,
    'weight_decay': 0,
    'lr_transformer': 1e-4,
    'lr_sti': 1e-2,
    'lr_cp': 1e-2,
    'lr_self_history': 1e-2,
}

params_set[1] = {
    # B-spline basis
    'num_B_spline_basis': 20,
    # Transformer VAE's settings
    'downsample_factor': 10,
    'transformer_num_layers': 2,
    'transformer_d_model': 128,
    'transformer_dim_feedforward': 512,
    'transformer_vae_output_dim': 16,
    'transformer_dropout': 0.0,
    'transformer_nhead': 1,
    'stimulus_nfactor': 1,
    'stimulus_decoder_inter_dim_factor': 2,
    'beta': 1.0,
    'use_area_specific_decoder': True,
    'use_area_specific_encoder': True,
    'use_cls': False,
    # Coupling's settings
    'coupling_basis_peaks_max': 5,
    'coupling_basis_num': 3,
    'coupling_nsubspace': 1,
    'use_self_coupling': True,
    # Coupling strength latent's settings
    'K_sigma2': 1.0,
    'K_tau': 100,
    'coupling_strength_nlatent': 1,
    # Self-history's settings
    'self_history_basis_peaks_max': 1.5,
    'self_history_basis_num': 3,
    'self_history_basis_nonlinear': 1,
    # Penalty settings
    'penalty_smoothing_spline': 1e3,
    'penalty_coupling_subgroup': 1e-5,
    'penalty_diff_loading': None,
    'penalty_loading_similarity': None,
    # Training settings
    'batch_size': 64,
    'sample_latent': False,
    'lr': 1e-3,
    'epoch_warm_up': 0,
    'epoch_patience': 3,
    'epoch_max': 200,
    'tol': 1e-5,
    'weight_decay': 0,
    'lr_transformer': 1e-4,
    'lr_sti': 1e-2,
    'lr_cp': 1e-2,
    'lr_self_history': 1e-2,
}

params_set[2] = {
    # B-spline basis
    'num_B_spline_basis': 10,
    # Transformer VAE's settings
    'downsample_factor': 10,
    'transformer_num_layers': 2,
    'transformer_d_model': 128,
    'transformer_dim_feedforward': 512,
    'transformer_vae_output_dim': 12,
    'transformer_dropout': 0.0,
    'transformer_nhead': 1,
    'stimulus_nfactor': 2,
    'stimulus_decoder_inter_dim_factor': 2,
    'beta': 1.0,
    'use_area_specific_decoder': True,
    'use_area_specific_encoder': True,
    'use_cls': False,
    # Coupling's settings
    'coupling_basis_peaks_max': 7,
    'coupling_basis_num': 3,
    'coupling_nsubspace': 1,
    'use_self_coupling': True,
    # Coupling strength latent's settings
    'K_sigma2': 1.0,
    'K_tau': 100,
    'coupling_strength_nlatent': 1,
    # Self-history's settings
    'self_history_basis_peaks_max': 1.5,
    'self_history_basis_num': 3,
    'self_history_basis_nonlinear': 1,
    # Penalty settings
    'penalty_smoothing_spline': 1e3,
    'penalty_coupling_subgroup': 1e-5,
    'penalty_diff_loading': None,
    'penalty_loading_similarity': None,
    # Training settings
    'batch_size': 64,
    'sample_latent': False,
    'lr': 1e-3,
    'epoch_warm_up': 0,
    'epoch_patience': 3,
    'epoch_max': 50,
    'tol': 1e-5,
    'weight_decay': 0,
    'lr_transformer': 1e-4,
    'lr_sti': 1e-2,
    'lr_cp': 1e-2,
    'lr_self_history': 1e-2,
}

In [94]:
# Full model
results_ablation = np.zeros((len(datasets), nrep))

for idata, data_to_use in enumerate(datasets):
    for irep in range(nrep):

        trainer = Trainer(data_to_use, ckp_path, params_set[idata])
        
        # First step: train the model with a trial-invariant stimulus effect
        trainer.train(
            include_stimulus=True,
            include_coupling=False,
            include_self_history=False,
            fix_stimulus=True,
            fix_latents=True,
            verbose=verbose,
        )
        # Second step: train the model with a trial-varying stimulus effect
        # trainer.make_optimizer(frozen_params=['sti_readout'])
        trainer.make_optimizer(frozen_params=['sti_inhomo', ]) # We are fixing the trial-invariant stimulus effect
        trainer.train(
            include_stimulus=True,
            include_coupling=False,
            include_self_history=False,
            fix_stimulus=False,
            fix_latents=True,
            verbose=verbose,
        )

        trainer.make_optimizer(frozen_params=['transformer_encoder', 'to_latent', 'token_converter'])
        # trainer.make_optimizer(frozen_params=[])
        trainer.train(
            include_stimulus=True,
            include_coupling=True,
            include_self_history=False,
            fix_stimulus=False,
            fix_latents=True,
            verbose=verbose,
        )

        # trainer.make_optimizer(frozen_params=['transformer_encoder', 'to_latent', 'token_converter'])
        trainer.make_optimizer(frozen_params=['transformer_encoder', 'to_latent', 'token_converter',
            'sti_readout', 'sti_decoder', 'sti_inhomo', 'cp_latents_readout', 'cp_time_varying_coef_offset', 
            'cp_beta_coupling', 'cp_weight_sending', 'cp_weight_receiving'])
        # trainer.make_optimizer(frozen_params=[])
        test_loss = trainer.train(
            include_stimulus=True,
            include_coupling=True,
            include_self_history=True,
            fix_stimulus=False,
            fix_latents=True,
            verbose=verbose,
        )

        results_ablation[idata, irep] = test_loss

np.save('/home/qix/user_data/EIF_simulation_dataset/results_ablation_full_model.npy', results_ablation)



Model initialized. Training on cuda


 24%|██▎       | 47/200 [00:03<00:12, 12.00it/s]
  self.model.load_state_dict(torch.load(self.temp_best_model_path))
 50%|█████     | 101/200 [00:10<00:10,  9.46it/s]
 10%|█         | 20/200 [00:02<00:21,  8.40it/s]
 27%|██▋       | 54/200 [00:06<00:17,  8.35it/s]


Model initialized. Training on cuda


 22%|██▎       | 45/200 [00:03<00:12, 12.88it/s]
 60%|██████    | 120/200 [00:13<00:08,  8.94it/s]
 10%|█         | 20/200 [00:02<00:22,  7.91it/s]
 27%|██▋       | 54/200 [00:06<00:16,  8.77it/s]


Model initialized. Training on cuda


 24%|██▍       | 48/200 [00:03<00:11, 13.66it/s]
 38%|███▊      | 77/200 [00:08<00:13,  9.22it/s]
 11%|█         | 22/200 [00:03<00:25,  6.93it/s]
 26%|██▌       | 52/200 [00:06<00:18,  8.10it/s]


Model initialized. Training on cuda


 20%|██        | 40/200 [00:03<00:13, 11.52it/s]
 30%|███       | 60/200 [00:06<00:15,  9.03it/s]
 10%|▉         | 19/200 [00:02<00:22,  8.19it/s]
 27%|██▋       | 54/200 [00:07<00:20,  7.30it/s]


Model initialized. Training on cuda


 24%|██▍       | 49/200 [00:03<00:10, 13.83it/s]
 26%|██▋       | 53/200 [00:05<00:15,  9.76it/s]
 11%|█         | 22/200 [00:02<00:18,  9.61it/s]
 27%|██▋       | 54/200 [00:06<00:16,  8.96it/s]


Model initialized. Training on cuda


 34%|███▎      | 67/200 [00:05<00:10, 13.27it/s]
 16%|█▌        | 31/200 [00:03<00:17,  9.82it/s]
 12%|█▏        | 23/200 [00:02<00:17,  9.94it/s]
 28%|██▊       | 56/200 [00:06<00:17,  8.18it/s]


Model initialized. Training on cuda


 30%|███       | 61/200 [00:04<00:11, 12.60it/s]
 24%|██▎       | 47/200 [00:04<00:15,  9.96it/s]
  9%|▉         | 18/200 [00:02<00:22,  8.16it/s]
 28%|██▊       | 56/200 [00:06<00:16,  8.95it/s]


Model initialized. Training on cuda


 34%|███▍      | 69/200 [00:05<00:09, 13.47it/s]
 29%|██▉       | 58/200 [00:06<00:16,  8.58it/s]
 10%|▉         | 19/200 [00:02<00:24,  7.46it/s]
 28%|██▊       | 55/200 [00:06<00:16,  8.65it/s]


Model initialized. Training on cuda


 33%|███▎      | 66/200 [00:04<00:09, 13.84it/s]
 24%|██▍       | 49/200 [00:04<00:15,  9.96it/s]
  8%|▊         | 16/200 [00:01<00:20,  8.86it/s]
 28%|██▊       | 56/200 [00:07<00:19,  7.50it/s]


Model initialized. Training on cuda


 36%|███▌      | 71/200 [00:05<00:09, 13.79it/s]
 22%|██▏       | 44/200 [00:04<00:17,  9.08it/s]
 10%|█         | 21/200 [00:02<00:20,  8.89it/s]
 28%|██▊       | 56/200 [00:06<00:16,  8.86it/s]


Model initialized. Training on cuda


 66%|██████▌   | 33/50 [00:19<00:10,  1.67it/s]
 72%|███████▏  | 36/50 [00:30<00:11,  1.19it/s]
 34%|███▍      | 17/50 [00:22<00:44,  1.34s/it]
 32%|███▏      | 16/50 [00:22<00:47,  1.39s/it]


Model initialized. Training on cuda


 66%|██████▌   | 33/50 [00:20<00:10,  1.60it/s]
100%|██████████| 50/50 [00:40<00:00,  1.22it/s]
 20%|██        | 10/50 [00:14<00:57,  1.43s/it]
 26%|██▌       | 13/50 [00:18<00:51,  1.40s/it]


Model initialized. Training on cuda


 66%|██████▌   | 33/50 [00:21<00:11,  1.54it/s]
100%|██████████| 50/50 [00:39<00:00,  1.26it/s]
 20%|██        | 10/50 [00:13<00:55,  1.39s/it]
 32%|███▏      | 16/50 [00:21<00:45,  1.34s/it]


Model initialized. Training on cuda


 66%|██████▌   | 33/50 [00:20<00:10,  1.62it/s]
 80%|████████  | 40/50 [00:33<00:08,  1.19it/s]
 18%|█▊        | 9/50 [00:13<00:59,  1.46s/it]
 32%|███▏      | 16/50 [00:21<00:45,  1.35s/it]


Model initialized. Training on cuda


 66%|██████▌   | 33/50 [00:19<00:10,  1.69it/s]
100%|██████████| 50/50 [00:41<00:00,  1.21it/s]
 36%|███▌      | 18/50 [00:23<00:42,  1.32s/it]
 26%|██▌       | 13/50 [00:18<00:51,  1.40s/it]


In [95]:
# Without Transformer encoder model
results_ablation = np.zeros((len(datasets), nrep))

for idata, data_to_use in enumerate(datasets):
    for irep in range(nrep):

        trainer = Trainer(data_to_use, ckp_path, params_set[idata])
        
        # First step: train the model with a trial-invariant stimulus effect
        trainer.train(
            include_stimulus=True,
            include_coupling=False,
            include_self_history=False,
            fix_stimulus=True,
            fix_latents=True,
            verbose=verbose,
        )

        trainer.make_optimizer(frozen_params=['transformer_encoder', 'to_latent', 'token_converter'])
        # trainer.make_optimizer(frozen_params=[])
        trainer.train(
            include_stimulus=True,
            include_coupling=True,
            include_self_history=False,
            fix_stimulus=False,
            fix_latents=True,
            verbose=verbose,
        )

        # trainer.make_optimizer(frozen_params=['transformer_encoder', 'to_latent', 'token_converter'])
        trainer.make_optimizer(frozen_params=['transformer_encoder', 'to_latent', 'token_converter',
            'sti_readout', 'sti_decoder', 'sti_inhomo', 'cp_latents_readout', 'cp_time_varying_coef_offset', 
            'cp_beta_coupling', 'cp_weight_sending', 'cp_weight_receiving'])
        # trainer.make_optimizer(frozen_params=[])
        test_loss = trainer.train(
            include_stimulus=True,
            include_coupling=True,
            include_self_history=True,
            fix_stimulus=False,
            fix_latents=True,
            verbose=verbose,
        )

        results_ablation[idata, irep] = test_loss

np.save('/home/qix/user_data/EIF_simulation_dataset/results_ablation_wo_encoder.npy', results_ablation)

Model initialized. Training on cuda


 22%|██▏       | 44/200 [00:03<00:12, 12.47it/s]
 10%|█         | 21/200 [00:02<00:18,  9.42it/s]
 30%|███       | 60/200 [00:07<00:17,  8.08it/s]


Model initialized. Training on cuda


 25%|██▌       | 50/200 [00:04<00:12, 12.45it/s]
 52%|█████▎    | 105/200 [00:13<00:12,  7.80it/s]
 28%|██▊       | 56/200 [00:06<00:16,  8.57it/s]


Model initialized. Training on cuda


 24%|██▍       | 49/200 [00:04<00:12, 12.01it/s]
 32%|███▏      | 63/200 [00:08<00:17,  7.80it/s]
 29%|██▉       | 58/200 [00:06<00:16,  8.49it/s]


Model initialized. Training on cuda


 26%|██▋       | 53/200 [00:03<00:11, 13.31it/s]
 28%|██▊       | 57/200 [00:06<00:16,  8.81it/s]
 29%|██▉       | 58/200 [00:06<00:15,  8.94it/s]


Model initialized. Training on cuda


 24%|██▍       | 48/200 [00:03<00:12, 12.02it/s]
 30%|███       | 60/200 [00:07<00:17,  7.92it/s]
 30%|██▉       | 59/200 [00:07<00:17,  8.22it/s]


Model initialized. Training on cuda


 34%|███▍      | 69/200 [00:04<00:09, 14.44it/s]
 18%|█▊        | 37/200 [00:04<00:20,  8.04it/s]
 28%|██▊       | 57/200 [00:07<00:18,  7.84it/s]


Model initialized. Training on cuda


 34%|███▍      | 68/200 [00:05<00:09, 13.32it/s]
 19%|█▉        | 38/200 [00:04<00:20,  7.86it/s]
 28%|██▊       | 57/200 [00:06<00:15,  9.19it/s]


Model initialized. Training on cuda


 31%|███       | 62/200 [00:04<00:09, 14.77it/s]
 34%|███▎      | 67/200 [00:07<00:15,  8.75it/s]
 28%|██▊       | 55/200 [00:06<00:16,  8.75it/s]


Model initialized. Training on cuda


 30%|███       | 61/200 [00:04<00:10, 13.47it/s]
 19%|█▉        | 38/200 [00:04<00:19,  8.34it/s]
 28%|██▊       | 56/200 [00:07<00:18,  7.74it/s]


Model initialized. Training on cuda


 34%|███▎      | 67/200 [00:05<00:11, 11.69it/s]
 15%|█▌        | 30/200 [00:02<00:16, 10.46it/s]
 28%|██▊       | 55/200 [00:06<00:17,  8.46it/s]


Model initialized. Training on cuda


 64%|██████▍   | 32/50 [00:20<00:11,  1.57it/s]
 54%|█████▍    | 27/50 [00:35<00:30,  1.31s/it]
 32%|███▏      | 16/50 [00:21<00:46,  1.36s/it]


Model initialized. Training on cuda


 64%|██████▍   | 32/50 [00:21<00:11,  1.51it/s]
 46%|████▌     | 23/50 [00:30<00:35,  1.33s/it]
 32%|███▏      | 16/50 [00:21<00:45,  1.35s/it]


Model initialized. Training on cuda


 64%|██████▍   | 32/50 [00:19<00:11,  1.62it/s]
 28%|██▊       | 14/50 [00:18<00:48,  1.35s/it]
 32%|███▏      | 16/50 [00:21<00:46,  1.36s/it]


Model initialized. Training on cuda


 66%|██████▌   | 33/50 [00:20<00:10,  1.61it/s]
 56%|█████▌    | 28/50 [00:36<00:28,  1.31s/it]
 32%|███▏      | 16/50 [00:21<00:45,  1.33s/it]


Model initialized. Training on cuda


 66%|██████▌   | 33/50 [00:18<00:09,  1.78it/s]
 68%|██████▊   | 34/50 [00:45<00:21,  1.35s/it]
 26%|██▌       | 13/50 [00:17<00:50,  1.36s/it]


In [96]:
# Without coupling
results_ablation = np.zeros((len(datasets), nrep))

for idata, data_to_use in enumerate(datasets):
    for irep in range(nrep):

        trainer = Trainer(data_to_use, ckp_path, params_set[idata])
        
        # First step: train the model with a trial-invariant stimulus effect
        trainer.train(
            include_stimulus=True,
            include_coupling=False,
            include_self_history=False,
            fix_stimulus=True,
            fix_latents=True,
            verbose=verbose,
        )
        # Second step: train the model with a trial-varying stimulus effect
        # trainer.make_optimizer(frozen_params=['sti_readout'])
        trainer.make_optimizer(frozen_params=['sti_inhomo', ]) # We are fixing the trial-invariant stimulus effect
        trainer.train(
            include_stimulus=True,
            include_coupling=False,
            include_self_history=False,
            fix_stimulus=False,
            fix_latents=True,
            verbose=verbose,
        )

        # trainer.make_optimizer(frozen_params=['transformer_encoder', 'to_latent', 'token_converter'])
        trainer.make_optimizer(frozen_params=['transformer_encoder', 'to_latent', 'token_converter',
            'sti_readout', 'sti_decoder', 'sti_inhomo', 'cp_latents_readout', 'cp_time_varying_coef_offset', 
            'cp_beta_coupling', 'cp_weight_sending', 'cp_weight_receiving'])
        # trainer.make_optimizer(frozen_params=[])
        test_loss = trainer.train(
            include_stimulus=True,
            include_coupling=False,
            include_self_history=True,
            fix_stimulus=False,
            fix_latents=True,
            verbose=verbose,
        )

        results_ablation[idata, irep] = test_loss
np.save('/home/qix/user_data/EIF_simulation_dataset/results_ablation_wo_coupling.npy', results_ablation)

Model initialized. Training on cuda


 26%|██▌       | 51/200 [00:04<00:13, 11.27it/s]
  6%|▌         | 12/200 [00:01<00:20,  9.37it/s]
 38%|███▊      | 75/200 [00:07<00:12,  9.65it/s]


Model initialized. Training on cuda


 21%|██        | 42/200 [00:03<00:12, 12.74it/s]
 38%|███▊      | 76/200 [00:08<00:13,  9.48it/s]
 30%|██▉       | 59/200 [00:06<00:14,  9.42it/s]


Model initialized. Training on cuda


 24%|██▎       | 47/200 [00:03<00:11, 13.86it/s]
 18%|█▊        | 35/200 [00:04<00:19,  8.26it/s]
 36%|███▌      | 72/200 [00:06<00:12, 10.35it/s]


Model initialized. Training on cuda


 27%|██▋       | 54/200 [00:04<00:12, 11.62it/s]
 38%|███▊      | 76/200 [00:08<00:13,  8.87it/s]
 32%|███▏      | 63/200 [00:06<00:14,  9.32it/s]


Model initialized. Training on cuda


 28%|██▊       | 56/200 [00:04<00:11, 12.73it/s]
 43%|████▎     | 86/200 [00:08<00:10, 10.39it/s]
 32%|███▏      | 63/200 [00:06<00:13, 10.00it/s]


Model initialized. Training on cuda


 39%|███▉      | 78/200 [00:06<00:09, 12.28it/s]
 17%|█▋        | 34/200 [00:03<00:17,  9.48it/s]
 29%|██▉       | 58/200 [00:06<00:15,  9.31it/s]


Model initialized. Training on cuda


 36%|███▌      | 71/200 [00:05<00:10, 12.27it/s]
 20%|█▉        | 39/200 [00:03<00:16,  9.78it/s]
 27%|██▋       | 54/200 [00:05<00:14,  9.88it/s]


Model initialized. Training on cuda


 32%|███▏      | 64/200 [00:05<00:10, 12.73it/s]
 26%|██▋       | 53/200 [00:05<00:16,  9.14it/s]
 28%|██▊       | 57/200 [00:06<00:15,  9.30it/s]


Model initialized. Training on cuda


 31%|███       | 62/200 [00:04<00:09, 13.98it/s]
 24%|██▎       | 47/200 [00:05<00:17,  8.94it/s]
 28%|██▊       | 57/200 [00:05<00:14,  9.76it/s]


Model initialized. Training on cuda


 35%|███▌      | 70/200 [00:05<00:10, 12.19it/s]
 18%|█▊        | 35/200 [00:03<00:16, 10.12it/s]
 28%|██▊       | 56/200 [00:05<00:13, 10.81it/s]


Model initialized. Training on cuda


 64%|██████▍   | 32/50 [00:20<00:11,  1.58it/s]
 94%|█████████▍| 47/50 [00:39<00:02,  1.18it/s]
 28%|██▊       | 14/50 [00:12<00:33,  1.08it/s]


Model initialized. Training on cuda


 64%|██████▍   | 32/50 [00:20<00:11,  1.57it/s]
 76%|███████▌  | 38/50 [00:31<00:09,  1.20it/s]
 34%|███▍      | 17/50 [00:14<00:28,  1.17it/s]


Model initialized. Training on cuda


 66%|██████▌   | 33/50 [00:19<00:10,  1.69it/s]
 76%|███████▌  | 38/50 [00:32<00:10,  1.15it/s]
 34%|███▍      | 17/50 [00:14<00:28,  1.15it/s]


Model initialized. Training on cuda


 66%|██████▌   | 33/50 [00:21<00:11,  1.53it/s]
 90%|█████████ | 45/50 [00:38<00:04,  1.16it/s]
 32%|███▏      | 16/50 [00:13<00:28,  1.18it/s]


Model initialized. Training on cuda


 64%|██████▍   | 32/50 [00:20<00:11,  1.60it/s]
 50%|█████     | 25/50 [00:22<00:22,  1.12it/s]
 34%|███▍      | 17/50 [00:14<00:27,  1.19it/s]


In [97]:
# Without neuron's post-spike effects
results_ablation = np.zeros((len(datasets), nrep))

for idata, data_to_use in enumerate(datasets):
    for irep in range(nrep):

        trainer = Trainer(data_to_use, ckp_path, params_set[idata])
        
        # First step: train the model with a trial-invariant stimulus effect
        trainer.train(
            include_stimulus=True,
            include_coupling=False,
            include_self_history=False,
            fix_stimulus=True,
            fix_latents=True,
            verbose=verbose,
        )
        # Second step: train the model with a trial-varying stimulus effect
        # trainer.make_optimizer(frozen_params=['sti_readout'])
        trainer.make_optimizer(frozen_params=['sti_inhomo', ]) # We are fixing the trial-invariant stimulus effect
        test_loss = trainer.train(
            include_stimulus=True,
            include_coupling=False,
            include_self_history=False,
            fix_stimulus=False,
            fix_latents=True,
            verbose=verbose,
        )

        trainer.make_optimizer(frozen_params=['transformer_encoder', 'to_latent', 'token_converter'])
        # trainer.make_optimizer(frozen_params=[])
        trainer.train(
            include_stimulus=True,
            include_coupling=True,
            include_self_history=False,
            fix_stimulus=False,
            fix_latents=True,
            verbose=verbose,
        )

        results_ablation[idata, irep] = test_loss
np.save('/home/qix/user_data/EIF_simulation_dataset/results_ablation_wo_post_spike.npy', results_ablation)

Model initialized. Training on cuda


 24%|██▎       | 47/200 [00:03<00:12, 12.43it/s]
 26%|██▌       | 51/200 [00:05<00:16,  9.06it/s]
 10%|█         | 20/200 [00:02<00:22,  8.16it/s]


Model initialized. Training on cuda


 26%|██▋       | 53/200 [00:03<00:09, 15.61it/s]
 20%|█▉        | 39/200 [00:04<00:19,  8.33it/s]
 10%|█         | 21/200 [00:02<00:21,  8.16it/s]


Model initialized. Training on cuda


 24%|██▍       | 48/200 [00:03<00:11, 13.07it/s]
 34%|███▎      | 67/200 [00:06<00:12, 10.77it/s]
 11%|█         | 22/200 [00:02<00:19,  9.34it/s]


Model initialized. Training on cuda


 24%|██▍       | 48/200 [00:03<00:11, 12.71it/s]
 26%|██▌       | 51/200 [00:05<00:15,  9.86it/s]
 12%|█▏        | 23/200 [00:02<00:21,  8.24it/s]


Model initialized. Training on cuda


 24%|██▍       | 48/200 [00:03<00:12, 12.44it/s]
 37%|███▋      | 74/200 [00:08<00:13,  9.08it/s]
 10%|█         | 20/200 [00:02<00:21,  8.57it/s]


Model initialized. Training on cuda


 35%|███▌      | 70/200 [00:05<00:10, 12.98it/s]
 16%|█▋        | 33/200 [00:03<00:16, 10.05it/s]
 14%|█▍        | 28/200 [00:03<00:19,  8.88it/s]


Model initialized. Training on cuda


 40%|███▉      | 79/200 [00:05<00:08, 14.02it/s]
 10%|█         | 20/200 [00:02<00:19,  9.16it/s]
 10%|▉         | 19/200 [00:02<00:21,  8.49it/s]


Model initialized. Training on cuda


 34%|███▎      | 67/200 [00:05<00:10, 12.89it/s]
 34%|███▎      | 67/200 [00:07<00:14,  9.25it/s]
 16%|█▌        | 31/200 [00:03<00:17,  9.40it/s]


Model initialized. Training on cuda


 30%|██▉       | 59/200 [00:04<00:11, 12.12it/s]
 32%|███▏      | 64/200 [00:06<00:13,  9.82it/s]
 12%|█▏        | 24/200 [00:03<00:23,  7.52it/s]


Model initialized. Training on cuda


 36%|███▌      | 71/200 [00:05<00:09, 13.86it/s]
 15%|█▌        | 30/200 [00:03<00:17,  9.88it/s]
 20%|██        | 41/200 [00:05<00:20,  7.81it/s]


Model initialized. Training on cuda


 64%|██████▍   | 32/50 [00:19<00:11,  1.63it/s]
100%|██████████| 50/50 [00:42<00:00,  1.18it/s]
 22%|██▏       | 11/50 [00:15<00:54,  1.39s/it]


Model initialized. Training on cuda


 64%|██████▍   | 32/50 [00:19<00:10,  1.64it/s]
 90%|█████████ | 45/50 [00:38<00:04,  1.16it/s]
 36%|███▌      | 18/50 [00:24<00:43,  1.35s/it]


Model initialized. Training on cuda


 66%|██████▌   | 33/50 [00:21<00:11,  1.50it/s]
 98%|█████████▊| 49/50 [00:41<00:00,  1.19it/s]
 22%|██▏       | 11/50 [00:15<00:55,  1.41s/it]


Model initialized. Training on cuda


 62%|██████▏   | 31/50 [00:18<00:11,  1.67it/s]
100%|██████████| 50/50 [00:45<00:00,  1.09it/s]
 26%|██▌       | 13/50 [00:22<01:04,  1.73s/it]


Model initialized. Training on cuda


 64%|██████▍   | 32/50 [00:22<00:12,  1.43it/s]
100%|██████████| 50/50 [00:42<00:00,  1.17it/s]
 18%|█▊        | 9/50 [00:12<00:58,  1.43s/it]


In [100]:
# Transformer -> RNN
results_ablation = np.zeros((len(datasets), nrep))

for idata, data_to_use in enumerate(datasets):
    for irep in range(nrep):

        trainer = Trainer(data_to_use, ckp_path, params_set[idata])
        
        # First step: train the model with a trial-invariant stimulus effect
        trainer.train(
            include_stimulus=True,
            include_coupling=False,
            include_self_history=False,
            fix_stimulus=True,
            fix_latents=True,
            verbose=verbose,
        )
        # Second step: train the model with a trial-varying stimulus effect
        # trainer.make_optimizer(frozen_params=['sti_readout'])
        trainer.make_optimizer(frozen_params=['sti_inhomo', ]) # We are fixing the trial-invariant stimulus effect
        trainer.train(
            include_stimulus=True,
            include_coupling=False,
            include_self_history=False,
            fix_stimulus=False,
            fix_latents=True,
            verbose=verbose,
        )

        trainer.make_optimizer(frozen_params=['transformer_encoder', 'to_latent', 'token_converter'])
        # trainer.make_optimizer(frozen_params=[])
        trainer.train(
            include_stimulus=True,
            include_coupling=True,
            include_self_history=False,
            fix_stimulus=False,
            fix_latents=True,
            verbose=verbose,
        )

        # trainer.make_optimizer(frozen_params=['transformer_encoder', 'to_latent', 'token_converter'])
        trainer.make_optimizer(frozen_params=['transformer_encoder', 'to_latent', 'token_converter',
            'sti_readout', 'sti_decoder', 'sti_inhomo', 'cp_latents_readout', 'cp_time_varying_coef_offset', 
            'cp_beta_coupling', 'cp_weight_sending', 'cp_weight_receiving'])
        # trainer.make_optimizer(frozen_params=[])
        test_loss = trainer.train(
            include_stimulus=True,
            include_coupling=True,
            include_self_history=True,
            fix_stimulus=False,
            fix_latents=True,
            verbose=verbose,
        )

        results_ablation[idata, irep] = test_loss
np.save('/home/qix/user_data/EIF_simulation_dataset/results_ablation_rnn.npy', results_ablation)

Model initialized. Training on cuda


 24%|██▎       | 47/200 [00:03<00:10, 14.92it/s]
  4%|▍         | 9/200 [00:00<00:14, 13.09it/s]
 13%|█▎        | 26/200 [00:02<00:17,  9.96it/s]
 32%|███▏      | 63/200 [00:06<00:14,  9.37it/s]


Model initialized. Training on cuda


 26%|██▌       | 51/200 [00:03<00:08, 16.59it/s]
 23%|██▎       | 46/200 [00:04<00:13, 11.17it/s]
  9%|▉         | 18/200 [00:02<00:21,  8.47it/s]
 28%|██▊       | 57/200 [00:06<00:15,  8.96it/s]


Model initialized. Training on cuda


 24%|██▎       | 47/200 [00:02<00:09, 15.96it/s]
  7%|▋         | 14/200 [00:01<00:17, 10.82it/s]
 45%|████▌     | 90/200 [00:09<00:11,  9.52it/s]
 29%|██▉       | 58/200 [00:06<00:15,  9.23it/s]


Model initialized. Training on cuda


 26%|██▌       | 52/200 [00:03<00:10, 14.39it/s]
 37%|███▋      | 74/200 [00:06<00:10, 11.59it/s]
  9%|▉         | 18/200 [00:01<00:16, 11.17it/s]
 28%|██▊       | 55/200 [00:05<00:14, 10.14it/s]


Model initialized. Training on cuda


 26%|██▌       | 51/200 [00:03<00:09, 14.90it/s]
 11%|█         | 22/200 [00:01<00:15, 11.52it/s]
 22%|██▏       | 43/200 [00:04<00:16,  9.41it/s]
 28%|██▊       | 57/200 [00:06<00:15,  9.12it/s]


Model initialized. Training on cuda


 34%|███▍      | 68/200 [00:04<00:09, 14.35it/s]
 33%|███▎      | 66/200 [00:06<00:12, 10.58it/s]
 12%|█▏        | 23/200 [00:02<00:19,  9.14it/s]
 28%|██▊       | 56/200 [00:05<00:15,  9.47it/s]


Model initialized. Training on cuda


 38%|███▊      | 76/200 [00:05<00:08, 14.00it/s]
 44%|████▎     | 87/200 [00:07<00:09, 11.62it/s]
  7%|▋         | 14/200 [00:01<00:22,  8.42it/s]
 28%|██▊       | 56/200 [00:06<00:15,  9.13it/s]


Model initialized. Training on cuda


 32%|███▏      | 64/200 [00:04<00:09, 13.86it/s]
 42%|████▎     | 85/200 [00:08<00:11, 10.26it/s]
  9%|▉         | 18/200 [00:01<00:16, 10.92it/s]
 28%|██▊       | 55/200 [00:05<00:15,  9.48it/s]


Model initialized. Training on cuda


 35%|███▌      | 70/200 [00:04<00:09, 14.32it/s]
 38%|███▊      | 77/200 [00:06<00:10, 11.54it/s]
 32%|███▏      | 64/200 [00:06<00:14,  9.16it/s]
 28%|██▊       | 55/200 [00:06<00:16,  9.03it/s]


Model initialized. Training on cuda


 34%|███▍      | 68/200 [00:04<00:08, 16.25it/s]
 36%|███▋      | 73/200 [00:06<00:10, 11.93it/s]
  9%|▉         | 18/200 [00:01<00:17, 10.52it/s]
 28%|██▊       | 56/200 [00:05<00:13, 10.64it/s]


Model initialized. Training on cuda


 64%|██████▍   | 32/50 [00:19<00:11,  1.63it/s]
100%|██████████| 50/50 [00:38<00:00,  1.29it/s]
 24%|██▍       | 12/50 [00:15<00:50,  1.32s/it]
 32%|███▏      | 16/50 [00:20<00:44,  1.30s/it]


Model initialized. Training on cuda


 64%|██████▍   | 32/50 [00:19<00:10,  1.68it/s]
100%|██████████| 50/50 [00:40<00:00,  1.22it/s]
 28%|██▊       | 14/50 [00:17<00:46,  1.28s/it]
 26%|██▌       | 13/50 [00:17<00:49,  1.33s/it]


Model initialized. Training on cuda


 66%|██████▌   | 33/50 [00:19<00:09,  1.70it/s]
100%|██████████| 50/50 [00:38<00:00,  1.30it/s]
 32%|███▏      | 16/50 [00:20<00:44,  1.31s/it]
 26%|██▌       | 13/50 [00:16<00:48,  1.31s/it]


Model initialized. Training on cuda


 66%|██████▌   | 33/50 [00:20<00:10,  1.61it/s]
100%|██████████| 50/50 [00:38<00:00,  1.29it/s]
 20%|██        | 10/50 [00:13<00:53,  1.33s/it]
 32%|███▏      | 16/50 [00:21<00:45,  1.34s/it]


Model initialized. Training on cuda


 66%|██████▌   | 33/50 [00:19<00:10,  1.67it/s]
100%|██████████| 50/50 [00:40<00:00,  1.25it/s]
 18%|█▊        | 9/50 [00:12<00:56,  1.37s/it]
 26%|██▌       | 13/50 [00:17<00:48,  1.32s/it]


In [None]:
# Low-rank -> full-rank
# results_ablation = np.zeros((len(datasets), nrep))

# for idata, data_to_use in enumerate(datasets):
#     for irep in range(nrep):

#         trainer = Trainer(data_to_use, ckp_path, params_set[idata])
        
#         # First step: train the model with a trial-invariant stimulus effect
#         trainer.train(
#             include_stimulus=True,
#             include_coupling=False,
#             include_self_history=False,
#             fix_stimulus=True,
#             fix_latents=True,
#             verbose=verbose,
#         )
#         # Second step: train the model with a trial-varying stimulus effect
#         # trainer.make_optimizer(frozen_params=['sti_readout'])
#         trainer.make_optimizer(frozen_params=['sti_inhomo', ]) # We are fixing the trial-invariant stimulus effect
#         trainer.train(
#             include_stimulus=True,
#             include_coupling=False,
#             include_self_history=False,
#             fix_stimulus=False,
#             fix_latents=True,
#             verbose=verbose,
#         )

#         trainer.make_optimizer(frozen_params=['transformer_encoder', 'to_latent', 'token_converter'])
#         # trainer.make_optimizer(frozen_params=[])
#         trainer.train(
#             include_stimulus=True,
#             include_coupling=True,
#             include_self_history=False,
#             fix_stimulus=False,
#             fix_latents=True,
#             verbose=verbose,
#         )

#         # trainer.make_optimizer(frozen_params=['transformer_encoder', 'to_latent', 'token_converter'])
#         trainer.make_optimizer(frozen_params=['transformer_encoder', 'to_latent', 'token_converter',
#             'sti_readout', 'sti_decoder', 'sti_inhomo', 'cp_latents_readout', 'cp_time_varying_coef_offset', 
#             'cp_beta_coupling', 'cp_weight_sending', 'cp_weight_receiving'])
#         # trainer.make_optimizer(frozen_params=[])
#         test_loss = trainer.train(
#             include_stimulus=True,
#             include_coupling=True,
#             include_self_history=True,
#             fix_stimulus=False,
#             fix_latents=True,
#             verbose=verbose,
#         )

#         results_ablation[idata, irep] = test_loss
# np.save('/home/qix/user_data/EIF_simulation_dataset/results_ablation_full_rank.npy', results_ablation)



Model initialized. Training on cuda


  4%|▍         | 8/200 [00:04<01:50,  1.73it/s]
  self.model.load_state_dict(torch.load(self.temp_best_model_path))
 24%|██▎       | 47/200 [00:34<01:51,  1.38it/s]
  4%|▎         | 7/200 [00:06<03:04,  1.05it/s]
  6%|▌         | 12/200 [00:11<03:01,  1.04it/s]


Model initialized. Training on cuda


  4%|▍         | 8/200 [00:04<01:40,  1.90it/s]
 18%|█▊        | 37/200 [00:27<02:00,  1.35it/s]
  6%|▌         | 11/200 [00:10<02:57,  1.07it/s]
  6%|▌         | 12/200 [00:12<03:09,  1.01s/it]


In [101]:
# Load results from different models
results_full = np.load('/home/qix/user_data/EIF_simulation_dataset/results_ablation_full_model.npy')
results_wo_encoder = np.load('/home/qix/user_data/EIF_simulation_dataset/results_ablation_wo_encoder.npy') 
results_wo_coupling = np.load('/home/qix/user_data/EIF_simulation_dataset/results_ablation_wo_coupling.npy')
results_wo_post_spike = np.load('/home/qix/user_data/EIF_simulation_dataset/results_ablation_wo_post_spike.npy')
results_rnn = np.load('/home/qix/user_data/EIF_simulation_dataset/results_ablation_rnn.npy')

# Calculate mean and sem for each model and dataset
def mean_sem(data):
    return f"{data.mean():.5f} ({data.std()/np.sqrt(len(data)):.5f})"

# Create table rows
table_rows = []
for i in range(len(datasets)):
    row = [
        mean_sem(results_full[i,:]),
        mean_sem(results_wo_encoder[i,:]), 
        mean_sem(results_wo_coupling[i,:]),
        mean_sem(results_wo_post_spike[i,:]),
        mean_sem(results_rnn[i,:])
    ]
    table_rows.append(row)

# Print table
print("Dataset\tFull Model\tW/o Encoder\tW/o Coupling\tW/o post spike\tRNN")
print("-"*100)
for i, row in enumerate(table_rows):
    print(f"Data {i+1}\t{row[0]}\t{row[1]}\t{row[2]}\t{row[3]}\t{row[4]}")



Dataset	Full Model	W/o Encoder	W/o Coupling	W/o post spike	RNN
----------------------------------------------------------------------------------------------------
Data 1	0.20055 (0.00017)	0.20231 (0.00029)	0.20430 (0.00079)	0.20728 (0.00027)	0.20215 (0.00036)
Data 2	0.25223 (0.00008)	0.25344 (0.00012)	0.25621 (0.00012)	0.26715 (0.00046)	0.25244 (0.00017)
Data 3	0.05674 (0.00005)	0.05735 (0.00004)	0.05735 (0.00005)	0.05776 (0.00001)	0.05683 (0.00004)
