In [1]:
import sys
sys.path.append("../../src")
import torch
import matplotlib.pyplot as plt
import numpy as np
import torchvision
import torch.nn.functional as F

import glob
import os
from datetime import datetime
import time
import math
from tqdm import tqdm

from itertools import repeat
from torch.nn.parameter import Parameter
import collections
import matplotlib
from torch_utils import *
from ContrastiveModels import ContrastiveCorInfoMaxHopfield
from visualization import *
from dataset import get_boston_housing_dataset_pytorch
# matplotlib.use('Agg')

In [11]:
# Device selection.
# The original cell auto-detected CUDA and then unconditionally overwrote the
# result with "cpu", which made the detection dead code.  The override is now an
# explicit switch: flip FORCE_CPU to False to use the first GPU when available.
# NOTE(review): the saved traceback of the training cell reports a cpu / cuda:0
# mismatch, so something still places tensors on the GPU — presumably inside the
# model code or stale kernel state; TODO confirm after Restart & Run All.
FORCE_CPU = True
device = "cpu" if FORCE_CPU or not torch.cuda.is_available() else "cuda:0"
device

'cpu'

In [12]:
# Build the train / test loaders (mini-batches of 5, fixed seed) together with
# the scalar that is later used to scale targets and predictions before the
# RMSE is computed.
(train_loader,
 test_loader,
 maximum_label_value) = get_boston_housing_dataset_pytorch(batch_size = 5, seed = 10)

In [13]:
# Pull a single mini-batch from the training loader and show the layout of the
# inputs (rows are samples, columns are features).
batch_iter = iter(train_loader)
x, y = next(batch_iter)
x.shape

torch.Size([5, 13])

In [14]:
# ---- Network definition ---------------------------------------------------
# The first entry matches the 13 input features seen in x.shape; the last entry
# is the single regression output.
architecture = [13, 13, 1]
activation = hard_sigmoid

# ---- Constructor hyper-parameters -----------------------------------------
lambda_ = 0.99995
epsilon = 0.15
one_over_epsilon = 1 / epsilon

# ---- Weight learning rates ------------------------------------------------
# One entry per layer transition; these start values are decayed per epoch in
# the training cell.
lr_start = dict(ff = np.array([0.3, 0.15]), fb = np.array([0.15, 0.1]))

# ---- Neural-dynamics settings (forwarded unchanged to the model calls) ----
neural_lr_start = 0.05
neural_lr_stop = 0.001
neural_lr_rule = "constant"
neural_lr_decay_multiplier = 0.01
neural_dynamic_iterations_free = 30
neural_dynamic_iterations_nudged = 10
hopfield_g = 0.1

# ---- Training-phase switches (forwarded to batch_step_hopfield) -----------
beta = 1
use_random_sign_beta = True   # when True the training cell multiplies beta by a random +/-1
use_three_phase = False
weight_decay = False

model = ContrastiveCorInfoMaxHopfield(
    architecture = architecture,
    lambda_ = lambda_,
    epsilon = epsilon,
    activation = activation,
    device = device,
)

In [15]:
trn_rmse_list = []
tst_rmse_list = []
debug_iteration_point = 1
n_epochs = 25


def evaluate_rmse(loader):
    """Return the RMSE of the model's predictions over every batch of ``loader``.

    Reads the notebook-level ``model``, ``device``, ``maximum_label_value`` and
    the neural-dynamics hyper-parameters.  Targets and predictions are both
    multiplied by ``maximum_label_value`` before the error is computed.

    Args:
        loader: iterable yielding ``(x, y)`` batches, e.g. ``train_loader``.

    Returns:
        The root-mean-square error over all samples yielded by ``loader``.
    """
    gt_list = []
    pred_list = []
    for inputs, targets in loader:
        # Batches are transposed before being handed to the model, so after the
        # transpose size(1) is the number of samples in the batch.
        inputs, targets = inputs.to(device).T, targets.to(device).T
        neurons = model.init_neurons(inputs.size(1), device = device)
        # NOTE(review): the trailing `0, False` are presumably beta = 0 (no
        # nudging towards the target) and debug logging off — confirm against
        # the signature of run_neural_dynamics_hopfield.
        neurons, _, _ = model.run_neural_dynamics_hopfield(
            inputs, targets, neurons, hopfield_g, neural_lr_start, neural_lr_stop,
            neural_lr_rule, neural_lr_decay_multiplier,
            neural_dynamic_iterations_free, 0, False)
        output = neurons[-1]  # the last entry of the neuron list is used as the prediction
        gt_list.extend(maximum_label_value*torch2numpy(targets).reshape(-1,))
        pred_list.extend(maximum_label_value*torch2numpy(output).reshape(-1,))
    return np.sqrt(((np.array(gt_list) - np.array(pred_list)) ** 2).mean())


for epoch_ in range(n_epochs):
    # Both learning-rate vectors shrink by 1% per epoch.
    lr = {'ff' : lr_start['ff'] * (0.99)**epoch_, 'fb' : lr_start['fb'] * (0.99)**epoch_}
    # tqdm wraps the loader itself (not enumerate) so it can read the loader's
    # length and show a total / ETA.
    for idx, (x, y) in enumerate(tqdm(train_loader)):
        x, y = x.to(device).T, y.to(device).T
        take_debug_logs_ = (idx % 500 == 0)
        # Draw the sign per step into a local value.  The configured `beta` is
        # no longer overwritten, so it keeps its value and sign after the cell
        # finishes and the cell can be re-run with the same configuration.
        if use_random_sign_beta:
            rnd_sgn = 2*np.random.randint(2) - 1
            step_beta = rnd_sgn*beta
        else:
            step_beta = beta

        neurons = model.batch_step_hopfield( x, y, hopfield_g,
                                             lr, neural_lr_start, neural_lr_stop, neural_lr_rule,
                                             neural_lr_decay_multiplier, neural_dynamic_iterations_free,
                                             neural_dynamic_iterations_nudged, step_beta,
                                             use_three_phase, take_debug_logs_, weight_decay)

    if epoch_ % debug_iteration_point == 0:
        ## Train Evaluation
        train_RMSE = evaluate_rmse(train_loader)
        trn_rmse_list.append(train_RMSE)

        ## Test Evaluation
        test_RMSE = evaluate_rmse(test_loader)
        tst_rmse_list.append(test_RMSE)

        print("Train RMSE : {}, Test RMSE : {}".format(train_RMSE, test_RMSE))

81it [00:02, 35.98it/s]


RuntimeError: Expected all tensors to be on the same device, but found at least two devices, cpu and cuda:0! (when checking argument for argument mat2 in method wrapper_mm)

In [16]:
# Inspect the tensor stored under 'weight' in the first entry of model.Wff.
first_ff_entry = model.Wff[0]
first_ff_entry['weight']

tensor([[-0.0585,  0.1625, -0.1054, -0.1475, -0.0787,  0.3325,  0.0314,  0.1486,
         -0.3368,  0.2345,  0.1331, -0.0627,  0.0902],
        [ 0.2215,  0.4429,  0.1801,  0.2422,  0.0301, -0.3304,  0.2547,  0.3777,
          0.4361, -0.2082,  0.3957,  0.2056,  0.0536],
        [-0.3442,  0.4713, -0.2985,  0.3816, -0.1980,  0.0536, -0.0799,  0.2819,
         -0.2043,  0.4628,  0.4668,  0.3641, -0.1129],
        [ 0.0444, -0.1992,  0.1594, -0.3471, -0.4588, -0.0048,  0.2268, -0.0896,
         -0.4690,  0.2970, -0.2099, -0.2760,  0.1615],
        [-0.1262, -0.4450,  0.1260, -0.1497, -0.1387,  0.1112, -0.4513, -0.3621,
          0.3457, -0.1150, -0.1068,  0.2249,  0.4742],
        [-0.4536, -0.3350,  0.0205,  0.4398,  0.3789,  0.2073, -0.1373,  0.3314,
          0.3517,  0.3702,  0.2460,  0.3980, -0.4394],
        [ 0.2998, -0.3453, -0.2282,  0.4612, -0.1155, -0.4239,  0.2718, -0.0743,
          0.4459,  0.4687, -0.2242, -0.4357,  0.1905],
        [-0.2259, -0.4543, -0.3804,  0.0122,  0.

In [17]:
# Sanity check: echo the device the notebook is configured to use
# (the recorded output is 'cpu').
device

'cpu'

In [None]:
# Training-set RMSE per evaluated epoch.  The original cell referenced
# `trn_acc_list`, which this notebook never defines, and labelled the curve as
# an accuracy; the history collected by the training cell is `trn_rmse_list`.
plot_convergence_plot(trn_rmse_list, xlabel = 'Number of Epochs', ylabel = 'RMSE',
                      title = 'Contrastive CorInfoMax Train RMSE w.r.t. Epochs', 
                      figsize = (12,8), fontsize = 25, linewidth = 3)

In [None]:
# Test-set RMSE per evaluated epoch.  The original cell referenced
# `tst_acc_list`, which this notebook never defines, and labelled the curve as
# an accuracy; the history collected by the training cell is `tst_rmse_list`.
plot_convergence_plot(tst_rmse_list, xlabel = 'Number of Epochs', ylabel = 'RMSE',
                      title = 'Contrastive CorInfoMax Test RMSE w.r.t. Epochs', 
                      figsize = (12,8), fontsize = 25, linewidth = 3)

In [None]:
# from IPython.display import Math, display
# ########### LATEX Style Display Matrix ###############
# def display_matrix(array):
#     """Display given numpy array with Latex format in Jupyter Notebook.
#     Args:
#         array (numpy array): Array to be displayed
#     """
#     data = ""
#     for line in array:
#         if len(line) == 1:
#             data += " %.3f &" % line + r" \\\n"
#             continue
#         for element in line:
#             data += " %.3f &" % element
#         data += r" \\" + "\n"
#     display(Math("\\begin{bmatrix} \n%s\\end{bmatrix}" % data))

In [None]:
# display_matrix(model.B[0]['weight'][:10,:10])

In [None]:
# display_matrix(torch.linalg.inv(model.Rh1)[:10,:10])

In [None]:
# torch.norm(model.B[0]['weight'] - torch.linalg.inv(model.Rh1))

In [None]:
# display_matrix(torch.linalg.inv(model.Rh2)[:10,:10])