In [1]:
import sys
sys.path.append("../../src")
import torch
import matplotlib.pyplot as plt
import numpy as np
import torchvision
import torch.nn.functional as F

import glob
import os
from datetime import datetime
import time
import math
from tqdm import tqdm

from itertools import repeat
from torch.nn.parameter import Parameter
import collections
import matplotlib
from torch_utils import *
from ContrastiveModels import ContrastiveCorInfoMaxHopfield
from visualization import *
# matplotlib.use('Agg')

In [2]:
# Run on the first CUDA GPU when PyTorch can see one; otherwise stay on the CPU.
if torch.cuda.is_available():
    device = torch.device('cuda:0')
else:
    device = torch.device('cpu')

# Bare expression so the notebook displays the selected device.
device

device(type='cuda', index=0)

In [3]:
# Preprocessing applied to every image of both splits: convert to a tensor,
# then run Normalize with mean 0 and std 1.
transform = torchvision.transforms.Compose(
    [
        torchvision.transforms.ToTensor(),
        torchvision.transforms.Normalize(mean=(0.0,), std=(1.0,)),
    ]
)

# Training split, served in shuffled mini-batches of 20 from the main process.
mnist_dset_train = torchvision.datasets.MNIST(
    '../../data',
    train=True,
    transform=transform,
    target_transform=None,
    download=True,
)
train_loader = torch.utils.data.DataLoader(
    mnist_dset_train,
    batch_size=20,
    shuffle=True,
    num_workers=0,
)

# Test split: same preprocessing and batch size, but iterated in a fixed order.
mnist_dset_test = torchvision.datasets.MNIST(
    '../../data',
    train=False,
    transform=transform,
    target_transform=None,
    download=True,
)
test_loader = torch.utils.data.DataLoader(
    mnist_dset_test,
    batch_size=20,
    shuffle=False,
    num_workers=0,
)

In [4]:
# # Best Hyperparameters so far
# activation = hard_sigmoid
# architecture = [784, 500, 10]

# beta = 1
# lambda_ = 0.99999
# epsilon = 0.15
# one_over_epsilon = 1 / epsilon
# lr_start = {'ff' : np.array([1, 0.75]), 'fb': np.array([0.15, 0.12])}

# neural_lr_start = 0.05
# neural_lr_stop = 0.001
# neural_lr_rule = "constant"
# neural_lr_decay_multiplier = 0.01
# neural_dynamic_iterations_nudged = 5
# neural_dynamic_iterations_free = 30
# hopfield_g = 0.5
# use_random_sign_beta = True
# use_three_phase = False
# weight_decay = False

# ---- Network -----------------------------------------------------------------
# presumably layer widths (input, hidden, output) - confirm against the model class
architecture = [784, 500, 10]
activation = hard_sigmoid

# ---- Objective / weight-update hyperparameters -------------------------------
beta = 1
lambda_ = 0.99999
epsilon = 0.15
one_over_epsilon = 1 / epsilon
# Initial learning rates, two entries per key; the training loop multiplies
# them by a per-epoch decay factor.
# presumably 'ff' = feedforward and 'fb' = feedback weights - TODO confirm
lr_start = dict(
    ff=np.array([0.75, 0.5]),
    fb=np.array([0.15, 0.15]),
)

# ---- Neural-dynamics settings (handed to the model and evaluation calls) -----
neural_lr_start = 0.1
neural_lr_stop = 0.001
neural_lr_rule = "divide_by_slow_loop_index"
neural_lr_decay_multiplier = 0.01
neural_dynamic_iterations_free = 30
neural_dynamic_iterations_nudged = 10
hopfield_g = 0.5

# ---- Training-mode switches --------------------------------------------------
use_random_sign_beta = True   # the training loop draws a random sign for beta per batch
use_three_phase = False
weight_decay = False


# Build the model from the configuration above.
model = ContrastiveCorInfoMaxHopfield(
    architecture=architecture,
    lambda_=lambda_,
    epsilon=epsilon,
    activation=activation,
)

In [5]:
# _ = evaluateContrastiveCorInfoMaxHopfield(model, train_loader, hopfield_g,
#                                           neural_lr_start, neural_lr_stop, neural_lr_rule, 
#                                           neural_lr_decay_multiplier, neural_dynamic_iterations_free, device)

In [None]:
# Per-epoch accuracies on the full train / test sets (filled once per epoch).
trn_acc_list = []
tst_acc_list = []

n_epochs = 50

# Width of the one-hot target, taken from the configured architecture instead
# of a hard-coded 10.
n_classes = architecture[-1]

# Positional arguments shared by the train and test evaluation calls.
eval_args = (hopfield_g, neural_lr_start, neural_lr_stop, neural_lr_rule,
             neural_lr_decay_multiplier, neural_dynamic_iterations_free, device)

for epoch_ in range(n_epochs):
    # Exponential decay of the weight learning rates: base 0.95 for the first
    # 20 epochs, base 0.9 afterwards (both raised to the absolute epoch index).
    # NOTE(review): because the exponent is not reset, the multiplier jumps from
    # 0.95**19 ~= 0.377 to 0.9**20 ~= 0.122 at epoch_ == 20 - confirm this is intended.
    decay = (0.95 if epoch_ < 20 else 0.9) ** epoch_
    lr = {'ff' : lr_start['ff'] * decay, 'fb' : lr_start['fb'] * decay}

    # Wrap the loader itself (not the enumerate object) so tqdm can read its
    # length and show a real progress bar with an ETA.
    for idx, (x, y) in enumerate(tqdm(train_loader)):
        x, y = x.to(device), y.to(device)
        # Flatten each image and transpose so samples are columns: (features, batch).
        x = x.view(x.size(0), -1).T
        # y is already on `device`, so the one-hot tensor is too: (classes, batch).
        y_one_hot = F.one_hot(y, n_classes).T
        take_debug_logs_ = (idx % 500 == 0)

        # Draw a fresh sign for this batch without overwriting the notebook-level
        # `beta`, so re-running the cell always starts from the configured value.
        if use_random_sign_beta:
            rnd_sgn = 2*np.random.randint(2) - 1
            batch_beta = rnd_sgn*beta
        else:
            batch_beta = beta

        neurons = model.batch_step_hopfield( x, y_one_hot, hopfield_g,
                                             lr, neural_lr_start, neural_lr_stop, neural_lr_rule,
                                             neural_lr_decay_multiplier, neural_dynamic_iterations_free,
                                             neural_dynamic_iterations_nudged, batch_beta,
                                             use_three_phase, take_debug_logs_, weight_decay)

    # End-of-epoch evaluation on both splits.
    trn_acc = evaluateContrastiveCorInfoMaxHopfield(model, train_loader, *eval_args, printing = False)
    tst_acc = evaluateContrastiveCorInfoMaxHopfield(model, test_loader, *eval_args, printing = False)
    trn_acc_list.append(trn_acc)
    tst_acc_list.append(tst_acc)

    # NOTE(review): in the recorded run of this cell the accuracy collapsed to
    # ~11% at epoch 29 while the ratios below blew up, and it never recovered.
    # Consider checkpointing the best model and/or stopping once this happens.
    print("Epoch : {}, Train Accuracy : {}, Test Accuracy : {}".format(epoch_+1, trn_acc, tst_acc))
    print("Free Information ratio: {}".format(np.array(model.layerwise_forward_corinfo_list_free)[-1] / np.array(model.layerwise_backward_corinfo_list_free)[-1]))
    print("Nudged Information ratio: {}".format(np.array(model.layerwise_forward_corinfo_list_nudged)[-1] / np.array(model.layerwise_backward_corinfo_list_nudged)[-1]))

3000it [01:22, 36.44it/s]
0it [00:00, ?it/s]

Epoch : 1, Train Accuracy : 0.9353833333333333, Test Accuracy : 0.9359
Free Information ratio: [0.17557825]
Nudged Information ratio: [0.17557802]


3000it [01:20, 37.13it/s]
0it [00:00, ?it/s]

Epoch : 2, Train Accuracy : 0.9585166666666667, Test Accuracy : 0.9569
Free Information ratio: [0.16412885]
Nudged Information ratio: [0.16412853]


3000it [01:54, 26.17it/s]
0it [00:00, ?it/s]

Epoch : 3, Train Accuracy : 0.9653166666666667, Test Accuracy : 0.9606
Free Information ratio: [0.17202327]
Nudged Information ratio: [0.17202288]


3000it [01:54, 26.26it/s]
0it [00:00, ?it/s]

Epoch : 4, Train Accuracy : 0.9709666666666666, Test Accuracy : 0.9668
Free Information ratio: [0.16112977]
Nudged Information ratio: [0.16112939]


3000it [01:56, 25.80it/s]
0it [00:00, ?it/s]

Epoch : 5, Train Accuracy : 0.9753, Test Accuracy : 0.9697
Free Information ratio: [0.13787219]
Nudged Information ratio: [0.13787177]


3000it [01:56, 25.83it/s]
0it [00:00, ?it/s]

Epoch : 6, Train Accuracy : 0.9761, Test Accuracy : 0.9713
Free Information ratio: [0.14424723]
Nudged Information ratio: [0.14424675]


3000it [01:56, 25.81it/s]
0it [00:00, ?it/s]

Epoch : 7, Train Accuracy : 0.9795833333333334, Test Accuracy : 0.9729
Free Information ratio: [0.12625156]
Nudged Information ratio: [0.12625114]


3000it [01:56, 25.84it/s]
0it [00:00, ?it/s]

Epoch : 8, Train Accuracy : 0.98185, Test Accuracy : 0.9737
Free Information ratio: [0.10159608]
Nudged Information ratio: [0.10159562]


3000it [01:56, 25.74it/s]
0it [00:00, ?it/s]

Epoch : 9, Train Accuracy : 0.9820666666666666, Test Accuracy : 0.974
Free Information ratio: [0.11026835]
Nudged Information ratio: [0.11026796]


3000it [01:51, 27.01it/s]
0it [00:00, ?it/s]

Epoch : 10, Train Accuracy : 0.9828833333333333, Test Accuracy : 0.9735
Free Information ratio: [0.10901001]
Nudged Information ratio: [0.1090096]


3000it [01:52, 26.70it/s]
0it [00:00, ?it/s]

Epoch : 11, Train Accuracy : 0.9832, Test Accuracy : 0.9717
Free Information ratio: [0.09267989]
Nudged Information ratio: [0.09267949]


3000it [01:51, 26.84it/s]
0it [00:00, ?it/s]

Epoch : 12, Train Accuracy : 0.9838, Test Accuracy : 0.9751
Free Information ratio: [0.08316297]
Nudged Information ratio: [0.08316256]


3000it [01:52, 26.73it/s]
0it [00:00, ?it/s]

Epoch : 13, Train Accuracy : 0.9843833333333334, Test Accuracy : 0.9757
Free Information ratio: [0.08987551]
Nudged Information ratio: [0.08987516]


3000it [01:46, 28.23it/s]
0it [00:00, ?it/s]

Epoch : 14, Train Accuracy : 0.9842666666666666, Test Accuracy : 0.9743
Free Information ratio: [0.08423819]
Nudged Information ratio: [0.08423783]


3000it [01:50, 27.12it/s]
0it [00:00, ?it/s]

Epoch : 15, Train Accuracy : 0.98515, Test Accuracy : 0.9757
Free Information ratio: [0.09005637]
Nudged Information ratio: [0.09005603]


3000it [01:51, 26.87it/s]
0it [00:00, ?it/s]

Epoch : 16, Train Accuracy : 0.9846333333333334, Test Accuracy : 0.9731
Free Information ratio: [0.07962025]
Nudged Information ratio: [0.07961992]


3000it [01:54, 26.09it/s]
0it [00:00, ?it/s]

Epoch : 17, Train Accuracy : 0.9853333333333333, Test Accuracy : 0.9748
Free Information ratio: [0.07310415]
Nudged Information ratio: [0.07310384]


3000it [01:55, 25.98it/s]
0it [00:00, ?it/s]

Epoch : 18, Train Accuracy : 0.9852, Test Accuracy : 0.9737
Free Information ratio: [0.0666756]
Nudged Information ratio: [0.06667531]


3000it [01:55, 25.94it/s]
0it [00:00, ?it/s]

Epoch : 19, Train Accuracy : 0.9847166666666667, Test Accuracy : 0.9721
Free Information ratio: [0.05854346]
Nudged Information ratio: [0.0585432]


3000it [01:55, 25.98it/s]
0it [00:00, ?it/s]

Epoch : 20, Train Accuracy : 0.9843, Test Accuracy : 0.9723
Free Information ratio: [0.06906918]
Nudged Information ratio: [0.06906892]


3000it [01:55, 26.04it/s]
0it [00:00, ?it/s]

Epoch : 21, Train Accuracy : 0.9842333333333333, Test Accuracy : 0.9735
Free Information ratio: [0.06715872]
Nudged Information ratio: [0.06715845]


3000it [01:55, 26.04it/s]
0it [00:00, ?it/s]

Epoch : 22, Train Accuracy : 0.9833833333333334, Test Accuracy : 0.9725
Free Information ratio: [0.06236535]
Nudged Information ratio: [0.0623651]


3000it [01:55, 25.95it/s]
0it [00:00, ?it/s]

Epoch : 23, Train Accuracy : 0.9839833333333333, Test Accuracy : 0.9732
Free Information ratio: [0.05484673]
Nudged Information ratio: [0.05484651]


3000it [01:55, 25.87it/s]
0it [00:00, ?it/s]

Epoch : 24, Train Accuracy : 0.98335, Test Accuracy : 0.9732
Free Information ratio: [0.05803598]
Nudged Information ratio: [0.05803577]


3000it [01:55, 25.86it/s]
0it [00:00, ?it/s]

Epoch : 25, Train Accuracy : 0.9823666666666667, Test Accuracy : 0.9704
Free Information ratio: [0.05803898]
Nudged Information ratio: [0.05803877]


3000it [01:21, 36.97it/s]
0it [00:00, ?it/s]

Epoch : 26, Train Accuracy : 0.98195, Test Accuracy : 0.9707
Free Information ratio: [0.05550101]
Nudged Information ratio: [0.05550079]


3000it [01:24, 35.29it/s]
0it [00:00, ?it/s]

Epoch : 27, Train Accuracy : 0.98075, Test Accuracy : 0.9703
Free Information ratio: [0.05886189]
Nudged Information ratio: [0.05886167]


3000it [01:21, 36.99it/s]
0it [00:00, ?it/s]

Epoch : 28, Train Accuracy : 0.9788666666666667, Test Accuracy : 0.9684
Free Information ratio: [0.05412788]
Nudged Information ratio: [0.05412767]


3000it [01:21, 36.98it/s]
0it [00:00, ?it/s]

Epoch : 29, Train Accuracy : 0.11236666666666667, Test Accuracy : 0.1135
Free Information ratio: [57.54456821]
Nudged Information ratio: [57.54456821]


3000it [01:20, 37.44it/s]
0it [00:00, ?it/s]

Epoch : 30, Train Accuracy : 0.11236666666666667, Test Accuracy : 0.1135
Free Information ratio: [596.89595796]
Nudged Information ratio: [596.89595796]


3000it [01:21, 36.88it/s]
0it [00:00, ?it/s]

Epoch : 31, Train Accuracy : 0.11236666666666667, Test Accuracy : 0.1135
Free Information ratio: [2162.2641039]
Nudged Information ratio: [2162.2641039]


3000it [01:25, 35.21it/s]
0it [00:00, ?it/s]

Epoch : 32, Train Accuracy : 0.11236666666666667, Test Accuracy : 0.1135
Free Information ratio: [5976.46338511]
Nudged Information ratio: [5976.46338511]


3000it [01:25, 35.27it/s]
0it [00:00, ?it/s]

Epoch : 33, Train Accuracy : 0.11236666666666667, Test Accuracy : 0.1135
Free Information ratio: [16124.45325634]
Nudged Information ratio: [16124.45325634]


3000it [01:20, 37.06it/s]
0it [00:00, ?it/s]

Epoch : 34, Train Accuracy : 0.11236666666666667, Test Accuracy : 0.1135
Free Information ratio: [42457.75316243]
Nudged Information ratio: [42457.75316243]


3000it [01:21, 36.99it/s]
0it [00:00, ?it/s]

Epoch : 35, Train Accuracy : 0.11236666666666667, Test Accuracy : 0.1135
Free Information ratio: [100198.41550665]
Nudged Information ratio: [100198.40585445]


3000it [01:20, 37.09it/s]
0it [00:00, ?it/s]

Epoch : 36, Train Accuracy : 0.11236666666666667, Test Accuracy : 0.1135
Free Information ratio: [178077.52733379]
Nudged Information ratio: [178077.52733379]


3000it [01:22, 36.29it/s]
0it [00:00, ?it/s]

Epoch : 37, Train Accuracy : 0.11236666666666667, Test Accuracy : 0.1135
Free Information ratio: [332282.71234711]
Nudged Information ratio: [332282.68140865]


76it [00:03, 25.57it/s]

In [None]:
# trn_acc_list holds fractions in [0, 1] (the training cell's log prints values
# such as 0.9353), so scale to percent to match the 'Accuracy %' axis label.
# NOTE(review): assumes plot_convergence_plot plots the values as given - confirm.
plot_convergence_plot([100 * acc for acc in trn_acc_list],
                      xlabel = 'Number of Epochs', ylabel = 'Accuracy %',
                      title = 'Contrastive CorInfoMax Train Accuracy w.r.t. Epochs', 
                      figsize = (12,8), fontsize = 25, linewidth = 3)

In [None]:
# tst_acc_list holds fractions in [0, 1] (the training cell's log prints values
# such as 0.9359), so scale to percent to match the 'Accuracy %' axis label.
# NOTE(review): assumes plot_convergence_plot plots the values as given - confirm.
plot_convergence_plot([100 * acc for acc in tst_acc_list],
                      xlabel = 'Number of Epochs', ylabel = 'Accuracy %',
                      title = 'Contrastive CorInfoMax Test Accuracy w.r.t. Epochs', 
                      figsize = (12,8), fontsize = 25, linewidth = 3)

In [None]:
# from IPython.display import Math, display
# ########### LATEX Style Display Matrix ###############
# def display_matrix(array):
#     """Display given numpy array with Latex format in Jupyter Notebook.
#     Args:
#         array (numpy array): Array to be displayed
#     """
#     data = ""
#     for line in array:
#         if len(line) == 1:
#             data += " %.3f &" % line + r" \\\n"
#             continue
#         for element in line:
#             data += " %.3f &" % element
#         data += r" \\" + "\n"
#     display(Math("\\begin{bmatrix} \n%s\\end{bmatrix}" % data))

In [None]:
# display_matrix(model.B[0]['weight'][:10,:10])

In [None]:
# display_matrix(torch.linalg.inv(model.Rh1)[:10,:10])

In [None]:
# torch.norm(model.B[0]['weight'] - torch.linalg.inv(model.Rh1))

In [None]:
# display_matrix(torch.linalg.inv(model.Rh2)[:10,:10])