In [1]:
import numpy as np
import sklearn
import os
import random
import math
import pickle

from tqdm import tqdm
from scipy.io import loadmat

np.random.seed(1)
import matplotlib.pyplot as plt

from sklearn.metrics import mean_squared_error


In [2]:
# Load the raw inputs/targets from disk.
# NOTE(security): pickle.load can execute arbitrary code embedded in the file;
# only load pickles that come from a trusted source.
# The context manager guarantees the file handle is closed even if loading fails.
with open("adaptive_data2.pickle", 'rb') as data_file:
    loaded_data = pickle.load(data_file)
X = loaded_data["X"]
Y = loaded_data["Y"]

In [3]:
# Stack inputs and targets column-wise so a single shuffle permutes them together.
# reshape((-1, 1)) lets NumPy infer the number of rows instead of hard-coding 151.
data = np.concatenate([X, Y.reshape((-1, 1))], axis=1)
# In-place row shuffle; draws from the global NumPy RNG seeded in the imports cell,
# so re-running this cell without re-seeding produces a different split.
np.random.shuffle(data)

# Fixed 50/50/50 split; any rows past index 149 are left unused.
train  = data[:50, :]
validation = data[50:100, :]
test = data[100:150, :]


# The target is the last (appended) column; every column before it is a feature.
X_train = train[:, :-1]
Y_train = train[:, -1]

X_valid = validation[:, :-1]
Y_valid = validation[:, -1]


X_test  = test[:, :-1]
Y_test  = test[:, -1]



In [4]:
# Bundle the three splits so other notebooks can reuse exactly the same partition.
Data1 = {
    "X_train" : X_train,
    "Y_train" : Y_train,
    "X_valid" : X_valid,
    "Y_valid" : Y_valid,
    "X_test"  : X_test,
    "Y_test"  : Y_test
}

# Create the output directory on a fresh checkout instead of failing with FileNotFoundError.
os.makedirs("Data", exist_ok=True)
# The context manager flushes and closes the file deterministically.
with open("Data/Data1.pickle", 'wb') as out_file:
    pickle.dump(Data1, out_file)


# Hyperparameters

In [None]:
# Module-level settings: Kernel reads Sigma_u and C_term as globals, and
# Noise_variance is passed to mtgp_fit.
C_term  = 1                                     # constant offset added to every kernel value
Sigma_u = np.identity(2) * math.pow(10, -1.5)   # 2x2 isotropic matrix used in the kernel's quadratic forms
Noise_variance = 0.001                          # added to the diagonal of the Gram matrix

# Gaussian Process fit and predict

In [None]:
def Kernel(x1, x2):  # K_input part of ICM kernel
    """Return the constant-plus-arcsine similarity between two input vectors.

    Reads the module-level globals ``Sigma_u`` (matrix used in the quadratic
    forms) and ``C_term`` (constant offset) at call time.

    Computes ``C_term + (2/pi) * asin(n / sqrt(d1 * d2))`` where
    ``n = 2 * x1 . Sigma_u . x2`` and ``d_k = 1 + 2 * x_k . Sigma_u . x_k``.
    See "Computing with infinite networks" for the expectation term and
    "Multitask Neural networks meet Multitask Gaussian Process" for the
    notation of the C-term and the expectation term.
    """
    def scaled_form(a, b):
        # 2 * a^T Sigma_u b
        return 2*np.dot(np.dot(a, Sigma_u), b)

    cross_term = scaled_form(x1, x2)
    norm_product = (1 + scaled_form(x1, x1)) * (1 + scaled_form(x2, x2))

    angle = math.asin(cross_term / math.sqrt(norm_product))
    return C_term + (2/np.pi) * angle




def mtgp_fit (X_train, Y_train, Noise_variance ): 
    """Fit the GP regressor by inverting the noisy Gram matrix.

    Parameters
    ----------
    X_train : indexable of length N; element ``i`` is passed to ``Kernel`` as one input.
    Y_train : training targets, multiplied by the inverted Gram matrix.
    Noise_variance : value added to every diagonal entry of the Gram matrix.

    Returns
    -------
    dict with keys "X_train", "Y_train", "Noise_variance", "C_inv" (inverse
    of the Gram matrix plus the noise diagonal) and "alpha" (``C_inv`` dotted
    with ``Y_train``).
    """
    n_points = len(X_train)

    # Pairwise kernel evaluations over the training inputs.
    gram = np.zeros((n_points, n_points))
    for row, col in np.ndindex(n_points, n_points):
        gram[row, col] = Kernel(X_train[row], X_train[col])

    # Diagonal noise term.
    noise = np.diag(np.full(n_points, Noise_variance))

    gram_inverse = np.linalg.inv(gram + noise)
    weights = np.dot(gram_inverse, Y_train)

    return {
        "X_train" :  X_train,
        "Y_train" :  Y_train,
        "Noise_variance" : Noise_variance,
        "C_inv"   :  gram_inverse,
        "alpha"   :  weights,
    }



def mtgp_predict(X,  model):
    """Predict targets for the query inputs ``X`` with a fitted model.

    ``model`` is the dict returned by ``mtgp_fit``; only its "X_train" and
    "alpha" entries are read. Returns the cross-kernel matrix between the
    training and query inputs, transposed and dotted with ``alpha``.
    """
    train_inputs = model["X_train"]

    # Rows index training points, columns index query points.
    cross = np.zeros((len(train_inputs), len(X)))
    for row, col in np.ndindex(*cross.shape):
        cross[row, col] = Kernel(train_inputs[row], X[col])

    return np.dot(cross.T, model["alpha"])




def get_stats (y_true, y_predict):
    """Return a dict of evaluation metrics for the predictions.

    The only entry is "msr": the result of ``mean_squared_error(y_true, y_predict)``.
    """
    return {"msr": mean_squared_error(y_true, y_predict)}



In [None]:
# Baseline: fit on the training split using the hyperparameters currently held in
# the module-level Sigma_u / C_term / Noise_variance, then score on the validation split.
model = mtgp_fit (X_train, Y_train, Noise_variance )
predict = mtgp_predict(X_valid,  model)
stats = get_stats(Y_valid, predict)
print("Validation Loss with True Hyperparameters :", stats['msr'])

Validation Loss with True Hyperparameters : 0.0012524983745783797


In [None]:
def get_Negative_Loss (
    Sigma_u_temp, noise_variance_temp
):
    """Objective for the hyperparameter search: negated validation MSE.

    Both arguments are log10 exponents. As a side effect this overwrites the
    module-level ``Sigma_u`` (``10**Sigma_u_temp`` times the 2x2 identity) and
    ``Noise_variance`` (``10**noise_variance_temp``), because ``Kernel`` reads
    ``Sigma_u`` from the global scope. The globals stay at the last probed
    values after the call returns.
    """
    global Sigma_u, Noise_variance

    Sigma_u = math.pow(10, Sigma_u_temp)*np.identity(2)
    Noise_variance = math.pow(10, noise_variance_temp)

    fitted = mtgp_fit(X_train, Y_train, Noise_variance)
    validation_scores = get_stats(Y_valid, mtgp_predict(X_valid, fitted))
    # Negated so that maximizing the objective minimizes the validation error.
    return -validation_scores['msr']


In [None]:
from bayes_opt import BayesianOptimization


# Search box for the optimizer. Both coordinates are log10 exponents:
# get_Negative_Loss raises 10 to these values before using them.
pbounds = dict(
    Sigma_u_temp=(-4, 2),
    noise_variance_temp=(-6, 0),
)

optimizer = BayesianOptimization(
    f=get_Negative_Loss,
    pbounds=pbounds,
    random_state=1,
)


In [None]:
# Run the hyperparameter search. Every evaluation calls get_Negative_Loss, which
# refits the GP on the training split and scores it on the validation split.
# NOTE(review): init_points is presumably the number of random probes and n_iter the
# number of guided steps — confirm against the installed bayes_opt version.
optimizer.maximize(
    init_points=200,
    n_iter=100,
)

|   iter    |  target   | Sigma_... | noise_... |
-------------------------------------------------
| [0m 1       [0m | [0m-0.001366[0m | [0m-1.498   [0m | [0m-1.678   [0m |
| [0m 2       [0m | [0m-0.02753 [0m | [0m-3.999   [0m | [0m-4.186   [0m |
| [0m 3       [0m | [0m-0.006324[0m | [0m-3.119   [0m | [0m-5.446   [0m |
| [0m 4       [0m | [0m-0.004972[0m | [0m-2.882   [0m | [0m-3.927   [0m |
| [95m 5       [0m | [95m-0.001274[0m | [95m-1.619   [0m | [95m-2.767   [0m |
| [0m 6       [0m | [0m-0.001285[0m | [0m-1.485   [0m | [0m-1.889   [0m |
| [0m 7       [0m | [0m-0.02218 [0m | [0m-2.773   [0m | [0m-0.7313  [0m |
| [0m 8       [0m | [0m-0.02674 [0m | [0m-3.836   [0m | [0m-1.977   [0m |
| [95m 9       [0m | [95m-0.001224[0m | [95m-1.496   [0m | [95m-2.648   [0m |
| [0m 10      [0m | [0m-0.005824[0m | [0m-3.158   [0m | [0m-4.811   [0m |
| [0m 11      [0m | [0m-0.001818[0m | [0m 0.8045  [0m | [0m-0.190

| [0m 103     [0m | [0m-0.001281[0m | [0m-1.66    [0m | [0m-3.084   [0m |
| [0m 104     [0m | [0m-0.001251[0m | [0m-0.3741  [0m | [0m-2.703   [0m |
| [0m 105     [0m | [0m-0.001398[0m | [0m 1.557   [0m | [0m-0.4876  [0m |
| [0m 106     [0m | [0m-0.007202[0m | [0m-1.631   [0m | [0m-0.2204  [0m |
| [0m 107     [0m | [0m-0.005572[0m | [0m-2.956   [0m | [0m-5.242   [0m |
| [0m 108     [0m | [0m-0.02048 [0m | [0m-3.19    [0m | [0m-2.966   [0m |
| [0m 109     [0m | [0m-0.08294 [0m | [0m-3.871   [0m | [0m-0.3122  [0m |
| [0m 110     [0m | [0m-0.01903 [0m | [0m 0.9627  [0m | [0m-5.91    [0m |
| [0m 111     [0m | [0m-0.005039[0m | [0m-2.943   [0m | [0m-4.008   [0m |
| [0m 112     [0m | [0m-0.02487 [0m | [0m-3.214   [0m | [0m-1.143   [0m |
| [0m 113     [0m | [0m-0.01071 [0m | [0m-1.932   [0m | [0m-0.3594  [0m |
| [0m 114     [0m | [0m-0.001741[0m | [0m-0.5079  [0m | [0m-0.727   [0m |
| [0m 115     

| [0m 203     [0m | [0m-0.001334[0m | [0m 1.999   [0m | [0m-0.5416  [0m |
| [0m 204     [0m | [0m-0.002193[0m | [0m-2.23    [0m | [0m-3.642   [0m |


In [None]:
# Show the best point found by the search; its 'params' entry holds the log10 exponents
# that the final evaluation cell reads back.
print(optimizer.max)

In [None]:
# Reset the globals to the reference ("true") hyperparameters. This is required because
# get_Negative_Loss overwrote Sigma_u and Noise_variance during the search, and
# Kernel reads Sigma_u / C_term from the global scope.
Sigma_u = math.pow(10, -1.5)*np.identity(2)
C_term  = 1
Noise_variance = 1e-3



# Fit on the training split and score on the held-out test split.
model = mtgp_fit (X_train, Y_train, Noise_variance )
predict = mtgp_predict(X_test,  model)
stats = get_stats(Y_test, predict)
print("Test Loss with True Hyperparameters : ", stats['msr'])



# Switch the globals to the best exponents found by the optimizer (stored as log10 values).
# They must be assigned before the fit below so that Kernel sees the new Sigma_u.
Sigma_u = math.pow(10, optimizer.max['params']["Sigma_u_temp"] )*np.identity(2)
C_term  = 1
Noise_variance = math.pow(10, optimizer.max['params']["noise_variance_temp"]  )


# Same train -> test evaluation, now with the tuned hyperparameters.
model = mtgp_fit (X_train, Y_train, Noise_variance )
predict = mtgp_predict(X_test,  model)
stats = get_stats(Y_test, predict)
print("Test Loss with BO Hyperparameters : ", stats['msr'])