In [2]:
import numpy as np
import matplotlib.pyplot as plt

In [3]:
%matplotlib notebook

In [4]:
def dataset_generator(init, end, sample, mean, var, function):
    """
    Return X,Y,t being:
    x input
    y deterministic output
    t data with noise
    """
    sample = int(sample)
    x = (np.array([np.linspace(init,end,sample)])).T
    y = (function(x))
    e = (np.array([np.random.normal(mean,var,sample)])).T
    t = y + e

    return x,y,t,e

In [5]:
def design_matrix(x,function,m):
    """
    Return the Phi matrix
    """  
    phi = np.zeros((len(x),m))
    mu = np.array([np.linspace(min(x),max(x),m)]).T
    for i in range(len(x)):
        for j in range(m):
            phi[i][j] = function(x[i],mu[j])    
    return phi

In [6]:
def fit(phi,t):
    """
    Return the model trained, i.e., W vector
    """
    w = np.linalg.pinv(phi)@t
    return w

In [7]:
def fit_l(phi,t,lda):
    """
    Return the model trained, i.e., W vector
    """
    I = np.identity(len(phi))
    
    w = phi.T@np.linalg.inv(lda*I+phi@phi.T)@t
    return w

In [8]:
def predict(phi,w):
    return phi@w

In [9]:
def split_data(x,t):
    from math import floor
    n = floor(len(x)/3)
    x_train , x_valid , x_test = x[0:n], x[n:2*n] , x[2*n:-1]
    t_train , t_valid , t_test = t[0:n], t[n:2*n] , t[2*n:-1]
    
    return x_train , x_valid , x_test, t_train , t_valid , t_test
    

In [10]:
def f_deterministic(x):
    """
    Return the deterministic function.
    """
    return 2*np.sin(np.pi*x) + 0*x

In [11]:
def f_basis(x,mu,s=1):
    """
    Return gaussian function with var = 1.
    """
    return np.e**(-(x-mu)**2 / s**2)   

#### Initializing

In [12]:
x,y,t,e = dataset_generator(0,12,100,0,0.8*2,f_deterministic)

In [13]:
plt.figure();
plt.plot(x,y,label='Deterministic');
plt.plot(x,t,'o',label='Data',markerfacecolor="None");
plt.legend();

<IPython.core.display.Javascript object>

m = 500;
phi = np.zeros((len(x),m))
mu = np.array([np.linspace(min(x),max(x),m)]).T
for i in range(len(x)):
    for j in range(m):
        phi[i][j] = f_basis(x[i],mu[j])
w = np.linalg.pinv(phi)@t
y_pred = phi@w

print(x.shape,t.shape,y_pred.shape)

In [14]:
phi = design_matrix(x,f_basis,len(x))
w = fit(phi,t)
y_pred = predict(phi,w)

In [15]:
plt.figure();
plt.plot(x,y,label='Deterministic');
plt.plot(x,t,'o',label='Data',markerfacecolor="None");
plt.plot(x,y_pred,'+',label='Prediction',markerfacecolor="None");
plt.legend();

<IPython.core.display.Javascript object>

In [16]:
x_train, x_valid, x_test, t_train, t_valid, t_test = split_data(x, t)

In [17]:
print(x_train.shape)
print(x_valid.shape)
print(x_test.shape)

(33, 1)
(33, 1)
(33, 1)


In [18]:
Error_train = [];
Error_valid = [];

#Concat Train and Validation X
x0 = np.append(x_train,x_valid)
x0 = np.reshape(x0,(len(x0),1))

#Concat Train and Validation T
t0 = np.append(t_train,t_valid)
t0 = np.reshape(t0,(len(t0),1))

for i in range(200):
    
    #Calculate train
    phi = design_matrix(x_train,f_basis,len(x_train))
    w = fit_l(phi,t_train,i)
    y_train = predict(phi,w)
    
    #Calculate validation
    phi_v = design_matrix(x_valid,f_basis,len(x_train))
    y_valid = predict(phi_v,w) 
    
    E_train = (sum((y_train - t_train) ** 2) / len(y_train)) ** 0.5
    E_valid = (sum((y_valid - t_valid) ** 2) / len(y_valid)) ** 0.5
    Error_train = np.append(Error_train,E_train)
    Error_valid = np.append(Error_valid,E_valid)
    
    #plt.figure()
    #plt.plot(x0,y_valid);
minimum = int(np.argmin(Error_train))

plt.figure()
plt.plot(np.arange(200),Error_valid,label="Validation");
plt.plot(np.arange(200),Error_train,label="Train");
#plt.yscale('log');
plt.xlim((0,40));
plt.legend();

<IPython.core.display.Javascript object>

In [19]:
interval = np.logspace(-26,12,1e3)
Error_train = [];
Error_valid = [];

#Concat Train and Validation X
x0 = np.append(x_train,x_valid)
x0 = np.reshape(x0,(len(x0),1))

#Concat Train and Validation T
t0 = np.append(t_train,t_valid)
t0 = np.reshape(t0,(len(t0),1))

for i in range(1000):
    
    #Calculate train
    phi = design_matrix(x_train,f_basis,len(x_train))
    w = fit_l(phi,t_train,interval[i])
    y_train = predict(phi,w)
    
    #Calculate validation
    phi_v = design_matrix(x_valid,f_basis,len(x_train))
    y_valid = predict(phi_v,w) 
    
    E_train = (sum((y_train - t_train) ** 2) / len(y_train)) ** 0.5
    E_valid = (sum((y_valid - t_valid) ** 2) / len(y_valid)) ** 0.5
    Error_train = np.append(Error_train,E_train)
    Error_valid = np.append(Error_valid,E_valid)
    
    #plt.figure()
    #plt.plot(x0,y_valid);

plt.figure()
plt.plot(interval,Error_valid,label="Validation");
plt.plot(interval,Error_train,label="Train");
plt.yscale('log');
plt.xscale('log');
#plt.xlim((0,40));
plt.legend();

<IPython.core.display.Javascript object>