# Finding best model with Gaussian Process Regression (GPR)

In [1]:
# Enable IPython's autoreload extension in mode 2, so imported modules are
# reloaded before each cell is executed and edits to the project modules are
# picked up without restarting the kernel.
%load_ext autoreload
%autoreload 2

In [2]:
# Select the interactive "notebook" matplotlib backend for the figures below.
# NOTE(review): this backend targets the classic Notebook frontend; newer
# frontends generally need `%matplotlib widget` instead - confirm the target
# environment before changing it.
%matplotlib notebook

In [3]:
# import own modules
import run_gpr
from gpr_alg import plot_data

# import external modules
import warnings
import pandas as pd
import numpy as np
import sklearn.gaussian_process as gp

## Find best model

We start by performing a grid search to find the best model for the given dataset. The output is saved in a file.

In [4]:
# Read the pickled grid-search results (one row per fitted kernel) and show them.
# Unpickling can execute arbitrary code, so only load files from a trusted source.
model_stats = pd.read_pickle(
    'output/data/grid_search_stats_2D_100_iterations.pkl'
)
model_stats

model_stats

Unnamed: 0,kernel,stats,pred_mean,pred_cov
0,RBF: {'length_scale': 9.999999999999997e-06},0.100028,"[-0.421499462109478, 0.5101733594488375, 1.416...","[[1.4999997743903037e-07, 0.0, 0.0, 0.0, 0.0, ..."
6,RationalQuadratic: {'length_scale': 0.15913862...,0.000202,"[-0.4213950213516, 0.5098295751981823, 1.41672...","[[1.4942326675981832e-07, 2.4014882304967955e-..."
7,RationalQuadratic: {'length_scale': 0.15913854...,0.000202,"[-0.4213950212870259, 0.5098295749648969, 1.41...","[[1.494232663157291e-07, 2.4014920052550792e-0..."
8,RationalQuadratic: {'length_scale': 0.15913887...,0.000202,"[-0.42139502060763334, 0.5098295733528175, 1.4...","[[1.494232619858593e-07, 2.4015088806450535e-0..."
9,RationalQuadratic: {'length_scale': 0.15913857...,0.000202,"[-0.4213950215303157, 0.5098295756620246, 1.41...","[[1.4942326842515286e-07, 2.4014830124485798e-..."
10,RationalQuadratic: {'length_scale': 0.15729480...,0.000207,"[-0.4213947505691067, 0.5098275695791017, 1.41...","[[1.4941477755048282e-07, 2.4469027914975072e-..."
11,RationalQuadratic: {'length_scale': 0.15913860...,0.000202,"[-0.42139502123200145, 0.5098295748562123, 1.4...","[[1.494232658716399e-07, 2.401492893433499e-09..."
12,RBF + WhiteKernel: {'k1': RBF(length_scale=0.1...,0.001074,"[-0.42018575507188416, 0.506825004755342, 1.41...","[[1.5026264549522494e-05, 4.2079478435042006e-..."
13,RationalQuadratic + WhiteKernel: {'k1': Ration...,0.001069,"[-0.42018710332081355, 0.5068359025285645, 1.4...","[[1.5026467141243671e-05, 4.200481308336279e-0..."


In [5]:
# Order the models by the 'stats' column, ascending, so the lowest value comes first
model_stats = model_stats.sort_values('stats')
model_stats

Unnamed: 0,kernel,stats,pred_mean,pred_cov
9,RationalQuadratic: {'length_scale': 0.15913857...,0.000202,"[-0.4213950215303157, 0.5098295756620246, 1.41...","[[1.4942326842515286e-07, 2.4014830124485798e-..."
6,RationalQuadratic: {'length_scale': 0.15913862...,0.000202,"[-0.4213950213516, 0.5098295751981823, 1.41672...","[[1.4942326675981832e-07, 2.4014882304967955e-..."
11,RationalQuadratic: {'length_scale': 0.15913860...,0.000202,"[-0.42139502123200145, 0.5098295748562123, 1.4...","[[1.494232658716399e-07, 2.401492893433499e-09..."
7,RationalQuadratic: {'length_scale': 0.15913854...,0.000202,"[-0.4213950212870259, 0.5098295749648969, 1.41...","[[1.494232663157291e-07, 2.4014920052550792e-0..."
8,RationalQuadratic: {'length_scale': 0.15913887...,0.000202,"[-0.42139502060763334, 0.5098295733528175, 1.4...","[[1.494232619858593e-07, 2.4015088806450535e-0..."
10,RationalQuadratic: {'length_scale': 0.15729480...,0.000207,"[-0.4213947505691067, 0.5098275695791017, 1.41...","[[1.4941477755048282e-07, 2.4469027914975072e-..."
13,RationalQuadratic + WhiteKernel: {'k1': Ration...,0.001069,"[-0.42018710332081355, 0.5068359025285645, 1.4...","[[1.5026467141243671e-05, 4.200481308336279e-0..."
12,RBF + WhiteKernel: {'k1': RBF(length_scale=0.1...,0.001074,"[-0.42018575507188416, 0.506825004755342, 1.41...","[[1.5026264549522494e-05, 4.2079478435042006e-..."
0,RBF: {'length_scale': 9.999999999999997e-06},0.100028,"[-0.421499462109478, 0.5101733594488375, 1.416...","[[1.4999997743903037e-07, 0.0, 0.0, 0.0, 0.0, ..."


In [6]:
# Print every kernel description in full, one per line, in the current row order
# (the table view above truncates them).
for kernel_description in model_stats['kernel']:
    print(kernel_description)

RationalQuadratic: {'length_scale': 0.15913857726527236, 'alpha': 152.52603529387923}
RationalQuadratic: {'length_scale': 0.15913862459150105, 'alpha': 152.52661317136554}
RationalQuadratic: {'length_scale': 0.15913860757995552, 'alpha': 152.53100675073813}
RationalQuadratic: {'length_scale': 0.15913854562471424, 'alpha': 152.53472939754778}
RationalQuadratic: {'length_scale': 0.15913887331469131, 'alpha': 152.52482797924992}
RationalQuadratic: {'length_scale': 0.15729480994376585, 'alpha': 99978.79394262172}
RationalQuadratic + WhiteKernel: {'k1': RationalQuadratic(alpha=622, length_scale=0.166), 'k2': WhiteKernel(noise_level=1e-05), 'k1__length_scale': 0.1660521052802018, 'k1__alpha': 622.2597381115439, 'k1__length_scale_bounds': (1e-05, 100000.0), 'k1__alpha_bounds': (1e-05, 100000.0), 'k2__noise_level': 9.999999999999997e-06, 'k2__noise_level_bounds': (1e-05, 100000.0)}
RBF + WhiteKernel: {'k1': RBF(length_scale=0.166), 'k2': WhiteKernel(noise_level=1e-05), 'k1__length_scale': 0.16

We discard the first two options because, for both kernels, at least one parameter is very close to the specified bounds. Moreover, with the third kernel the mean absolute error is still extremely low.

In [7]:
# Take the first row of the sorted table, i.e. the model with the smallest
# mean absolute error, and keep its predictive mean and covariance.
# NOTE(review): the markdown above talks about discarding the first two
# options, yet this cell selects row 0 - confirm which row is intended.
mean_prediction = model_stats['pred_mean'].iloc[0]
cov_prediction = model_stats['pred_cov'].iloc[0]

print(f"Kernel: {model_stats['kernel'].iloc[0]}")
print(f"Mean absolut error: {model_stats['stats'].iloc[0]}")

Kernel: RationalQuadratic: {'length_scale': 0.15913857726527236, 'alpha': 152.52603529387923}
Mean absolut error: 0.0002019931771002801


In [8]:
# Build the 2D grid, the training subset and the data values without added noise
(
    grid_x1,
    grid_x2,
    grid_train,
    full_grid,
    data_train,
    data,
) = run_gpr.create_2D_data(add_noise=False)

applying conditions
train set size: 0.79


In [9]:
# Surface plot of the original data, reshaped to the 2D layout of the grid
plot_data.make_3D_surface_plot(
    x=grid_x1,
    y=grid_x2,
    z=data.reshape(np.shape(grid_x1)[:2]),
    file_name='output/images/original_data.png',
)

<IPython.core.display.Javascript object>

In [10]:
# Surface plot of the predicted mean, reshaped to the 2D layout of the grid
plot_data.make_3D_surface_plot(
    x=grid_x1,
    y=grid_x2,
    z=mean_prediction.reshape(np.shape(grid_x1)[:2]),
    file_name='output/images/fitted_data.png',
)

<IPython.core.display.Javascript object>

In [11]:
# Absolute difference between the original data and the predicted mean,
# both arranged on the 2D grid layout
error = np.abs(
    data.reshape(np.shape(grid_x1)[:2])
    - mean_prediction.reshape(np.shape(grid_x1)[:2])
)
# Contour plot of the error with the training points overlaid
plot_data.make_3D_contour_plot(
    x=grid_x1,
    y=grid_x2,
    z=error,
    add_train=True,
    x_train=grid_train[:, 0],
    y_train=grid_train[:, 1],
    file_name='output/images/error.png',
)

<IPython.core.display.Javascript object>

In [12]:
# Plot posteriors from the predicted mean and covariance (posterior_nums=5)
# together with the original data on the grid
posteriors = plot_data.plot_posteriors(
    x=grid_x1,
    y=grid_x2,
    z=data.reshape(np.shape(grid_x1)[:2]),
    mean_pred=mean_prediction.flatten(),
    cov_pred=cov_prediction,
    posterior_nums=5,
    add_train_ind=False,
    x_train_val=grid_train,
    file_name='output/images/posteriors.png',
)

<IPython.core.display.Javascript object>

## Fit specific model