## Simple example of TuRBO-1

In [1]:
cd ..

/home/mattyshen/NNTuRBO


In [2]:
from nnturbo import NNTurbo1
import numpy as np
import torch
import math
import matplotlib
import matplotlib.pyplot as plt

## Set up an optimization problem class

In [3]:
class Levy:
    def __init__(self, dim=10):
        self.dim = dim
        self.lb = -5 * np.ones(dim)
        self.ub = 10 * np.ones(dim)
        
    def __call__(self, x):
        assert len(x) == self.dim
        assert x.ndim == 1
        assert np.all(x <= self.ub) and np.all(x >= self.lb)
        w = 1 + (x - 1.0) / 4.0
        val = np.sin(np.pi * w[0]) ** 2 + \
            np.sum((w[1:self.dim - 1] - 1) ** 2 * (1 + 10 * np.sin(np.pi * w[1:self.dim - 1] + 1) ** 2)) + \
            (w[self.dim - 1] - 1) ** 2 * (1 + np.sin(2 * np.pi * w[self.dim - 1])**2)
        return val

f = Levy(10)

## Create a Turbo optimizer instance

In [4]:
turbo1 = NNTurbo1(
    f=f,  # Handle to objective function
    lb=f.lb,  # Numpy array specifying lower bounds
    ub=f.ub,  # Numpy array specifying upper bounds
    n_init=20,  # Number of initial bounds from an Latin hypercube design
    max_evals = 1000,  # Maximum number of evaluations
    batch_size=10,  # How large batch size TuRBO uses
    verbose=True,  # Print information from each batch
    use_ard=True,  # Set to true if you want to use ARD for the GP kernel
    max_cholesky_size=2000,  # When we switch from Cholesky to Lanczos
    n_training_steps=50,  # Number of steps of ADAM to learn the hypers
    min_cuda=1024,  # Run on the CPU for small datasets
    device="cuda",  # "cpu" or "cuda"
    dtype="float64",  # float64 or float32
    prop=1.2,
    p=2
)

Using dtype = torch.float64 
Using device = cpu


# Run the optimization process

In [5]:
turbo1.optimize()

Starting from fbest = 12.81
k: 1000
(1200, 10) (1000, 10)
(1000, 10) (1000, 10)
k: 833
(1200, 10) (833, 10)
(833, 10) (833, 10)
40) New best: 9.919
k: 833
(1200, 10) (833, 10)
(833, 10) (833, 10)
k: 694
(1200, 10) (694, 10)
(694, 10) (694, 10)
60) New best: 6.093
k: 694
(1200, 10) (694, 10)
(694, 10) (694, 10)
70) New best: 3.956
k: 694
(1200, 10) (694, 10)
(694, 10) (694, 10)
k: 578
(1200, 10) (578, 10)
(578, 10) (578, 10)
k: 481
(1200, 10) (481, 10)
(481, 10) (481, 10)
k: 400
(1200, 10) (400, 10)
(400, 10) (400, 10)
k: 333
(1200, 10) (333, 10)
(333, 10) (333, 10)
k: 277
(1200, 10) (277, 10)
(277, 10) (277, 10)
k: 230
(1200, 10) (230, 10)
(230, 10) (230, 10)
k: 191
(1200, 10) (191, 10)
(191, 10) (191, 10)
150) New best: 3.629
k: 191
(1200, 10) (191, 10)
(191, 10) (191, 10)
160) New best: 3.082
k: 191
(1200, 10) (191, 10)
(191, 10) (191, 10)


KeyboardInterrupt: 

## Extract all evaluations from Turbo and print the best

In [None]:
X = turbo1.X  # Evaluated points
fX = turbo1.fX  # Observed values
ind_best = np.argmin(fX)
f_best, x_best = fX[ind_best], X[ind_best, :]

print("Best value found:\n\tf(x) = %.3f\nObserved at:\n\tx = %s" % (f_best, np.around(x_best, 3)))

## Plot the progress
Each trust region is independent and finds different solutions

In [None]:
fig = plt.figure(figsize=(7, 5))
matplotlib.rcParams.update({'font.size': 16})
plt.plot(fX, 'b.', ms=10)  # Plot all evaluated points as blue dots
plt.plot(np.minimum.accumulate(fX), 'r', lw=3)  # Plot cumulative minimum as a red line
plt.xlim([0, len(fX)])
plt.ylim([0, 30])
plt.title("10D Levy function")

plt.tight_layout()
plt.show()