- Default PSO parameters
- max_back=20

In [18]:
import random

import numpy as np
from sklearn.metrics import mean_squared_error
import matplotlib.pyplot as plt
import seaborn as sns

import tengp
import symreg
from gpbenchmarks import get_data

from experiment_settings import nguyen7_funset, pagie_funset, keijzer_funset, korns12_funset, vlad_funset

def plot_results(name, outs):
    """Print summary statistics of ``outs`` and draw their histogram.

    Parameters
    ----------
    name : str
        Label printed before the statistics and used as the figure title.
    outs : sequence of numbers
        Cost values to summarise; converted to a NumPy array first.
    """
    print(name)
    cost_values = np.array(outs)

    # (label, reducer) pairs, printed in this exact order.
    summary = (
        ('min:', np.min),
        ('mean:', np.mean),
        ('median:', np.median),
        ('variance:', np.var),
    )
    for label, reducer in summary:
        print(label, reducer(cost_values))

    # A fresh figure per call so successive plots do not overlap.
    plt.figure()
    plt.title(name)
    sns.distplot(cost_values, kde=False)
    

def run_experiment(data_item, cost_function, n_runs=3, generations=20,
                   pop_size=50, seed=42):
    """Run several independent PSO optimisations on one benchmark.

    Parameters
    ----------
    data_item : tuple
        ``(name, (x_train, y_train, x_test, y_test), params)``. Only the name,
        the training split and ``params`` are used here.
    cost_function : callable
        Called as ``cost_function(X, Y, params, bounds)``; the result is
        wrapped in ``pg.problem``.
    n_runs : int, optional
        Number of independent PSO runs (default 3).
    generations : int, optional
        Value passed as ``gen`` to ``pg.pso`` (default 20).
    pop_size : int, optional
        Size of each ``pg.population`` (default 50).
    seed : int or None, optional
        Seed given to ``pg.set_global_rng_seed`` once before the runs
        (default 42). ``None`` leaves pygmo's global RNG untouched.

    Returns
    -------
    tuple of (list, list)
        ``results[i]`` is the champion fitness of run ``i`` and ``logs[i]``
        is the PSO log returned by ``get_log()`` for that run.
    """
    results = []
    logs = []

    name, (x_train, y_train, x_test, y_test), params = data_item
    print(name)

    # A throw-away individual is built only to obtain a copy of the bounds.
    bounds = tengp.individual.IndividualBuilder(params).create().bounds[:]

    # Append a column of ones to the training inputs before building the problem.
    x_with_ones = np.c_[x_train, np.ones(len(x_train))]
    prob = pg.problem(cost_function(x_with_ones, y_train, params, bounds))

    if seed is not None:
        pg.set_global_rng_seed(seed)

    for i in range(n_runs):
        print(i, end=',')
        algo = pg.algorithm(pg.pso(gen=generations))
        # The log retrieved below is read after enabling verbosity.
        algo.set_verbosity(1)
        pop = pg.population(prob, pop_size)
        pop = algo.evolve(pop)
        results.append(pop.champion_f[0])

        uda = algo.extract(pg.pso)
        logs.append(uda.get_log())

    return results, logs

In [2]:
import pygmo as pg

class cost_function:
    """Problem object exposing ``fitness`` and ``get_bounds``.

    Each candidate vector is turned into a ``tengp`` ``NPIndividual`` and
    scored by the mean squared error of its output against ``Y``.
    """

    def __init__(self, X, Y, params, bounds):
        """Store the inputs ``X``, targets ``Y``, ``params`` and ``bounds``."""
        self.X = X
        self.Y = Y
        self.params = params
        self.bounds = bounds

    def fitness(self, x):
        """Return a one-element list holding the cost of candidate ``x``.

        The cost is the mean squared error of the individual's output on
        ``self.X``. If ``mean_squared_error`` raises ``ValueError`` a fixed
        penalty of 10000000000 is returned instead.
        """
        candidate = tengp.individual.NPIndividual(list(x), self.bounds, self.params)
        predicted = candidate.transform(self.X)

        # Only the error computation is guarded; transform errors propagate.
        try:
            error = mean_squared_error(predicted, self.Y)
        except ValueError:
            return [10_000_000_000]
        return [error]

    def get_bounds(self):
        """Return the bounds object supplied at construction."""
        return self.bounds

In [3]:
# Keyword options shared by every tengp.Parameters instance below.
kw_params = {'real_valued': True, 'max_back': 20}


def _make_params(first_arg, funset):
    """Build ``tengp.Parameters(first_arg, 1, 1, 50, funset, **kw_params)``.

    ``first_arg`` is presumably the number of inputs, and ``1, 1, 50`` the
    outputs/rows/columns -- TODO confirm against the tengp API.
    """
    return tengp.Parameters(first_arg, 1, 1, 50, funset, **kw_params)


# All three Nguyen benchmarks use nguyen7_funset.
params_nguyen4 = _make_params(2, nguyen7_funset)
params_nguyen7 = _make_params(2, nguyen7_funset)
params_nguyen10 = _make_params(3, nguyen7_funset)
params_pagie1 = _make_params(2, pagie_funset)
params_keijzer6 = _make_params(2, keijzer_funset)
params_korns = _make_params(6, korns12_funset)
params_vlad = _make_params(6, vlad_funset)

# NOTE(review): params_nguyen4 and params_nguyen10 are not in this list --
# confirm whether that omission is intentional.
all_params = [params_nguyen7, params_pagie1, params_keijzer6, params_korns, params_vlad]

In [4]:
import random 

# Seed Python's RNG before building the data sets so the benchmark data is the
# same after every kernel restart (the PSO runs are already seeded with 42).
# Assumes the symreg helpers draw from the `random` module passed in -- TODO confirm.
random.seed(42)

# Each entry is (benchmark name, benchmark data, tengp parameters).
data = [
    ('nguyen4', symreg.get_benchmark_poly(random, 6), params_nguyen4),
    ('nguyen7', symreg.get_benchmark_nguyen7(random, None), params_nguyen7),
    ('nguyen10', symreg.get_benchmark_nguyen10(random, None), params_nguyen10),
    ('pagie1', symreg.get_benchmark_pagie1(random, None), params_pagie1),
    ('keijzer6', symreg.get_benchmark_keijzer(random, 6), params_keijzer6),
    ('korns12', symreg.get_benchmark_korns(random, 12), params_korns),
    ('vladislasleva4', symreg.get_benchmark_vladislasleva4(random, None), params_vlad)
]

In [33]:
import os

# Folder (with trailing slash) that receives every pickled result and log.
OUTPUT_FOLDER = 'results/pso_default_20_demo/'
# Create it up front: the pickle dumps open files inside this folder and would
# otherwise raise FileNotFoundError when it does not exist yet.
os.makedirs(OUTPUT_FOLDER, exist_ok=True)

# Nguyen 4

In [19]:
%%time

# Run the PSO experiment on data[0] (the 'nguyen4' entry); keeps the
# per-run champion fitness values and the per-run PSO logs.
ng4_res, ng4_log = run_experiment(data[0], cost_function)

nguyen4
0,1,2,CPU times: user 3.8 s, sys: 31.2 ms, total: 3.83 s
Wall time: 3.88 s


In [35]:
import pickle

# Context managers make sure each pickle file is flushed and closed.
with open(f'{OUTPUT_FOLDER}ng4_res_100_000evals', 'wb') as res_file:
    pickle.dump(ng4_res, res_file)
with open(f'{OUTPUT_FOLDER}ng4_log_100_000evals', 'wb') as log_file:
    pickle.dump(ng4_log, log_file)

# Nguyen 7


In [39]:
%%time

# Run the PSO experiment on data[1] (the 'nguyen7' entry); keeps the
# per-run champion fitness values and the per-run PSO logs.
ng7_res, ng7_log = run_experiment(data[1], cost_function)

nguyen7
0,1,2,CPU times: user 3.98 s, sys: 15.6 ms, total: 4 s
Wall time: 4.07 s


In [40]:
# Context managers make sure each pickle file is flushed and closed.
with open(f'{OUTPUT_FOLDER}ng7_res_100_000evals', 'wb') as res_file:
    pickle.dump(ng7_res, res_file)
with open(f'{OUTPUT_FOLDER}ng7_log_100_000evals', 'wb') as log_file:
    pickle.dump(ng7_log, log_file)

# Nguyen 10

In [41]:
%%time

# Run the PSO experiment on data[2] (the 'nguyen10' entry); keeps the
# per-run champion fitness values and the per-run PSO logs.
ng10_res, ng10_log = run_experiment(data[2], cost_function)

nguyen10
0,1,2,CPU times: user 4.25 s, sys: 31.2 ms, total: 4.28 s
Wall time: 4.33 s


In [42]:
# Context managers make sure each pickle file is flushed and closed.
with open(f'{OUTPUT_FOLDER}ng10_res_100_000evals', 'wb') as res_file:
    pickle.dump(ng10_res, res_file)
with open(f'{OUTPUT_FOLDER}ng10_log_100_000evals', 'wb') as log_file:
    pickle.dump(ng10_log, log_file)

# Pagie

In [43]:
%%time

# Run the PSO experiment on data[3] (the 'pagie1' entry); keeps the
# per-run champion fitness values and the per-run PSO logs.
pag1_res, pag1_log = run_experiment(data[3], cost_function)

pagie1
0,

  l = (1-a)*f_l(L, U)
  return  np.sqrt(x)
  l = (1-a)*f_l(L, U)
  l = (1-a)*f_l(L, U)
  u = a*f_u(L, U)
  return np.divide(x, y, out=np.copy(x), where=x!=0)
  u = a*f_u(L, U)
  return l + u
  return np.log(x, out=np.copy(x), where=x>0)
  u = a*f_u(L, U)
  u = a*f_u(L, U)
  l = (1-a)*f_l(L, U)
  value = (1-coeff)*self.nodes[lower].value + coeff*self.nodes[upper].value
  U = (1-c)*x_l2 + c*x_u2
  L = (1-b)*x_l1 + b*x_u1
  l = (1-a)*f_l(L, U)
  U = (1-c)*x_l2 + c*x_u2
  L = (1-b)*x_l1 + b*x_u1
  u = a*f_u(L, U)
  return np.divide(x, y, out=np.copy(x), where=x!=0)
  return np.divide(x, y, out=np.copy(x), where=x!=0)
  l = (1-a)*f_l(L, U)
  value = (1-coeff)*self.nodes[lower].value + coeff*self.nodes[upper].value
  return x**(-1)
  l = (1-a)*f_l(L, U)
  u = a*f_u(L, U)


1,

  u = a*f_u(L, U)


2,

  return umr_sum(a, axis, dtype, out, keepdims)
  l = (1-a)*f_l(L, U)
  u = a*f_u(L, U)


CPU times: user 5.8 s, sys: 0 ns, total: 5.8 s
Wall time: 5.95 s


In [44]:
# Context managers make sure each pickle file is flushed and closed.
with open(f'{OUTPUT_FOLDER}pag1_res_100_000evals', 'wb') as res_file:
    pickle.dump(pag1_res, res_file)
with open(f'{OUTPUT_FOLDER}pag1_log_100_000evals', 'wb') as log_file:
    pickle.dump(pag1_log, log_file)

# Keijzer 6

In [46]:
%%time

# Run the PSO experiment on data[4] (the 'keijzer6' entry).
kei6_res, kei6_log = run_experiment(data[4], cost_function)

# Context managers make sure each pickle file is flushed and closed.
with open(f'{OUTPUT_FOLDER}kei6_res_100_000evals', 'wb') as res_file:
    pickle.dump(kei6_res, res_file)
with open(f'{OUTPUT_FOLDER}kei6_log_100_000evals', 'wb') as log_file:
    pickle.dump(kei6_log, log_file)

keijzer6
0,

  return  np.sqrt(x)
  return np.log(x, out=np.copy(x), where=x>0)


1,2,CPU times: user 3.95 s, sys: 31.2 ms, total: 3.98 s
Wall time: 4.04 s


# Korns 12

In [47]:
%%time

# Run the PSO experiment on data[5] (the 'korns12' entry).
korns12_res, korns12_log = run_experiment(data[5], cost_function)

# Context managers make sure each pickle file is flushed and closed.
with open(f'{OUTPUT_FOLDER}korns12_res_100_000evals', 'wb') as res_file:
    pickle.dump(korns12_res, res_file)
with open(f'{OUTPUT_FOLDER}korns12_log_100_000evals', 'wb') as log_file:
    pickle.dump(korns12_log, log_file)

korns12
0,

  return  np.sqrt(x)
  return np.exp(x)
  return np.log(x, out=np.copy(x), where=x>0)
  return x**2
  return x**3
  return l + u
  return np.sin(x)
  l = (1-a)*f_l(L, U)
  return np.divide(x, y, out=np.copy(x), where=x!=0)
  return np.cos(x)
  return np.tan(x)
  u = a*f_u(L, U)
  l = (1-a)*f_l(L, U)
  u = a*f_u(L, U)
  U = (1-c)*x_l2 + c*x_u2
  L = (1-b)*x_l1 + b*x_u1
  value = (1-coeff)*self.nodes[lower].value + coeff*self.nodes[upper].value
  value = (1-coeff)*self.nodes[lower].value + coeff*self.nodes[upper].value
  l = (1-a)*f_l(L, U)
  L = (1-b)*x_l1 + b*x_u1
  U = (1-c)*x_l2 + c*x_u2
  u = a*f_u(L, U)
  u = a*f_u(L, U)
  return umr_sum(a, axis, dtype, out, keepdims)
  output_errors = np.average((y_true - y_pred) ** 2, axis=0,
  value = (1-coeff)*self.nodes[lower].value + coeff*self.nodes[upper].value
  return np.divide(x, y, out=np.copy(x), where=x!=0)


1,

  l = (1-a)*f_l(L, U)


2,CPU times: user 48.4 s, sys: 1.06 s, total: 49.5 s
Wall time: 50 s


# Vladislavleva 4

In [48]:
%%time

# Run the PSO experiment on data[6] (the 'vladislasleva4' entry).
vlad4_res, vlad4_log = run_experiment(data[6], cost_function)

# Context managers make sure each pickle file is flushed and closed.
with open(f'{OUTPUT_FOLDER}vlad4_res_100_000evals', 'wb') as res_file:
    pickle.dump(vlad4_res, res_file)
with open(f'{OUTPUT_FOLDER}vlad4_log_100_000evals', 'wb') as log_file:
    pickle.dump(vlad4_log, log_file)

vladislasleva4
0,

  u = a*f_u(L, U)
  return  np.sqrt(x)
  return np.log(x, out=np.copy(x), where=x>0)
  return np.exp(x)
  l = (1-a)*f_l(L, U)
  u = a*f_u(L, U)
  return np.sin(x)
  return np.cos(x)
  l = (1-a)*f_l(L, U)
  u = a*f_u(L, U)
  return l + u
  l = (1-a)*f_l(L, U)
  return np.divide(x, y, out=np.copy(x), where=x!=0)
  l = (1-a)*f_l(L, U)
  U = (1-c)*x_l2 + c*x_u2
  u = a*f_u(L, U)
  value = (1-coeff)*self.nodes[lower].value + coeff*self.nodes[upper].value
  L = (1-b)*x_l1 + b*x_u1
  value = (1-coeff)*self.nodes[lower].value + coeff*self.nodes[upper].value
  U = (1-c)*x_l2 + c*x_u2
  L = (1-b)*x_l1 + b*x_u1
  return umr_sum(a, axis, dtype, out, keepdims)
  u = a*f_u(L, U)
  return np.divide(x, y, out=np.copy(x), where=x!=0)
  l = (1-a)*f_l(L, U)
  u = a*f_u(L, U)
  return x**(-1)
  return np.divide(x, y, out=np.copy(x), where=x!=0)
  output_errors = np.average((y_true - y_pred) ** 2, axis=0,
  l = (1-a)*f_l(L, U)
  u = a*f_u(L, U)
  l = (1-a)*f_l(L, U)


1,

  u = a*f_u(L, U)


2,CPU times: user 6.53 s, sys: 46.9 ms, total: 6.58 s
Wall time: 6.59 s
