# Santa Fe Benchmark, ProbM

In [1]:
from pycgp.benchmarks.santafe import PARAMS, EV_PARAMS, X, santafe_cost_function
from pycgp.evolution import evolution
import numpy as np
import random

In [2]:
def run_experiment(params, ev_params, x):
    rstat = []
    for i in range(0, 20):
        print(i, end=', ')

        result = evolution(PARAMS, EV_PARAMS, X, None)

        rstat.append([santafe_cost_function(None, individual.execute(X)) for individual in result['final']])
    
    #print('Best fitness: {}'.format(np.min(stats)))
    #print('mean and std of fitness of last generation: {}, {}'.format(np.mean(stats), np.std(stats)))
    #print('Mean and std of best fitness: {}, {}'.format(np.mean(np.min(stats, axis=1)), np.std(np.min(stats, axis=1))))
    # best fitness, mean of last generation, std of last generation, mean of best individual, std of best individual
    results = [
        np.min(rstat), np.mean(rstat), np.std(rstat), np.mean(np.min(rstat, axis=1)), np.std(np.min(rstat, axis=1)) 
    ]
    print(results)
    return results
    

## Probabilistic mutation

In [3]:
from pycgp.mutation import probabilistic_mutation
from pycgp.gems import GemSM, MatchSMStrategy
all_measurements = {}
EV_PARAMS['mutation'] = probabilistic_mutation
EV_PARAMS['gem_type'] = GemSM
EV_PARAMS['match_strategy'] = MatchSMStrategy

### ProbM, 10 nodes

In [4]:
%%time
random.seed(1)

PARAMS['n_cols']      = 10
EV_PARAMS['gems']     = False

all_measurements['10,false'] = run_experiment(PARAMS, EV_PARAMS, X)

0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, [-39, -5.2800000000000002, 7.2209140695621077, -16.5, 7.807048097712733]
CPU times: user 1min 50s, sys: 143 ms, total: 1min 51s
Wall time: 1min 51s


### ProbM, 50 nodes

In [5]:
%%time
stats = []; random.seed(1);

PARAMS['n_cols']      = 50
EV_PARAMS['gems']     = False

all_measurements['50,false'] = run_experiment(PARAMS, EV_PARAMS, X)

0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, [-88, -18.640000000000001, 23.640862928412741, -62.100000000000001, 12.581335382223939]
CPU times: user 3min 56s, sys: 64 ms, total: 3min 56s
Wall time: 3min 57s


### ProbM, 100 nodes

In [6]:
%%time
stats = []; random.seed(1);

PARAMS['n_cols']      = 100
EV_PARAMS['gems']     = False

all_measurements['100,false'] = run_experiment(PARAMS, EV_PARAMS, X)

0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, [-89, -29.84, 33.064397771621366, -80.349999999999994, 10.42245172692107]
CPU times: user 9min 20s, sys: 260 ms, total: 9min 21s
Wall time: 9min 21s


### ProbM, 10 nodes, Gems

In [7]:
%%time
stats = []; random.seed(1);

PARAMS['n_cols']      = 10
EV_PARAMS['gems']     = True
EV_PARAMS['j_box_size'] = 5

all_measurements['10,false,5'] = run_experiment(PARAMS, EV_PARAMS, X)

0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, [-27, -4.7699999999999996, 6.4650676717262598, -15.949999999999999, 5.6962707098592151]
CPU times: user 1min 35s, sys: 24 ms, total: 1min 35s
Wall time: 1min 35s


### ProbM, 50 nodes, Gems

In [8]:
%%time
stats = []; random.seed(1);

PARAMS['n_cols']      = 50
EV_PARAMS['gems']     = True
EV_PARAMS['j_box_size'] = 5

all_measurements['50,false,5'] = run_experiment(PARAMS, EV_PARAMS, X)

0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, [-88, -18.640000000000001, 23.640862928412741, -62.100000000000001, 12.581335382223939]
CPU times: user 4min 8s, sys: 152 ms, total: 4min 9s
Wall time: 4min 9s


### ProbM, 100 nodes, Gems

In [9]:
%%time
stats = []; random.seed(1);

PARAMS['n_cols']      = 100
EV_PARAMS['gems']     = True
EV_PARAMS['j_box_size'] = 5

all_measurements['100,false,5'] = run_experiment(PARAMS, EV_PARAMS, X)

0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, [-89, -29.84, 33.064397771621366, -80.349999999999994, 10.42245172692107]
CPU times: user 9min 57s, sys: 360 ms, total: 9min 58s
Wall time: 9min 58s


## jBox size 10

In [10]:
%%time
stats = []; random.seed(1);

PARAMS['n_cols']        = 10
EV_PARAMS['gems']       = True
EV_PARAMS['j_box_size'] = 10

all_measurements['10,false,10'] = run_experiment(PARAMS, EV_PARAMS, X)

0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, [-28, -4.5899999999999999, 6.6529617464705151, -16.350000000000001, 5.7902936022277833]
CPU times: user 1min 51s, sys: 64 ms, total: 1min 51s
Wall time: 1min 51s


In [11]:
%%time
stats = []; random.seed(1);

PARAMS['n_cols']        = 50
EV_PARAMS['gems']       = True
EV_PARAMS['j_box_size'] = 10

all_measurements['50,false,10'] = run_experiment(PARAMS, EV_PARAMS, X)

0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, [-88, -18.640000000000001, 23.640862928412741, -62.100000000000001, 12.581335382223939]
CPU times: user 4min 8s, sys: 52 ms, total: 4min 8s
Wall time: 4min 8s


In [12]:
%%time
stats = []; random.seed(1);

PARAMS['n_cols']        = 100
EV_PARAMS['gems']       = True
EV_PARAMS['j_box_size'] = 10

all_measurements['100,false,10'] = run_experiment(PARAMS, EV_PARAMS, X)

0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, [-89, -29.84, 33.064397771621366, -80.349999999999994, 10.42245172692107]
CPU times: user 10min, sys: 492 ms, total: 10min 1s
Wall time: 10min 1s


# Summary

In [13]:
import pandas as pd
df = pd.DataFrame.from_dict(all_measurements, orient='index')
df.columns = ['best fitness', 'mean of last gen', 'std of last gen', 'mean of best individual', 'std of best indvidiual']
df

Unnamed: 0,best fitness,mean of last gen,std of last gen,mean of best individual,std of best indvidiual
"10,false",-39,-5.28,7.220914,-16.5,7.807048
"50,false",-88,-18.64,23.640863,-62.1,12.581335
"100,false",-89,-29.84,33.064398,-80.35,10.422452
"10,false,5",-27,-4.77,6.465068,-15.95,5.696271
"50,false,5",-88,-18.64,23.640863,-62.1,12.581335
"100,false,5",-89,-29.84,33.064398,-80.35,10.422452
"10,false,10",-28,-4.59,6.652962,-16.35,5.790294
"50,false,10",-88,-18.64,23.640863,-62.1,12.581335
"100,false,10",-89,-29.84,33.064398,-80.35,10.422452


## Summary

** Without gems **

| nodes | time     | max fitness | last gen mean | last gen std | best ind mean | best ind std |
|-------|----------|------------:|------------  :|-------------:|--------------:|-------------:|
| 10    |  1min 36s| 89          | 23.4          | 18.56        | 36.4          | 18.58        |
| 50    |  5min 47s| 89          | 47.32         | 28.03        | 53.95         | 26.74        |
| 100   |  17min 3s| 89          | 56.41         | 25.79        | 63.15         | 23.87        |

** With gems, jbox 5 **

| nodes | time     | max fitness | last gen mean | last gen std | best ind mean | best ind std |
|-------|----------|------------:|------------  :|-------------:|--------------:|-------------:|
| 10    |  1min 59s| 89          | 21.73         | 24.19        | 33.5          | 28.36        |
| 50    |  5min 56s| 89          | 54.25         | 31.27        | 61.85         | 28.01        |
| 100   | 17min 57s| 89          | 52.43         | 27.61        | 56.35         | 25.74        |

** With gems, jbox 10 **

| nodes | time     | max fitness | last gen mean | last gen std | best ind mean | best ind std |
|-------|----------|------------:|------------  :|-------------:|--------------:|-------------:|
| 10    |  1min 46s| 89          | 19.93         | 20.56        | 32.15         | 24.41        |
| 50    |  5min  6s| 89          | 43.21         | 30.97        | 48.45         | 29.54        |
| 100   | 20min  8s| 89          | 55.48         | 24.47        | 63.15         | 21.54        |