### Imports

In [1]:
# If updates on imported files aren't detected, restart the kernel (we'll need to find an automatic solution for this)

import numpy as np
from icecream import ic

from typing import List, Tuple, Dict


### Evolution Helper

In [2]:
import random
from typing import List
from gxgp.node import Node
from utils.operations_dict import basic_function_set, complex_function_set

### Tree Generation

In [3]:
def generate_random_tree(max_height: int, pc: float, terminal_list: List[str],
                         constants: list[float] = None, p_pick_constant: float = 0.2, p_cut_tree: float = 0.2,
                         verbose: bool = False, cur_depth: int = 0) -> Node:
    """
    Generate a random symbolic expression tree.

    Mandatory Parameters
    ----------
    max_height : int
        The maximum height of the tree. The height of a tree is the length of the longest path from the root to a leaf (e.g. height of a leaf is 0).
    pc : float
        The probability of choosing a complex function over a basic function.
    terminal_list : List[str]
        The terminal list to choose from. Example: ['x0', 'x1', 'x2']

    Optional Parameters
    ----------
    constants : list[float]
        A list of constants that can be used in the tree (default is None).
    p_pick_constant : float
        The probability of choosing a constant over a terminal (default is 0.2).
    p_cut_tree : float
        The probability of cutting the tree early (default is 0.2).    
    verbose : bool    
        Whether to print debug information (default is False).
    cur_depth : int
        The exploration depth (e.g. depth of root is 0)

    Returns
    -------
    Node
        A Node object representing the root of the tree.
    """
    indent = ' ' * (cur_depth * 2)

    # Cut the tree early with probability 0.2
    if (random.random() < p_cut_tree) or max_height == 0:  
        # If constants are provided, choose one with probability p_pick_constant
        if constants is not None and random.random() < p_pick_constant: 
            terminal = random.choice(constants) 
        # Otherwise, pick from the terminal set
        else:                                                
            terminal = random.choice(terminal_list)
        
        if verbose: print(f"{indent}Picked terminal: {terminal}")

        # Set the height of the node to 0
        my_node = Node(terminal)
        my_node.set_height(0)
        return my_node
    else:
        # Choose a complex function with probability pc
        if random.random() < pc:                       
            func = random.choice(list(complex_function_set.keys()))
            if verbose: print(f"{indent}Chose complex function {func}")
            num_children = complex_function_set[func].__code__.co_argcount  # Numero di argomenti della funzione
            children = [generate_random_tree(max_height - 1, pc, terminal_list, constants, p_pick_constant, p_cut_tree, verbose, cur_depth + 1)
                        for _ in range(num_children)]
            
            # Set height
            cur_height = max([child.get_height() for child in children]) + 1
            my_node = Node(complex_function_set[func], children, name=func)
            my_node.set_height(cur_height)
            return my_node
        # Otherwise, choose a basic function
        else:                                           
            func = random.choice(list(basic_function_set.keys()))
            if verbose: print(f"{indent}Chose basic function {func}")
            num_children = basic_function_set[func].__code__.co_argcount  # Numero di argomenti della funzione
            children = [generate_random_tree(max_height - 1, pc, terminal_list, constants, p_pick_constant, p_cut_tree, verbose, cur_depth + 1)
                        for _ in range(num_children)]
            # Set height
            cur_height = max([child.get_height() for child in children]) + 1
            my_node = Node(basic_function_set[func], children, name=func)
            my_node.set_height(cur_height)
            return my_node

def generate_random_tree_with_all_terminal(max_height: int, pc: float, terminal_list: List[str],
                         constants: list[float] = None, p_pick_constant: float = 0.2, p_cut_tree: float = 0.2,
                         verbose: bool = False, cur_depth: int = 0, picked_terminal: set[str]=set()) -> Node:
    """
    Generate a random symbolic expression tree.

    Mandatory Parameters
    ----------
    max_height : int
        The maximum height of the tree. The height of a tree is the length of the longest path from the root to a leaf (e.g. height of a leaf is 0).
    pc : float
        The probability of choosing a complex function over a basic function.
    terminal_list : List[str]
        The terminal list to choose from. Example: ['x0', 'x1', 'x2']

    Optional Parameters
    ----------
    constants : list[float]
        A list of constants that can be used in the tree (default is None).
    p_pick_constant : float
        The probability of choosing a constant over a terminal (default is 0.2).
    p_cut_tree : float
        The probability of cutting the tree early (default is 0.2).    
    verbose : bool    
        Whether to print debug information (default is False).
    cur_depth : int
        The exploration depth (e.g. depth of root is 0)

    Returns
    -------
    Node
        A Node object representing the root of the tree.
    """
    indent = ' ' * (cur_depth * 2)

    # Cut the tree early with probability 0.2
    if (random.random() < p_cut_tree) or max_height == 0:  
        # If constants are provided, choose one with probability p_pick_constant
        if constants is not None and random.random() < p_pick_constant and len(picked_terminal) == len(terminal_list): 
            terminal = random.choice(constants) 
        # Otherwise, pick from the terminal set
        else:                                                
            terminal = random.choice(terminal_list)
            picked_terminal.add(terminal)
        
        if verbose: print(f"{indent}Picked terminal: {terminal}")

        # Set the height of the node to 0
        my_node = Node(terminal)
        my_node.set_height(0)
        return my_node
    else:
        # Choose a complex function with probability pc
        if random.random() < pc:                       
            func = random.choice(list(complex_function_set.keys()))
            if verbose: print(f"{indent}Chose complex function {func}")
            num_children = complex_function_set[func].__code__.co_argcount  # Numero di argomenti della funzione
            children = [generate_random_tree_with_all_terminal(max_height - 1, pc, terminal_list, constants, p_pick_constant, p_cut_tree, verbose, cur_depth + 1,picked_terminal)
                        for _ in range(num_children)]
            
            # Set height
            cur_height = max([child.get_height() for child in children]) + 1
            my_node = Node(complex_function_set[func], children, name=func)
            my_node.set_height(cur_height)
            return my_node
        # Otherwise, choose a basic function
        else:                                           
            func = random.choice(list(basic_function_set.keys()))
            if verbose: print(f"{indent}Chose basic function {func}")
            num_children = basic_function_set[func].__code__.co_argcount  # Numero di argomenti della funzione
            children = [generate_random_tree_with_all_terminal(max_height - 1, pc, terminal_list, constants, p_pick_constant, p_cut_tree, verbose, cur_depth + 1,picked_terminal)
                        for _ in range(num_children)]
            # Set height
            cur_height = max([child.get_height() for child in children]) + 1
            my_node = Node(basic_function_set[func], children, name=func)
            my_node.set_height(cur_height)
            return my_node

### Mutations

In [4]:
def point_mutation(Tree: Node, terminal_list: List[str], constants: list[float] = None, p_pick_constant: float = 0.2, pc: float = 0.2) -> Node:
    """
    Mutate a tree by changing a random node to a new random node.

    Parameters
    ----------
    Tree : Node
        The tree to mutate.
    terminal_list : List[str]
        The terminal list to choose from. Example: ['x0', 'x1', 'x2']
    constants : list[float]
        A list of constants that can be used in the tree.
    p_pick_constant : float
        The probability of choosing a constant over a terminal.
    pc : float
        The probability of choosing a complex function over a basic function.

    Returns
    -------
    Node
        The mutated tree.
    """

    # Get the list of nodes in the tree
    node = Tree.get_random_node()

    # If the node is a terminal, change it to a new terminal
    if node.is_leaf:
        if constants is not None and random.random() < p_pick_constant:
            terminal = random.choice(constants)
        else:
            terminal = random.choice(terminal_list)
        node.set_func(terminal)
        return Tree
    # Otherwise, change it to a new function maintaining the arity
    else:
        if random.random() < pc:
            while True:
                func = random.choice(list(complex_function_set.keys()))
                arity = complex_function_set[func].__code__.co_argcount
                if arity == node._arity:
                    break
            node.set_func(complex_function_set[func], name=func)
        else:
            while True:
                func = random.choice(list(basic_function_set.keys()))
                arity = basic_function_set[func].__code__.co_argcount
                if arity == node._arity:
                    break
            node.set_func(basic_function_set[func], name=func)
        return Tree
    
def subtree_mutation(Tree: Node, terminal_list: List[str], constants: list[float] = None, p_pick_constant: float = 0.2, pc: float = 0.2, height: int = 3, verbose: bool = False) -> Node:
    """
    Mutate a tree by changing a random subtree to a new random subtree.

    Parameters
    ----------
    Tree : Node
        The tree to mutate.
    terminal_list : List[str]
        The terminal list to choose from. Example: ['x0', 'x1', 'x2']
    constants : list[float]
        A list of constants that can be used in the tree.
    p_pick_constant : float
        The probability of choosing a constant over a terminal.
    pc : float
        The probability of choosing a complex function over a basic function.
    height : int
        The maximum height of the new subtree.

    Returns
    -------
    Node
        The mutated tree.
    """

    # Get the list of nodes in the tree
    node = Tree.get_random_node()

    if verbose:
        print(f"Node to mutate: {node._str} at height {node._height}")

    new_subtree = generate_random_tree(height, pc, terminal_list, constants, p_pick_constant)
    node = node.replace_tree_shallow(new_subtree)
    return Tree

def expansion_mutation(Tree: Node, terminal_list: List[str], constants: list[float] = None, p_pick_constant: float = 0.2, pc: float = 0.2, height: int = 3, verbose: bool = False) -> Node:
    """
    Mutate a tree by expanding a random node to a new random subtree.

    Parameters
    ----------
    Tree : Node
        The tree to mutate.
    terminal_list : List[str]
        The terminal list to choose from. Example: ['x0', 'x1', 'x2']
    constants : list[float]
        A list of constants that can be used in the tree.
    p_pick_constant : float
        The probability of choosing a constant over a terminal.
    pc : float
        The probability of choosing a complex function over a basic function.
    height : int
        The maximum height of the new subtree.

    Returns
    -------
    Node
        The mutated tree.
    """
    # Get the list of nodes in the tree
    node = random.choice(Tree.get_leafs())

    if verbose:
        print(f"Node to mutate: {node._str} at height {node._height}")  
    
    
    new_subtree = generate_random_tree(height, pc, terminal_list, constants, p_pick_constant)
    node = node.replace_tree_shallow(new_subtree)
    return Tree

def collaps_mutation(Tree: Node, terminal_list: List[str], constants: list[float] = None, p_pick_constant: float = 0.2, pc: float = 0.2, verbose: bool = False) -> Node:
    """
    Mutate a tree by collapsing a random node to a terminal.

    Parameters
    ----------
    Tree : Node
        The tree to mutate.
    terminal_list : List[str]
        The terminal list to choose from. Example: ['x0', 'x1', 'x2']
    constants : list[float]
        A list of constants that can be used in the tree.
    p_pick_constant : float
        The probability of choosing a constant over a terminal.
    pc : float
        The probability of choosing a complex function over a basic function.

    Returns
    -------
    Node
        The mutated tree.
    """

    # Get the list of nodes in the tree
    node = Tree.get_random_node()

    if verbose:
        print(f"Node to mutate: {node._str} at height {node._height}")

   # possible choices
    possible_choices = node.get_leafs()


    node.replace_tree_shallow(random.choice(possible_choices))
    return Tree


def permutation_mutation(Tree: Node, terminal_list: List[str], constants: list[float] = None, p_pick_constant: float = 0.2, pc: float = 0.2,verbose: bool = False) -> Node:
    """
    Mutate a tree by permuting the children of a random node through a rotation.

    Parameters
    ----------
    Tree : Node
        The tree to mutate.

    Returns
    -------
    Node
        The mutated tree.
    """

    # Extract a random node that has at least two children (so no leaves and single input functions)
    found = False
    for i in range(20):
        father = Tree.get_random_node()
        if father._arity > 1:
            found = True
            break
    if not found:
        return Tree
    
    if verbose:
        print(f"Father node: {father._str} at height {father._height}. It has {len(father._successors)} children: [", end="")
        for i, child in enumerate(father._successors):
            print(f"{child._str},", end=" ")
        print("]")

    
    new_successors = ()
    for i, child in enumerate(father._successors):
        new_successors = new_successors + (father._successors[i-1],)

    father._successors = new_successors

    if verbose:
        print(f"New children: [", end="")
        for i, child in enumerate(father._successors):
            print(f"{child._str},", end=" ")
        print("]")

    return Tree

def hoist_mutation(Tree: Node, terminal_list: List[str], constants: list[float] = None, p_pick_constant: float = 0.2, pc: float = 0.2,verbose: bool = False) -> Node:
    """
    Mutate a tree by replacing the root with a random child.

    Parameters
    ----------
    Tree : Node
        The tree to mutate.

    Returns
    -------
    Node
        The mutated tree.
    """

    random_node = Tree.get_random_node()
    return random_node

### crossover

In [5]:
def recombination_crossover(Tree1: Node, Tree2: Node, verbose: bool = False) -> Tuple[Node, Node]:
    """
    Recombine two trees by swapping a random subtree.

    Parameters
    ----------
    Tree1 : Node
        The first tree.
    Tree2 : Node
        The second tree.

    Returns
    -------
    Tuple[Node, Node]
        The recombined trees.
    """

    # Get the list of nodes in the trees
    node1 = Tree1.get_random_node()
    node2 = Tree2.get_random_node()

    if verbose:
        print(f"Node1 to swap: {node1._str} at height {node1._height}")
        print(f"Node2 to swap: {node2._str} at height {node2._height}")

    # Swap the subtrees
    temp1 = node1.clone()
    temp2 = node2.clone()
    node1.replace_tree_shallow(temp2)
    node2.replace_tree_shallow(temp1)

    return Tree1, Tree2



### Load Data

In [6]:
from gxgp import Node
problem_number = 3
problem = np.load(f'./data/problem_{problem_number}.npz')
input = problem['x']
labels = problem['y']

print("Input shape:", input.shape, " Example of sample: ", input[:, 0])
print("Labels shape:", labels.shape, " Example of label: ", labels[0])

# Terminal set
terminal_list = ['x' + str(i) for i in range(input.shape[0])]

print("terminal_list: ", terminal_list)
# Main

Input shape: (3, 5000)  Example of sample:  [ 1.52827812 -2.67876092 -3.73351453]
Labels shape: (5000,)  Example of label:  40.96071445158248
terminal_list:  ['x0', 'x1', 'x2']


### examples for generating trees
You can fine tune the size of the output by modifying draw() from draw.py

In [7]:
from utils.terminal_constants import crammed_constants

# height = 5
# initialized = generate_random_tree(height, 0.2, terminal_list, constants=crammed_constants, p_pick_constant=0.7, p_cut_tree=0.01, verbose=True)
# initialized.draw()

In [8]:
# collapsed = initialized.collapse_constants()
# collapsed.draw()

In [9]:
"""second=generate_random_tree(height, 0.2, terminal_list, constants=crammed_constants, p_pick_constant=0.4, p_cut_tree=0.05, verbose=True)
second.draw()"""

'second=generate_random_tree(height, 0.2, terminal_list, constants=crammed_constants, p_pick_constant=0.4, p_cut_tree=0.05, verbose=True)\nsecond.draw()'

In [10]:
"""for obj in recombination_crossover(initialized, second, verbose=True):
    obj.draw()"""

'for obj in recombination_crossover(initialized, second, verbose=True):\n    obj.draw()'

### Create input formatted

In [11]:
print("input shape is ", input.shape)

vars = []
for j in range(input.shape[1]):
    cur_vars = {'x'+str(i): input[i][j] for i in range(input.shape[0])}
    # print("cur_vars is ", cur_vars)
    vars.append(cur_vars)
vars = np.array(vars)

print("vars shape is ", vars.shape)

input shape is  (3, 5000)
vars shape is  (5000,)


### fitness

In [12]:
import warnings
warnings.simplefilter("error", RuntimeWarning)

In [13]:
# def fitness(mytree: Node, vars, labels, verbose=False, penalized = 'sqrt'):
#     try:
#         output = np.array([mytree(**var) for var in vars])
#         mse = 100 * np.square(labels - output).mean()
#         if penalized == 'percent':
#             return mse +  mse * mytree.get_height() * 0.01 if mytree.get_height() > 0 else mse
#         else:
#             return mse * np.sqrt(mytree.get_height()) if mytree.get_height() > 0 else mse
#     except RuntimeWarning as e:
#         if verbose: print(f"caught runtime warning: {e}, setting fitness to inf")
#         return np.inf

# Fitness reverse
def fitness(mytree, vars, labels, penalized=None):
    try:
        output = np.array([mytree(**var) for var in vars])
        mytree.reeval_heights()
        height = mytree.get_height()
        mse = 100 * np.square(labels - output).mean()
        if height > 25:
            mse *= float(height - 15) / 10
        return mse
    except RuntimeWarning as e:
        # print(f"caught runtime warning: {e}, setting fitness to inf")
        return np.inf

#print(fitness(initialized, vars, labels))

def fitness_unscaled(mytree: Node, vars, labels, verbose=False):
    try:
        output = np.array([mytree(**var) for var in vars])
        mse = 100 * np.square(labels - output).mean()
        return mse
    except RuntimeWarning as e:
        if verbose: print(f"caught runtime warning: {e}, setting fitness to inf")
        return np.inf
#print(fitness(initialized, vars, labels))

In [14]:
from gxgp.gp_common import xover_swap_subtree
"""# Xover
def xover(tree1, tree2):
    return xover_swap_subtree(tree1, tree2)

# initialized.subtree.pop().draw() # this procedure is really similar to get_random_node, except there we use a list and random.choice
hoist_mutation(initialized, verbose=True).draw()"""

'# Xover\ndef xover(tree1, tree2):\n    return xover_swap_subtree(tree1, tree2)\n\n# initialized.subtree.pop().draw() # this procedure is really similar to get_random_node, except there we use a list and random.choice\nhoist_mutation(initialized, verbose=True).draw()'

### parent selection

In [15]:

def parent_selection(population, pre_calculated_fitnesses=None, penalized = 'sqrt'):
    if pre_calculated_fitnesses is None:
        candidates = sorted(np.random.choice(population, 2), key=lambda e: fitness(e,vars,labels, penalized=penalized))
        return candidates[0]
    else:
        #Random index between 0 and population size
        index1 = np.random.randint(0, len(population))
        index2 = np.random.randint(0, len(population))
        candidates = [population[index1], population[index2]]
        if pre_calculated_fitnesses[index1] > pre_calculated_fitnesses[index2]:
            return candidates[1]
        else:
            return candidates[0]

### utils functions

In [16]:
import concurrent
from concurrent.futures import ThreadPoolExecutor
from tqdm import tqdm
import numpy as np

def compute_pair_distance(i, j, population):
    return i, j, population[i].tree_distance(population[j])

def tree_distance(population, verbose="Calculating tree distance matrix"):
    n = len(population)
    matrix = np.zeros((n, n))
    pairs = [(i, j) for i in range(n) for j in range(i+1, n)]
    
    with ThreadPoolExecutor() as executor:
        futures = [executor.submit(compute_pair_distance, i, j, population) for i, j in pairs]
        for future in tqdm(concurrent.futures.as_completed(futures), desc=verbose, total=len(futures)):
            i, j, dist = future.result()
            matrix[i][j] = dist/ population[i].__len__() if population[i].__len__() > 0 else dist
            matrix[j][i] = dist/ population[j].__len__() if population[j].__len__() > 0 else dist

    
    return matrix

def random_mutation(p1=0.16, p2=0.16, p3=0.16, p4=0.16, p5=0.16):
    r = random.random()
    if r < p1:
        return point_mutation
    elif r < p1 + p2:
        return subtree_mutation
    elif r < p1 + p2 + p3:
        return expansion_mutation
    elif r < p1 + p2 + p3 + p4:
        return permutation_mutation
    elif r < p1 + p2 + p3 + p4 + p5:
        return collaps_mutation
    else:
        return hoist_mutation


### Training

In [None]:
from tqdm import tqdm
from concurrent.futures import ThreadPoolExecutor
import math


# Parameters
crossover = recombination_crossover
OFFSPRING_SIZE = 200
POPULATION_SIZE = 100
OUTSIDER_SIZE = math.ceil(OFFSPRING_SIZE*0.1)
pm = 0.15
x_elitism = 0.08
MAX_GENERATIONS = 100
HEIGHT = 5
PC = 0.1
P_PICK_CONSTANT = 0.4
P_CUT_TREE = 0.05


# Initialize the population
def initialize_population(_):
    return generate_random_tree_with_all_terminal(HEIGHT, PC, terminal_list, constants=crammed_constants, p_pick_constant=P_PICK_CONSTANT, p_cut_tree=P_CUT_TREE)

ALREADY_INITIALIZED = False
if not ALREADY_INITIALIZED:
    with ThreadPoolExecutor() as executor:
        population = list(tqdm(executor.map(initialize_population, range(POPULATION_SIZE)), desc="Initializing population", total=POPULATION_SIZE))

population = [tree.collapse_constants() for tree in population if tree is not None]    
# Remove identical trees
distance_matrix = tree_distance(population, verbose='Initial tree distances')
n = len(population)
# I need to keep only the first tree if there are identical trees
for i in range(n):
    for j in range(i + 1, n):
        if distance_matrix[i][j] == 0 and population[j] is not None:
            population[j] = None

population = [tree for tree in population if tree is not None]
for tree in population:
    tree.reeval_heights()

 # Evaluate the population
with ThreadPoolExecutor() as executor:
    fitnesses = np.array(list(tqdm(executor.map(lambda tree: fitness(tree, vars, labels, penalized='sqrt'), population), desc="Evaluating population", total=len(population))))
   
penalized = 'percent'
probabilities2 = [0.10, 0.10, 0.10, 0.10, 0.10]
probabilities1 = [0.16, 0.16, 0.16, 0.16, 0.16]

print(*probabilities1)

probabilities = probabilities1
# Training
for generation in range(MAX_GENERATIONS):
    if (generation >= 15):
        probabilities = probabilities2
        penalized = 'percent'
    if(generation >= 25):
        penalized = 'percent'
        probabilities = probabilities1

    pm = max(0.05, 0.2 - generation / MAX_GENERATIONS * 0.15)# from 0.2 to 0.05
    # Select the best individuals
    best_individuals = np.argsort(fitnesses)[:int(x_elitism * POPULATION_SIZE)]
    # Create the offspring
    offspring = []
    for _ in tqdm(range(OFFSPRING_SIZE), desc=f"Generation {generation}, Creating offsprings"):
        # Mutation
        if random.random() < pm:
            mutation = random_mutation(*probabilities)
            child = mutation(parent_selection(population, fitnesses).clone(), terminal_list, constants=crammed_constants, p_pick_constant=P_PICK_CONSTANT, pc=PC)
            child.reeval_heights()
            offspring.append(child)
        else:
            # Select parents
            parent1 = parent_selection(population, fitnesses, penalized).clone()
            parent2 = parent_selection(population, fitnesses, penalized).clone()
            # Crossover
            child1, child2 = crossover(parent1, parent2)
            child1.reeval_heights()
            child2.reeval_heights()
            offspring.extend([child1, child2])
    # Combine and select the best individuals
    population = [population[i] for i in best_individuals] + offspring

    # Remove identical trees
    population = [tree.collapse_constants() for tree in population if tree is not None]
    distance_matrix = tree_distance(population)
    n = len(population)
    # I need to keep only the first tree if there are identical trees
    for i in range(n):
        for j in range(i + 1, n):
            if distance_matrix[i][j] == 0 and population[j] is not None:
                population[j] = None
    
    # Sort population for summation of distance similarity
    summation = np.zeros(n)
    for i in range(n):
        summation[i] = np.sum(distance_matrix[i,:])
    
    distance_sorted = np.argsort(summation)[::-1]
    outsiders = set(distance_sorted[:OUTSIDER_SIZE])
    # Calculate fitness function
    with ThreadPoolExecutor() as executor:
        fitnesses_offspring = np.array(list(tqdm(executor.map(lambda tree: fitness(tree, vars, labels, penalized=penalized), offspring), desc="Evaluating offsprings", total=len(offspring))))

    # Select the best individuals and outsiders
    all_fitnesses = np.concatenate([fitnesses[best_individuals], fitnesses_offspring])
    best_fitnesses = set(np.argsort(all_fitnesses)[:POPULATION_SIZE])
    # Union between best individuals and outsiders
    union = best_fitnesses.union(outsiders)
    intersection = best_fitnesses.intersection(outsiders)

    union_filtered = [i for i in union if population[i] is not None]

    population = [population[i] for i in union_filtered]
    before = len(union)
    fitnesses = [all_fitnesses[i] for i in union_filtered]
    fitnesses = np.array(fitnesses)
    best_fitness = fitness_unscaled(population[0], vars, labels)
    print(f"Removed {before - len(population)} identical or invalid trees")
    print(f'Kept {len(outsiders) - len(intersection)} outsiders with low fitness')
    if generation > 0:
        print(f"Generation {generation} - Best fitness: {best_fitness} - Difference: {best_fitness - old_best_fitness}")
    else:
        print(f"Generation {generation} - Best fitness: {best_fitness}")
    old_best_fitness = best_fitness
    print(f"Population size: {len(population)}")
    print(f'Best height: {population[0].get_height()}')
    print(f"Mean height of the population: {np.mean([tree.get_height() for tree in population])}")


Initializing population: 100%|██████████| 100/100 [00:00<00:00, 33325.15it/s]


Initial tree distances: 100%|██████████| 4950/4950 [00:01<00:00, 4354.19it/s]
Evaluating population: 100%|██████████| 97/97 [00:38<00:00,  2.53it/s]


0.16 0.16 0.16 0.16 0.16


Generation 0, Creating offsprings: 100%|██████████| 200/200 [00:02<00:00, 88.99it/s] 
Calculating tree distance matrix: 100%|██████████| 67161/67161 [00:16<00:00, 4006.45it/s]
Evaluating offsprings: 100%|██████████| 359/359 [03:02<00:00,  1.97it/s]


Removed 11 identical or invalid trees
Kept 10 outsiders with low fitness
Generation 0 - Best fitness: 92159.46889142648
Population size: 99
Best height: 5
Mean height of the population: 4.03030303030303


Generation 1, Creating offsprings: 100%|██████████| 200/200 [00:01<00:00, 109.11it/s]


Error in node exp: overflow encountered in exp


Calculating tree distance matrix: 100%|██████████| 66795/66795 [00:25<00:00, 2584.69it/s]
Evaluating offsprings: 100%|██████████| 358/358 [02:57<00:00,  2.01it/s] 


Removed 17 identical or invalid trees
Kept 17 outsiders with low fitness
Generation 1 - Best fitness: 86849.13784403335 - Difference: -5310.331047393134
Population size: 100
Best height: 7
Mean height of the population: 4.83


Generation 2, Creating offsprings: 100%|██████████| 200/200 [00:04<00:00, 43.63it/s]
Calculating tree distance matrix: 100%|██████████| 67161/67161 [00:09<00:00, 6893.47it/s]
Evaluating offsprings: 100%|██████████| 359/359 [03:11<00:00,  1.88it/s]


Removed 10 identical or invalid trees
Kept 20 outsiders with low fitness
Generation 2 - Best fitness: 81413.39421125336 - Difference: -5435.743632779995
Population size: 110
Best height: 7
Mean height of the population: 6.136363636363637


Generation 3, Creating offsprings: 100%|██████████| 200/200 [00:01<00:00, 154.01it/s]
Calculating tree distance matrix: 100%|██████████| 66795/66795 [00:13<00:00, 4817.01it/s]
Evaluating offsprings: 100%|██████████| 358/358 [04:52<00:00,  1.23it/s] 


Removed 12 identical or invalid trees
Kept 20 outsiders with low fitness
Generation 3 - Best fitness: 74910.5554848923 - Difference: -6502.838726361049
Population size: 108
Best height: 3
Mean height of the population: 6.657407407407407


Generation 4, Creating offsprings: 100%|██████████| 200/200 [00:01<00:00, 139.03it/s]
Calculating tree distance matrix: 100%|██████████| 67161/67161 [00:13<00:00, 4831.98it/s]
Evaluating offsprings: 100%|██████████| 359/359 [05:00<00:00,  1.20it/s]


Removed 15 identical or invalid trees
Kept 20 outsiders with low fitness
Generation 4 - Best fitness: 73441.32642330142 - Difference: -1469.229061590886
Population size: 105
Best height: 5
Mean height of the population: 6.742857142857143


Generation 5, Creating offsprings: 100%|██████████| 200/200 [00:01<00:00, 159.65it/s]
Calculating tree distance matrix: 100%|██████████| 67161/67161 [00:13<00:00, 5078.11it/s]
Evaluating offsprings: 100%|██████████| 359/359 [04:38<00:00,  1.29it/s]


Removed 11 identical or invalid trees
Kept 20 outsiders with low fitness
Generation 5 - Best fitness: 67709.56827699335 - Difference: -5731.758146308071
Population size: 109
Best height: 5
Mean height of the population: 6.559633027522936


Generation 6, Creating offsprings: 100%|██████████| 200/200 [00:01<00:00, 152.88it/s]
Calculating tree distance matrix: 100%|██████████| 72390/72390 [00:14<00:00, 5040.07it/s]
Evaluating offsprings: 100%|██████████| 373/373 [04:54<00:00,  1.27it/s]


Removed 9 identical or invalid trees
Kept 20 outsiders with low fitness
Generation 6 - Best fitness: 60803.48543900292 - Difference: -6906.082837990427
Population size: 111
Best height: 10
Mean height of the population: 7.63963963963964


Generation 7, Creating offsprings: 100%|██████████| 200/200 [00:01<00:00, 157.24it/s]
Calculating tree distance matrix: 100%|██████████| 69751/69751 [00:14<00:00, 4759.78it/s]
Evaluating offsprings: 100%|██████████| 366/366 [05:01<00:00,  1.21it/s]


Removed 4 identical or invalid trees
Kept 20 outsiders with low fitness
Generation 7 - Best fitness: 57586.907652824775 - Difference: -3216.577786178146
Population size: 116
Best height: 6
Mean height of the population: 7.5


Generation 8, Creating offsprings: 100%|██████████| 200/200 [00:01<00:00, 147.58it/s]
Calculating tree distance matrix: 100%|██████████| 70500/70500 [00:15<00:00, 4634.77it/s]
Evaluating offsprings: 100%|██████████| 368/368 [05:11<00:00,  1.18it/s] 


Removed 6 identical or invalid trees
Kept 20 outsiders with low fitness
Generation 8 - Best fitness: 57416.629921037296 - Difference: -170.27773178747884
Population size: 114
Best height: 8
Mean height of the population: 8.912280701754385


Generation 9, Creating offsprings: 100%|██████████| 200/200 [00:01<00:00, 132.38it/s]
Calculating tree distance matrix: 100%|██████████| 68635/68635 [00:16<00:00, 4280.75it/s]
Evaluating offsprings: 100%|██████████| 363/363 [05:41<00:00,  1.06it/s] 


Removed 11 identical or invalid trees
Kept 20 outsiders with low fitness
Generation 9 - Best fitness: 55582.78619922104 - Difference: -1833.843721816258
Population size: 109
Best height: 12
Mean height of the population: 9.256880733944953


Generation 10, Creating offsprings: 100%|██████████| 200/200 [00:01<00:00, 123.20it/s]
Calculating tree distance matrix: 100%|██████████| 70500/70500 [00:17<00:00, 3919.04it/s]
Evaluating offsprings: 100%|██████████| 368/368 [06:14<00:00,  1.02s/it]


Removed 13 identical or invalid trees
Kept 20 outsiders with low fitness
Generation 10 - Best fitness: 52995.174539080246 - Difference: -2587.611660140792
Population size: 107
Best height: 12
Mean height of the population: 10.30841121495327


Generation 11, Creating offsprings: 100%|██████████| 200/200 [00:01<00:00, 106.33it/s]
Calculating tree distance matrix: 100%|██████████| 69751/69751 [00:21<00:00, 3273.38it/s]
Evaluating offsprings: 100%|██████████| 366/366 [07:48<00:00,  1.28s/it] 


Removed 6 identical or invalid trees
Kept 20 outsiders with low fitness
Generation 11 - Best fitness: 52353.01006661707 - Difference: -642.1644724631769
Population size: 114
Best height: 12
Mean height of the population: 11.473684210526315


Generation 12, Creating offsprings: 100%|██████████| 200/200 [00:02<00:00, 91.17it/s]
Calculating tree distance matrix: 100%|██████████| 67161/67161 [00:23<00:00, 2825.35it/s]
Evaluating offsprings: 100%|██████████| 359/359 [09:11<00:00,  1.54s/it]


Removed 1 identical or invalid trees
Kept 20 outsiders with low fitness
Generation 12 - Best fitness: 45340.06879842716 - Difference: -7012.941268189912
Population size: 119
Best height: 9
Mean height of the population: 12.042016806722689


Generation 13, Creating offsprings: 100%|██████████| 200/200 [00:02<00:00, 78.56it/s]
Calculating tree distance matrix: 100%|██████████| 70500/70500 [00:28<00:00, 2471.20it/s]
Evaluating offsprings: 100%|██████████| 368/368 [10:30<00:00,  1.71s/it]


Removed 10 identical or invalid trees
Kept 20 outsiders with low fitness
Generation 13 - Best fitness: 45340.06879842716 - Difference: 0.0
Population size: 110
Best height: 9
Mean height of the population: 13.927272727272728


Generation 14, Creating offsprings: 100%|██████████| 200/200 [00:02<00:00, 69.67it/s]
Calculating tree distance matrix: 100%|██████████| 69006/69006 [00:30<00:00, 2236.07it/s]
Evaluating offsprings: 100%|██████████| 364/364 [11:19<00:00,  1.87s/it]


Removed 6 identical or invalid trees
Kept 20 outsiders with low fitness
Generation 14 - Best fitness: 45340.06879842716 - Difference: 0.0
Population size: 114
Best height: 9
Mean height of the population: 14.447368421052632


Generation 15, Creating offsprings: 100%|██████████| 200/200 [00:02<00:00, 71.05it/s]
Calculating tree distance matrix: 100%|██████████| 67896/67896 [00:30<00:00, 2198.34it/s]
Evaluating offsprings: 100%|██████████| 361/361 [11:09<00:00,  1.85s/it]


Removed 10 identical or invalid trees
Kept 20 outsiders with low fitness
Generation 15 - Best fitness: 45340.06879842716 - Difference: 0.0
Population size: 110
Best height: 9
Mean height of the population: 14.918181818181818


Generation 16, Creating offsprings: 100%|██████████| 200/200 [00:02<00:00, 77.09it/s]
Calculating tree distance matrix: 100%|██████████| 68635/68635 [00:30<00:00, 2261.74it/s]
Evaluating offsprings: 100%|██████████| 363/363 [11:10<00:00,  1.85s/it]


Removed 8 identical or invalid trees
Kept 20 outsiders with low fitness
Generation 16 - Best fitness: 44172.14525900092 - Difference: -1167.923539426236
Population size: 112
Best height: 14
Mean height of the population: 15.526785714285714


Generation 17, Creating offsprings: 100%|██████████| 200/200 [00:02<00:00, 70.47it/s]
Calculating tree distance matrix: 100%|██████████| 68265/68265 [00:32<00:00, 2078.78it/s]
Evaluating offsprings: 100%|██████████| 362/362 [11:51<00:00,  1.97s/it] 


Removed 10 identical or invalid trees
Kept 20 outsiders with low fitness
Generation 17 - Best fitness: 40726.984870750945 - Difference: -3445.1603882499767
Population size: 110
Best height: 22
Mean height of the population: 16.845454545454544


Generation 18, Creating offsprings: 100%|██████████| 200/200 [00:03<00:00, 66.39it/s]
Calculating tree distance matrix: 100%|██████████| 70125/70125 [00:36<00:00, 1924.63it/s]
Evaluating offsprings: 100%|██████████| 367/367 [13:06<00:00,  2.14s/it] 


Removed 11 identical or invalid trees
Kept 20 outsiders with low fitness
Generation 18 - Best fitness: 39513.74072982238 - Difference: -1213.2441409285675
Population size: 109
Best height: 22
Mean height of the population: 15.944954128440367


Generation 19, Creating offsprings: 100%|██████████| 200/200 [00:03<00:00, 60.28it/s]
Calculating tree distance matrix: 100%|██████████| 68265/68265 [00:40<00:00, 1701.04it/s]
Evaluating offsprings: 100%|██████████| 362/362 [14:27<00:00,  2.40s/it]


Removed 10 identical or invalid trees
Kept 20 outsiders with low fitness
Generation 19 - Best fitness: 35410.686370570904 - Difference: -4103.054359251473
Population size: 110
Best height: 22
Mean height of the population: 17.363636363636363


Generation 20, Creating offsprings: 100%|██████████| 200/200 [00:03<00:00, 60.24it/s]
Calculating tree distance matrix: 100%|██████████| 66430/66430 [00:38<00:00, 1719.03it/s]
Evaluating offsprings: 100%|██████████| 357/357 [14:02<00:00,  2.36s/it]


Removed 13 identical or invalid trees
Kept 20 outsiders with low fitness
Generation 20 - Best fitness: 35402.252559728 - Difference: -8.433810842907405
Population size: 107
Best height: 23
Mean height of the population: 18.009345794392523


Generation 21, Creating offsprings: 100%|██████████| 200/200 [00:04<00:00, 48.27it/s]
Calculating tree distance matrix: 100%|██████████| 70125/70125 [00:48<00:00, 1450.70it/s]
Evaluating offsprings: 100%|██████████| 367/367 [17:42<00:00,  2.89s/it]  


Removed 12 identical or invalid trees
Kept 20 outsiders with low fitness
Generation 21 - Best fitness: 35344.73367244998 - Difference: -57.518887278019974
Population size: 108
Best height: 23
Mean height of the population: 19.203703703703702


Generation 22, Creating offsprings: 100%|██████████| 200/200 [00:04<00:00, 41.94it/s]
Calculating tree distance matrix: 100%|██████████| 73153/73153 [00:54<00:00, 1331.26it/s]
Evaluating offsprings: 100%|██████████| 375/375 [19:54<00:00,  3.19s/it] 


Removed 8 identical or invalid trees
Kept 20 outsiders with low fitness
Generation 22 - Best fitness: 34598.58652352548 - Difference: -746.1471489244941
Population size: 112
Best height: 23
Mean height of the population: 19.160714285714285


Generation 23, Creating offsprings: 100%|██████████| 200/200 [00:05<00:00, 39.78it/s]
Calculating tree distance matrix: 100%|██████████| 72390/72390 [00:53<00:00, 1352.36it/s]
Evaluating offsprings: 100%|██████████| 373/373 [19:14<00:00,  3.09s/it] 


Removed 9 identical or invalid trees
Kept 20 outsiders with low fitness
Generation 23 - Best fitness: 34396.47401405513 - Difference: -202.11250947035296
Population size: 111
Best height: 25
Mean height of the population: 19.72972972972973


Generation 24, Creating offsprings: 100%|██████████| 200/200 [00:04<00:00, 47.65it/s]
Calculating tree distance matrix: 100%|██████████| 69751/69751 [00:51<00:00, 1365.05it/s]
Evaluating offsprings: 100%|██████████| 366/366 [19:00<00:00,  3.12s/it]


Removed 10 identical or invalid trees
Kept 20 outsiders with low fitness
Generation 24 - Best fitness: 33948.65191750337 - Difference: -447.8220965517612
Population size: 110
Best height: 23
Mean height of the population: 19.681818181818183


Generation 25, Creating offsprings: 100%|██████████| 200/200 [00:04<00:00, 41.41it/s]
Calculating tree distance matrix: 100%|██████████| 72010/72010 [00:57<00:00, 1257.92it/s]
Evaluating offsprings: 100%|██████████| 372/372 [20:38<00:00,  3.33s/it] 


Removed 8 identical or invalid trees
Kept 20 outsiders with low fitness
Generation 25 - Best fitness: 6812.598943948828 - Difference: -27136.052973554542
Population size: 112
Best height: 23
Mean height of the population: 20.508928571428573


Generation 26, Creating offsprings: 100%|██████████| 200/200 [00:04<00:00, 44.57it/s]
Calculating tree distance matrix: 100%|██████████| 66795/66795 [00:53<00:00, 1244.68it/s]
Evaluating offsprings: 100%|██████████| 358/358 [20:22<00:00,  3.41s/it] 


Removed 7 identical or invalid trees
Kept 19 outsiders with low fitness
Generation 26 - Best fitness: 6558.424005964072 - Difference: -254.17493798475516
Population size: 112
Best height: 23
Mean height of the population: 20.785714285714285


Generation 27, Creating offsprings: 100%|██████████| 200/200 [00:05<00:00, 38.14it/s]
Calculating tree distance matrix: 100%|██████████| 72771/72771 [01:01<00:00, 1175.84it/s]
Evaluating offsprings: 100%|██████████| 374/374 [21:37<00:00,  3.47s/it]  


Removed 5 identical or invalid trees
Kept 20 outsiders with low fitness
Generation 27 - Best fitness: 6198.187896610603 - Difference: -360.23610935346915
Population size: 115
Best height: 23
Mean height of the population: 20.582608695652173


Generation 28, Creating offsprings: 100%|██████████| 200/200 [00:04<00:00, 42.06it/s]
Calculating tree distance matrix: 100%|██████████| 74305/74305 [01:01<00:00, 1217.16it/s]
Evaluating offsprings: 100%|██████████| 378/378 [22:05<00:00,  3.51s/it]  


Removed 3 identical or invalid trees
Kept 20 outsiders with low fitness
Generation 28 - Best fitness: 5558.901039400233 - Difference: -639.2868572103707
Population size: 117
Best height: 23
Mean height of the population: 19.846153846153847


Generation 29, Creating offsprings: 100%|██████████| 200/200 [00:04<00:00, 43.08it/s]
Calculating tree distance matrix: 100%|██████████| 71253/71253 [00:56<00:00, 1260.86it/s]
Evaluating offsprings: 100%|██████████| 370/370 [20:55<00:00,  3.39s/it] 


Removed 4 identical or invalid trees
Kept 20 outsiders with low fitness
Generation 29 - Best fitness: 5558.901039400233 - Difference: 0.0
Population size: 116
Best height: 23
Mean height of the population: 19.629310344827587


Generation 30, Creating offsprings: 100%|██████████| 200/200 [00:04<00:00, 46.77it/s]
Calculating tree distance matrix: 100%|██████████| 72010/72010 [00:56<00:00, 1274.57it/s]
Evaluating offsprings: 100%|██████████| 372/372 [20:43<00:00,  3.34s/it] 


Removed 4 identical or invalid trees
Kept 20 outsiders with low fitness
Generation 30 - Best fitness: 5558.901039400233 - Difference: 0.0
Population size: 116
Best height: 23
Mean height of the population: 19.370689655172413


Generation 31, Creating offsprings: 100%|██████████| 200/200 [00:04<00:00, 48.05it/s]
Calculating tree distance matrix: 100%|██████████| 72010/72010 [00:52<00:00, 1359.60it/s]
Evaluating offsprings: 100%|██████████| 372/372 [19:41<00:00,  3.18s/it] 


Removed 2 identical or invalid trees
Kept 20 outsiders with low fitness
Generation 31 - Best fitness: 3375.236769757327 - Difference: -2183.6642696429058
Population size: 118
Best height: 23
Mean height of the population: 19.347457627118644


Generation 32, Creating offsprings: 100%|██████████| 200/200 [00:04<00:00, 42.39it/s]
Calculating tree distance matrix: 100%|██████████| 69751/69751 [00:53<00:00, 1316.04it/s]
Evaluating offsprings: 100%|██████████| 366/366 [19:57<00:00,  3.27s/it]


Removed 4 identical or invalid trees
Kept 20 outsiders with low fitness
Generation 32 - Best fitness: 2729.0279308255217 - Difference: -646.2088389318051
Population size: 116
Best height: 23
Mean height of the population: 19.336206896551722


Generation 33, Creating offsprings: 100%|██████████| 200/200 [00:04<00:00, 41.09it/s]
Calculating tree distance matrix:   7%|▋         | 5069/73153 [00:04<00:58, 1173.72it/s]

In [None]:
from datetime import datetime
conf = {
    "problem": problem_number,
    "crossover": crossover,
    "OFFSPRING_SIZE": OFFSPRING_SIZE,
    "POPULATION_SIZE": POPULATION_SIZE,
    "OUTSIDER_SIZE": OUTSIDER_SIZE,
    "pm": pm,
    "x_elitism": x_elitism,
    "MAX_GENERATIONS": MAX_GENERATIONS,
    "HEIGHT": HEIGHT,
    "PC": PC,
    "P_PICK_CONSTANT": P_PICK_CONSTANT,
    "P_CUT_TREE": P_CUT_TREE
}
def save_results(conf, res_function, res_fitness):
    cur_time = datetime.now().strftime("%Y-%m-%d_%H-%M-%S")
    with open(f"./results/{cur_time}.txt", "w") as file:
        # Write the contents of conf
        file.write("# Configuration\n")
        file.write("conf = {\n")
        for key, value in conf.items():
            file.write(f"    '{key}': {value},\n")
        file.write("}\n\n")
        
        # Write the contents of res_function
        file.write("# Resulting function\n")
        file.write(f"{res_function}")
        
        # Write the contents of res_fitness
        file.write("# Resulting fitness\n")
        file.write(f"{res_fitness}")
save_results(conf, str(population[0]), best_fitness)

In [None]:
population[0].draw()
print(fitness(population[0], vars, labels))