In [1]:
import logging
import os
import random
import sqlite3

import numpy as np
import pandas as pd

from src.configuration_space.LKH import CONFIGURATION_SPACE
from src.constant import DATA_DIR, MAX_WORKERS, TEMP_DIR
from src.database import db_connect
from src.experiment.CepsExperiment import CepsExperiment
from src.experiment.CepsMy1Experiment import CepsMy1Experiment
from src.experiment.GlobalExperiment import GlobalExperiment
from src.experiment.ParhydraExperiment import ParhydraExperiment
from src.experiment.PcitExperiment import PcitExperiment, _Clustering
from src.instance.TSP_Instance import TSP_Instance, TSP_InstanceSet
from src.portfolio import Portfolio
from src.solver.TSP_LKH_Solver import TSP_LKH_Solver
# Show (up to) 999 columns when a DataFrame is displayed, so the wide solver
# configuration tables are not elided.
pd.set_option("display.max_columns", 999)

In [2]:
# Split the CEPS TSP benchmark (described by its index.json) into a training
# set and a test set. train_size and seed are passed through unchanged;
# presumably the seed makes the split reproducible — confirm in TSP_InstanceSet.
index_path = DATA_DIR / "TSP" / "CEPS_benchmark" / "index.json"
train_instances, test_instances = TSP_InstanceSet.train_test_from_index_file(
    filepath=index_path, train_size=5, seed=0
)

In [3]:
# Construct a portfolio with GlobalExperiment on the training instances.
# Judging by the captured log (time: [60. 60.], "Attempt 1/2"), t_c looks like
# the configuration time budget per solver, K the portfolio size and n the
# number of attempts — TODO confirm against GlobalExperiment.
t_c, K, n = 60, 2, 2
solver_class, instance_class = TSP_LKH_Solver, TSP_Instance

experiment = GlobalExperiment(
    t_c=t_c, K=K, n=n, solver_class=solver_class, instance_class=instance_class
)
best_portfolio = experiment.construct_portfolio(train_instances)

[2024-12-09 23:17:26] INFO      [GLOBAL] Start!
[2024-12-09 23:17:26] INFO      Attempt 1/2
[2024-12-09 23:17:26] DEBUG     SMAC configuration, time: [60. 60.]
[2024-12-09 23:17:26] DEBUG     SMAC iteration 1, configuration: {'0__ASCENT_CANDIDATES': 45, '0__BACKBONE_TRIALS': 0, '0__BACKTRACKING': 'YES', '0__CANDIDATE_SET_TYPE': 'QUADRANT', '0__EXTRA_CANDIDATES': 0, '0__EXTRA_CANDIDATE_SET_TYPE': 'QUADRANT', '0__GAIN23': 'NO', '0__GAIN_CRITERION': 'NO', '0__INITIAL_STEP_SIZE': 1, '0__INITIAL_TOUR_ALGORITHM': 'NEAREST-NEIGHBOR', '0__INITIAL_TOUR_FRACTION': 0.1410864457464, '0__KICKS': 3, '0__KICK_TYPE': 5, '0__MAX_BREADTH': 1850229859, '0__MAX_CANDIDATES': 4, '0__MOVE_TYPE': 3, '0__PATCHING_A': 4, '0__PATCHING_C': 2, '0__POPULATION_SIZE': 8, '0__RESTRICTED_SEARCH': 'YES', '0__SUBGRADIENT': 'YES', '0__SUBSEQUENT_MOVE_TYPE': 5, '0__SUBSEQUENT_PATCHING': 'NO', '1__ASCENT_CANDIDATES': 51, '1__BACKBONE_TRIALS': 0, '1__BACKTRACKING': 'YES', '1__CANDIDATE_SET_TYPE': 'DELAUNAY', '1__EXTRA_CANDID

In [3]:
# Construct a portfolio with ParhydraExperiment on the training instances,
# using the same settings as the GlobalExperiment cell.
# NOTE: this rebinds `experiment` and `best_portfolio`; after a top-to-bottom
# run only the PARHYDRA result is left in those names.
t_c, K, n = 60, 2, 2
solver_class, instance_class = TSP_LKH_Solver, TSP_Instance

experiment = ParhydraExperiment(
    t_c=t_c, K=K, n=n, solver_class=solver_class, instance_class=instance_class
)
best_portfolio = experiment.construct_portfolio(train_instances)

[2024-12-09 23:20:45] INFO      [PARHYDRA] Start!
[2024-12-09 23:20:45] INFO      Solver 1/2
[2024-12-09 23:20:45] INFO      Attempt 1/2
[2024-12-09 23:20:45] DEBUG     SMAC configuration, time: [60.]
[2024-12-09 23:20:45] DEBUG     SMAC iteration 1, configuration: {'0__ASCENT_CANDIDATES': 52, '0__BACKBONE_TRIALS': 1, '0__BACKTRACKING': 'YES', '0__CANDIDATE_SET_TYPE': 'ALPHA', '0__EXTRA_CANDIDATES': 7, '0__EXTRA_CANDIDATE_SET_TYPE': 'QUADRANT', '0__GAIN23': 'NO', '0__GAIN_CRITERION': 'YES', '0__INITIAL_STEP_SIZE': 1, '0__INITIAL_TOUR_ALGORITHM': 'QUICK-BORUVKA', '0__INITIAL_TOUR_FRACTION': 0.5820197920751, '0__KICKS': 3, '0__KICK_TYPE': 0, '0__MAX_BREADTH': 954863081, '0__MAX_CANDIDATES': 10, '0__MOVE_TYPE': 3, '0__PATCHING_A': 3, '0__PATCHING_C': 1, '0__POPULATION_SIZE': 8, '0__RESTRICTED_SEARCH': 'YES', '0__SUBGRADIENT': 'YES', '0__SUBSEQUENT_MOVE_TYPE': 6, '0__SUBSEQUENT_PATCHING': 'NO'}
[2024-12-09 23:20:45] DEBUG     executor start
[2024-12-09 23:20:45] DEBUG     (0, 0) fn submitt

In [None]:
# DISABLED CELL (everything below is commented out): portfolio construction
# with CepsMy1Experiment. It re-creates the train/test split with the same
# arguments as the split cell near the top, then runs the experiment with
# t_c=200 and extra t_ini / t_i / max_iter settings.
# t_ini is derived from the training-set size: sum over i = 1..K of
# (i * train_instances.size * 10), doubled.
# Uncomment the whole cell to run it; it rebinds `experiment` and `best_portfolio`.
# train_instances, test_instances = TSP_InstanceSet.train_test_from_index_file(
#     filepath=DATA_DIR / "TSP" / "CEPS_benchmark" / "index.json",
#     train_size=5,
#     seed=0,
# )

# solver_class = TSP_LKH_Solver
# instance_class= TSP_Instance
# t_c = 200
# K = 2
# n = 2
# t_ini = sum([i * train_instances.size * 10 for i in range(1, K + 1)]) * 2
# t_i = 10
# max_iter = 1

# experiment = CepsMy1Experiment(
#     t_c=t_c,
#     t_ini=t_ini,
#     t_i=t_i,
#     K=K,
#     n=n,
#     max_iter=max_iter,
#     solver_class=solver_class,
#     instance_class=instance_class,
# )

# best_portfolio = experiment.construct_portfolio(train_instances)

In [None]:
# DISABLED CELL (everything below is commented out): portfolio construction
# with PcitExperiment (t_c=50, K=2, n=2, max_iter=2) on `train_instances`.
# Uncomment the whole cell to run it; it rebinds `experiment` and `best_portfolio`.
# t_c = 50
# K = 2
# n = 2
# max_iter = 2
# solver_class = TSP_LKH_Solver
# instance_class = TSP_Instance

# experiment = PcitExperiment(
#     t_c=t_c,
#     K=K,
#     n=n,
#     max_iter=max_iter,
#     solver_class=solver_class,
#     instance_class=instance_class,
# )

# best_portfolio = experiment.construct_portfolio(train_instances)

In [22]:
# DISABLED CELL: evaluate `best_portfolio` on the test instances, passing a
# length-K array of +inf as `remaining_time` and the tag "test".
# NOTE(review): presumably the +inf entries mean "no time limit" and the tag
# ends up in the `comment` column of the results table — confirm in Portfolio.evaluate.
# remaining_time = np.ones(shape=(K, )) * np.inf
# best_portfolio.evaluate(test_instances, remaining_time, "test")

In [4]:
# Open the project's default results database. The query cells below pass
# `conn` to pd.read_sql_query, so db_connect() presumably returns a DB-API
# connection — confirm in src.database.
# (db_connect is imported in the notebook's import cell rather than here, so
# all dependencies are visible in one place.)
conn = db_connect()

In [63]:
# Point the analysis at an archived run instead of the default database.
# NOTE: this rebinds `conn`; on a top-to-bottom run every query cell below
# reads this archive rather than the connection returned by db_connect().
#
# The file is opened through a read-only SQLite URI for two reasons:
#   * a wrong or missing path raises sqlite3.OperationalError right here,
#     instead of sqlite3 silently creating a new, empty database and the
#     failure surfacing later as "no such table";
#   * the archived results cannot be modified by accident.
ARCHIVE_DB = "_archive/2/GLOBAL.db"
# ARCHIVE_DB = "database/2024_11_18_22_52_24.db"
conn = sqlite3.connect(f"file:{ARCHIVE_DB}?mode=ro", uri=True)

In [5]:
# Load every row of the `solvers` table through the current `conn`; in the
# captured output each row is one solver id with its LKH parameter values.
df_solvers = pd.read_sql_query(sql="SELECT * FROM solvers", con=conn)
df_solvers

Unnamed: 0,id,ASCENT_CANDIDATES,BACKBONE_TRIALS,BACKTRACKING,CANDIDATE_SET_TYPE,EXTRA_CANDIDATES,EXTRA_CANDIDATE_SET_TYPE,GAIN23,GAIN_CRITERION,INITIAL_STEP_SIZE,INITIAL_TOUR_ALGORITHM,INITIAL_TOUR_FRACTION,KICKS,KICK_TYPE,MAX_BREADTH,MAX_CANDIDATES,MOVE_TYPE,PATCHING_A,PATCHING_C,POPULATION_SIZE,RESTRICTED_SEARCH,SUBGRADIENT,SUBSEQUENT_MOVE_TYPE,SUBSEQUENT_PATCHING
0,144362650971809487,52,0,NO,ALPHA,6,QUADRANT,YES,NO,3,BORUVKA,0.544441,1,4,1317085677,8,6,5,5,23,YES,YES,0,YES
1,615709552088896777,59,0,NO,NEAREST-NEIGHBOR,7,QUADRANT,YES,YES,1,QUICK-BORUVKA,0.372006,2,0,954473433,2,2,1,5,27,NO,NO,3,YES
2,1864895902672780320,55,0,YES,QUADRANT,0,QUADRANT,NO,NO,1,QUICK-BORUVKA,0.967205,5,0,958079260,2,6,4,3,48,YES,NO,6,NO
3,1729021862493197193,50,0,YES,NEAREST-NEIGHBOR,7,QUADRANT,YES,NO,2,BORUVKA,0.536592,3,5,1456287484,5,6,1,0,9,NO,NO,0,NO


In [6]:
# Load every row of the `instances` table through the current `conn`; in the
# captured output the ids are instance file paths.
df_instances = pd.read_sql_query(sql="SELECT * FROM instances", con=conn)
df_instances

Unnamed: 0,id
0,data/TSP/CEPS_benchmark/cluster_netgen/40.tsp
1,data/TSP/CEPS_benchmark/grid/04.tsp
2,data/TSP/CEPS_benchmark/grid/33.tsp
3,data/TSP/CEPS_benchmark/rotation/45.tsp
4,data/TSP/CEPS_benchmark/uniform_portgen/11.tsp


In [7]:
# Load every row of the `results` table: one row per (instance, solver) run
# with its cost, time, a `comment` tag and a timestamp (see the output below).
# All later analysis cells work on this `df`.
df = pd.read_sql_query(sql="SELECT * FROM results", con=conn)
# Optional spreadsheet export for manual inspection:
# df.to_excel("tmp.xlsx")
df

Unnamed: 0,instance_id,solver_id,cost,time,comment,created_at
0,data/TSP/CEPS_benchmark/cluster_netgen/40.tsp,144362650971809487,100.0,10.0,configuration,2024-12-09 22:04:23
1,data/TSP/CEPS_benchmark/cluster_netgen/40.tsp,615709552088896777,100.0,10.0,configuration,2024-12-09 22:04:23
2,data/TSP/CEPS_benchmark/grid/04.tsp,144362650971809487,100.0,10.0,configuration,2024-12-09 22:04:24
3,data/TSP/CEPS_benchmark/grid/04.tsp,615709552088896777,100.0,10.0,configuration,2024-12-09 22:04:24
4,data/TSP/CEPS_benchmark/grid/33.tsp,144362650971809487,100.0,10.0,configuration,2024-12-09 22:04:24
5,data/TSP/CEPS_benchmark/grid/33.tsp,615709552088896777,2.92,2.92,configuration,2024-12-09 22:04:25
6,data/TSP/CEPS_benchmark/rotation/45.tsp,615709552088896777,2.23,2.23,configuration,2024-12-09 22:04:27
7,data/TSP/CEPS_benchmark/uniform_portgen/11.tsp,615709552088896777,100.0,10.0,configuration,2024-12-09 22:04:35
8,data/TSP/CEPS_benchmark/rotation/45.tsp,144362650971809487,100.0,10.0,validation,2024-12-09 22:04:47
9,data/TSP/CEPS_benchmark/uniform_portgen/11.tsp,144362650971809487,100.0,10.0,validation,2024-12-09 22:04:48


In [67]:
# Number of result rows per `comment` tag (e.g. configuration / test).
df.loc[:, "comment"].value_counts()

configuration    48051
test              1880
Name: comment, dtype: int64

In [68]:
# Keep only the rows tagged "configuration".
df[df["comment"].eq("configuration")]

Unnamed: 0,instance_id,solver_id,cost,time,comment,created_at
0,data/TSP/CEPS_benchmark/cluster_netgen/40.tsp,6xJZWF2RoHDF8qv96yvmmtIvc2yNAsBPXrATK8KbGv4=,2.48,2.48,configuration,2024-11-14 18:02:55
1,data/TSP/CEPS_benchmark/cluster_netgen/40.tsp,6xJZWF2RoHDF8qv96yvmmtIvc2yNAsBPXrATK8KbGv4=,2.71,2.71,configuration,2024-11-14 18:02:56
2,data/TSP/CEPS_benchmark/cluster_netgen/40.tsp,6xJZWF2RoHDF8qv96yvmmtIvc2yNAsBPXrATK8KbGv4=,2.51,2.51,configuration,2024-11-14 18:02:56
3,data/TSP/CEPS_benchmark/cluster_netgen/40.tsp,6xJZWF2RoHDF8qv96yvmmtIvc2yNAsBPXrATK8KbGv4=,2.70,2.70,configuration,2024-11-14 18:02:56
4,data/TSP/CEPS_benchmark/grid/04.tsp,6xJZWF2RoHDF8qv96yvmmtIvc2yNAsBPXrATK8KbGv4=,1.25,1.25,configuration,2024-11-14 18:02:56
...,...,...,...,...,...,...
48046,data/TSP/CEPS_benchmark/expansion/03.tsp,-h2B28ccRe-yzTl2a3lwwxylCmrRHS-vxS79397kvK8=,100.00,10.00,configuration,2024-11-15 17:13:42
48047,data/TSP/CEPS_benchmark/explosion/41.tsp,-h2B28ccRe-yzTl2a3lwwxylCmrRHS-vxS79397kvK8=,100.00,10.00,configuration,2024-11-15 17:13:42
48048,data/TSP/CEPS_benchmark/grid/00.tsp,-h2B28ccRe-yzTl2a3lwwxylCmrRHS-vxS79397kvK8=,100.00,10.00,configuration,2024-11-15 17:13:42
48049,data/TSP/CEPS_benchmark/linearprojection/40.tsp,-h2B28ccRe-yzTl2a3lwwxylCmrRHS-vxS79397kvK8=,100.00,10.00,configuration,2024-11-15 17:13:47


In [69]:
# Per-instance comparison of the solvers on the rows tagged "test":
# rows = instance ids, columns = solver ids, values = cost (pivot_table's
# default aggregation averages repeated runs of the same instance/solver pair).
test_costs = df.loc[df["comment"].eq("test")].pivot_table(
    index="instance_id", columns="solver_id", values="cost"
)

# `_` is kept as the result name because the cells below read it. Be aware that
# assigning to `_` shadows IPython's automatic "last output" variable.
_ = test_costs.copy()

# "best" = positional index (0-based column number) of the cheapest solver.
# A missing cost (NaN, i.e. a solver with no test row for that instance) is
# treated as +inf: plain np.argmin would otherwise select the NaN cell, while
# .min(axis=1) skips NaN, and the two columns would disagree.
_["best"] = np.argmin(test_costs.fillna(np.inf).to_numpy(), axis=1)

# "min" = lowest cost over the solver columns only. It is computed from
# `test_costs`, so it does not depend on "best" being the last column.
_["min"] = test_costs.min(axis=1)
_

solver_id,Cu1fs0kAKTm6MvSmj1HE7v652JohHK4_FBLT892SLfw=,dy-AxBvs-EUcd2LSsJqSrEuubDx5B_Q-DpE3kA2r4qA=,lhdh2qy2Ma9s1ijBiY9HyqWX9MHEmcDlPKhAxfFPQrI=,rcr1q6ddFDv9xNL9YmvTWpRb6vcZic1ybu6XuF9RlfE=,best,min
instance_id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1
data/TSP/CEPS_benchmark/cluster/00.tsp,4.95,2.50,100.0,7.61,1,2.50
data/TSP/CEPS_benchmark/cluster/01.tsp,1.35,4.40,100.0,100.00,0,1.35
data/TSP/CEPS_benchmark/cluster/02.tsp,0.60,100.00,100.0,100.00,0,0.60
data/TSP/CEPS_benchmark/cluster/03.tsp,1.44,1.07,100.0,2.53,1,1.07
data/TSP/CEPS_benchmark/cluster/04.tsp,100.00,100.00,100.0,6.35,3,6.35
...,...,...,...,...,...,...
data/TSP/CEPS_benchmark/uniform_portgen/45.tsp,1.51,2.18,100.0,1.51,0,1.51
data/TSP/CEPS_benchmark/uniform_portgen/46.tsp,0.89,2.07,100.0,1.38,0,0.89
data/TSP/CEPS_benchmark/uniform_portgen/47.tsp,0.89,1.11,100.0,1.14,0,0.89
data/TSP/CEPS_benchmark/uniform_portgen/48.tsp,0.52,0.56,100.0,4.02,0,0.52


In [70]:
# Summary statistics of the best (lowest) cost reached per test instance.
_.loc[:, "min"].describe()

count    470.000000
mean       2.021872
std        7.958167
min        0.450000
25%        0.670000
50%        0.945000
75%        1.600000
max      100.000000
Name: min, dtype: float64

In [71]:
# How many instances have a best cost above 90 (True) versus not (False).
# NOTE(review): in the tables above the worst cost is exactly 100.0, so this
# presumably counts instances that no solver handled — confirm the penalty value.
_["min"].gt(90).value_counts()

False    467
True       3
Name: min, dtype: int64

In [62]:
# For instances whose best cost is below 90, count how often each solver
# (identified by its column position in "best") was the cheapest one.
_.loc[_["min"].lt(90), "best"].value_counts()

0    142
3    119
2    100
1     98
Name: best, dtype: int64

In [None]:
# Instances ordered from lowest to highest best cost.
_.sort_values("min")

In [None]:
# DISABLED CELL: rebuild one stored solver configuration from `df_solvers`
# (looked up by id, with the `id` column dropped) and run it on a single TSP
# instance with a known optimum.
# NOTE(review): `Configuration` is not imported in this notebook's import cell;
# it presumably comes from the ConfigSpace package — add the import before
# re-enabling this cell.
# config = df_solvers.loc[df_solvers["id"] == "OJQGNYe__-omEPLuUJkSzOuFdCnYPLzZd99VQqxW2gM="].drop(columns=["id"]).iloc[0].to_dict()
# config = Configuration(configuration_space=CONFIGURATION_SPACE, values=config)
# solver = TSP_LKH_Solver(config=config)

# instance = TSP_Instance(filepath="data/TSP/CEPS_benchmark/cluster_netgen/18.tsp", optimum=10555222.0)

# solver.solve(instance)

In [None]:
# DISABLED CELL: one-off migration of the TSP index and instance files.
# For every key in DATA_DIR/TSP/index.json it derives a new file name:
#   * "<a>_<b>.tsp" becomes (a - 4) * 10 + b, zero-padded to two digits;
#   * any other name becomes its integer value, zero-padded to two digits.
# It then renames the file on disk (DATA_DIR / old key -> DATA_DIR / new key)
# and finally rewrites index.json with the new keys, sorted, values as floats.
# WARNING: this renames files and overwrites index.json in place; take a
# backup of the data directory before re-enabling it.
# import json
# with open(DATA_DIR / "TSP" / "index.json") as f:
#     index = json.load(f)

# new_index = {}

# for k, v in index.items():
#     path = k.split("/")
#     file = path[-1]
#     file_no_ext = file.split(".")[0]
#     if "_" in file_no_ext:
#         a, b = file_no_ext.split("_")
#         n = str((int(a) - 4) * 10 + int(b)).zfill(2)
#         new_file = f"{n}.tsp"
#     else:
#         file_no_ext = str(int(file_no_ext)).zfill(2)
#         new_file = f"{file_no_ext}.tsp"
#     new_path = path[:-1] + [new_file]
#     new_k = "/".join(new_path)
#     new_index[new_k] = float(v)

#     path1 = DATA_DIR / k;
#     path2 = DATA_DIR / new_k;
#     path1.rename(path2)

# new_index = {k: new_index[k] for k in sorted(new_index.keys())}

# with open(DATA_DIR / "TSP" / "index.json", "w") as f:
#     json.dump(new_index, f, indent=4)

# new_index