In [24]:
import copy

import yaml

def generate_model_template(dataset_name, model_name, best_params = None, param_grid = None):
    """Build the configuration entry for one (dataset, model) run.

    Parameters
    ----------
    dataset_name : str
        Value stored under the ``"dataset"`` key.
    model_name : str
        Value stored under the ``"model"`` key.
    best_params : dict, optional
        Stored under ``"best_params"``. ``None`` or any other falsy value
        results in an empty dict.
    param_grid : dict, optional
        Stored under ``"param_grid"``. ``None`` or any other falsy value
        results in an empty dict.

    Returns
    -------
    dict
        A new dict with the keys ``"dataset"``, ``"model"``, ``"best_params"``
        and ``"param_grid"``, in that order.

    Notes
    -----
    ``best_params`` and ``param_grid`` are deep-copied. Callers in this
    notebook pass ``grid.copy()``, which is only a shallow copy, so without the
    deep copy every template built from the same grid would share its nested
    dicts and lists: editing one template would silently edit the others, and
    PyYAML would serialize the repeated objects as anchors/aliases.
    """
    return {
        "dataset": dataset_name,
        "model": model_name,
        "best_params": copy.deepcopy(best_params) if best_params else {},
        "param_grid": copy.deepcopy(param_grid) if param_grid else {},
    }


# S1DCNN

In [25]:
def _s1dcnn_default_grid(batch_size):
    """Return a freshly built default S1DCNN grid for the given batch size.

    Every tunable entry lists exactly one candidate value. Each call creates
    new nested containers, so the small and large grids share no mutable state.
    """
    return {
        # Run-level settings (plain values, not candidate lists).
        "outer_params": {
            "hyperopt_evals": 1,
            # NOTE(review): max_epochs is 1 here, while the other grids in this
            # notebook that set max_epochs use 1000 -- confirm this is intended.
            "max_epochs": 1,
            "early_stopping": True,
            "shuffle": True,
            "validation_fraction": 0.15,
            "early_stopping_patience": 5,
        },
        # Top-level entries; these are siblings of "outer_params", not members of it.
        "batch_size": [batch_size],
        "hidden_size": [4096],
        "optimizer_fn": {
            "Adam": {"weight_decay": [0.0], "learning_rate": [0.001]},
        },
        "scheduler_fn": {
            "ReduceLROnPlateau": {"factor": [0.1], "patience": [5]},
        },
    }


# The two variants differ only in batch size.
s1dcnn_small_default_grid = _s1dcnn_default_grid(128)
s1dcnn_large_default_grid = _s1dcnn_default_grid(1024)
    

# MLP

In [26]:
def _mlp_default_grid(batch_size):
    """Return a freshly built default MLP grid for the given batch size.

    Every tunable entry lists exactly one candidate value. Each call creates
    new nested containers, so the small and large grids share no mutable state.
    """
    return {
        # Run-level settings (plain values, not candidate lists).
        "outer_params": {
            "hyperopt_evals": 1,
            "early_stopping": True,
            "cv_size": 4,
            "validation_fraction": 0.15,
            "n_iter_no_change": 10,
            "max_iter": 1000,
        },
        # A single candidate architecture: one hidden layer of 100 units.
        "hidden_layer_sizes": [[100]],
        "activation": ["relu"],
        "solver": ["adam"],
        "batch_size": [batch_size],
    }


# The two variants differ only in batch size.
mlp_small_default_grid = _mlp_default_grid(128)
mlp_large_default_grid = _mlp_default_grid(1024)

# XGB

In [27]:
def _xgb_default_grid():
    """Return a freshly built default XGBoost grid.

    The only tunable entry, ``learning_rate``, lists a single candidate value.
    """
    return {
        # Run-level settings (plain values, not candidate lists).
        "outer_params": {
            "hyperopt_evals": 1,
            "validation_fraction": 0.15,
            "early_stopping_rounds": 30,
            "verbose": False,
        },
        "learning_rate": [0.3],
    }


# The small and large defaults currently hold the same values; they are built
# separately so that they remain independent objects.
xgb_small_default_grid = _xgb_default_grid()
xgb_large_default_grid = _xgb_default_grid()


# CatBoost

In [28]:
def _catboost_default_grid():
    """Return a freshly built default CatBoost grid.

    The only tunable entry, ``iterations``, lists a single candidate value.
    """
    return {
        # Run-level settings (plain values, not candidate lists).
        "outer_params": {
            "hyperopt_evals": 1,
            "validation_fraction": 0.15,
            "early_stopping_rounds": 100,
            "verbose": False,
        },
        "iterations": [500],
    }


# The small and large defaults currently hold the same values; they are built
# separately so that they remain independent objects.
catboost_small_default_grid = _catboost_default_grid()
catboost_large_default_grid = _catboost_default_grid()


# GATE

In [29]:
def _gate_default_grid(batch_size):
    """Return a freshly built default GATE grid for the given batch size.

    Every tunable entry lists exactly one candidate value. Each call creates
    new nested containers, so the large and small grids share no mutable state.
    """
    return {
        # Run-level settings (plain values, not candidate lists).
        "outer_params": {
            "hyperopt_evals": 1,
            "auto_lr_find": True,
            "max_epochs": 1000,
            "val_size": 0.15,
            "early_stopping_patience": 5,
        },
        "batch_size": [batch_size],
        "optimizer_fn": {
            "Adam": {"weight_decay": [0.0], "learning_rate": [0.001]},
        },
        "scheduler_fn": {
            "ReduceLROnPlateau": {"factor": [0.1], "patience": [5]},
        },
    }


# The two variants differ only in batch size.
gate_large_default_grid = _gate_default_grid(1024)
gate_small_default_grid = _gate_default_grid(128)

# TABNET

In [30]:
def _tabnet_default_grid(batch_size):
    """Return a freshly built default TabNet grid for the given batch size.

    Every tunable entry lists exactly one candidate value. Each call creates
    new nested containers, so the large and small grids share no mutable state.
    """
    return {
        # Run-level settings (plain values, not candidate lists).
        "outer_params": {
            "hyperopt_evals": 1,
            "auto_lr_find": True,
            "max_epochs": 1000,
            "val_size": 0.15,
            "early_stopping_patience": 5,
        },
        "batch_size": [batch_size],
        "optimizer_fn": {
            "Adam": {"weight_decay": [0.0], "learning_rate": [0.001]},
        },
        "scheduler_fn": {
            "ReduceLROnPlateau": {"factor": [0.1], "patience": [5]},
        },
    }


# The two variants differ only in batch size.
tabnet_large_default_grid = _tabnet_default_grid(1024)
tabnet_small_default_grid = _tabnet_default_grid(128)


# FT-Transformer

In [31]:
def _fttransformer_default_grid(batch_size):
    """Return a freshly built default FT-Transformer grid for the given batch size.

    Every tunable entry lists exactly one candidate value. Each call creates
    new nested containers, so the large and small grids share no mutable state.
    """
    return {
        # Run-level settings (plain values, not candidate lists).
        "outer_params": {
            "hyperopt_evals": 1,
            "auto_lr_find": True,
            "max_epochs": 1000,
            "val_size": 0.15,
            "early_stopping_patience": 5,
        },
        "batch_size": [batch_size],
        "optimizer_fn": {
            "Adam": {"weight_decay": [0.0], "learning_rate": [0.001]},
        },
        "scheduler_fn": {
            "ReduceLROnPlateau": {"factor": [0.1], "patience": [5]},
        },
    }


# The two variants differ only in batch size.
fttransformer_large_default_grid = _fttransformer_default_grid(1024)
fttransformer_small_default_grid = _fttransformer_default_grid(128)

# GANDALF

In [32]:
def _gandalf_default_grid(batch_size):
    """Return a freshly built default GANDALF grid for the given batch size.

    Every tunable entry lists exactly one candidate value. Each call creates
    new nested containers, so the large and small grids share no mutable state.
    """
    return {
        # Run-level settings (plain values, not candidate lists).
        "outer_params": {
            "hyperopt_evals": 1,
            "auto_lr_find": True,
            "max_epochs": 1000,
            "val_size": 0.15,
            "early_stopping_patience": 5,
        },
        "batch_size": [batch_size],
        "optimizer_fn": {
            "Adam": {"weight_decay": [0.0], "learning_rate": [0.001]},
        },
        "scheduler_fn": {
            "ReduceLROnPlateau": {"factor": [0.1], "patience": [5]},
        },
    }


# The two variants differ only in batch size.
gandalf_large_default_grid = _gandalf_default_grid(1024)
gandalf_small_default_grid = _gandalf_default_grid(128)

# Node

In [33]:
def _node_default_grid(batch_size):
    """Return a freshly built default NODE grid for the given batch size.

    Every tunable entry lists exactly one candidate value. Each call creates
    new nested containers, so the large and small grids share no mutable state.
    """
    return {
        # Run-level settings (plain values, not candidate lists).
        "outer_params": {
            "hyperopt_evals": 1,
            "auto_lr_find": True,
            "max_epochs": 1000,
            "val_size": 0.15,
            "early_stopping_patience": 5,
        },
        "batch_size": [batch_size],
        "optimizer_fn": {
            "Adam": {"weight_decay": [0.0], "learning_rate": [0.001]},
        },
        "scheduler_fn": {
            "ReduceLROnPlateau": {"factor": [0.1], "patience": [5]},
        },
    }


# The two variants differ only in batch size.
node_large_default_grid = _node_default_grid(1024)
node_small_default_grid = _node_default_grid(128)

# Category Embedding

In [34]:
def _catembed_default_grid(batch_size):
    """Return a freshly built default Category Embedding grid for the given batch size.

    Every tunable entry lists exactly one candidate value. Each call creates
    new nested containers, so the large and small grids share no mutable state.
    """
    return {
        # Run-level settings (plain values, not candidate lists).
        "outer_params": {
            "hyperopt_evals": 1,
            "auto_lr_find": True,
            "max_epochs": 1000,
            "val_size": 0.15,
            "early_stopping_patience": 5,
        },
        "batch_size": [batch_size],
        "optimizer_fn": {
            "Adam": {"weight_decay": [0.0], "learning_rate": [0.001]},
        },
        "scheduler_fn": {
            "ReduceLROnPlateau": {"factor": [0.1], "patience": [5]},
        },
    }


# The two variants differ only in batch size.
catembed_large_default_grid = _catembed_default_grid(1024)
catembed_small_default_grid = _catembed_default_grid(128)



# TabTransformer

In [35]:
def _tabtransformer_default_grid(batch_size):
    """Return a freshly built default TabTransformer grid for the given batch size.

    Every tunable entry lists exactly one candidate value. Each call creates
    new nested containers, so the large and small grids share no mutable state.
    """
    return {
        # Run-level settings (plain values, not candidate lists).
        "outer_params": {
            "hyperopt_evals": 1,
            "auto_lr_find": True,
            "max_epochs": 1000,
            "val_size": 0.15,
            "early_stopping_patience": 5,
        },
        "batch_size": [batch_size],
        "optimizer_fn": {
            "Adam": {"weight_decay": [0.0], "learning_rate": [0.001]},
        },
        "scheduler_fn": {
            "ReduceLROnPlateau": {"factor": [0.1], "patience": [5]},
        },
    }


# The two variants differ only in batch size.
tabtransformer_large_default_grid = _tabtransformer_default_grid(1024)
tabtransformer_small_default_grid = _tabtransformer_default_grid(128)


# AutoInt

In [36]:
def _autoint_default_grid(batch_size):
    """Return a freshly built default AutoInt grid for the given batch size.

    Every tunable entry lists exactly one candidate value. Each call creates
    new nested containers, so the large and small grids share no mutable state.
    """
    return {
        # Run-level settings (plain values, not candidate lists).
        "outer_params": {
            "hyperopt_evals": 1,
            "auto_lr_find": True,
            "max_epochs": 1000,
            "val_size": 0.15,
            "early_stopping_patience": 5,
        },
        "batch_size": [batch_size],
        "optimizer_fn": {
            "Adam": {"weight_decay": [0.0], "learning_rate": [0.001]},
        },
        "scheduler_fn": {
            "ReduceLROnPlateau": {"factor": [0.1], "patience": [5]},
        },
    }


# The two variants differ only in batch size.
autoint_large_default_grid = _autoint_default_grid(1024)
autoint_small_default_grid = _autoint_default_grid(128)


# RESNET

In [37]:
def _resnet_default_grid(batch_size):
    """Return a freshly built default ResNet grid for the given batch size.

    Every tunable entry lists exactly one candidate value. Each call creates
    new nested containers, so the small and large grids share no mutable state.
    """
    return {
        # Run-level settings (plain values, not candidate lists).
        "outer_params": {
            "hyperopt_evals": 1,
            "max_epochs": 1000,
            "early_stopping": True,
            "early_stopping_patience": 6,
            "validation_fraction": 0.2,
        },
        # Top-level entries; these are siblings of "outer_params", not members of it.
        "resnet_depth": ["resnet18"],
        "batch_size": [batch_size],
        "optimizer_fn": {
            "Adam": {"weight_decay": [0.0], "learning_rate": [0.001]},
        },
        "scheduler_fn": {
            "ReduceLROnPlateau": {"factor": [0.1], "patience": [5]},
        },
    }


# The two variants differ only in batch size.
resnet_small_default_grid = _resnet_default_grid(128)
resnet_large_default_grid = _resnet_default_grid(1024)

In [38]:
# Full dataset x model run matrix -- currently disabled, so the list is empty.
#
# Each disabled entry had the form
#   generate_model_template(<dataset>, <model>, param_grid=<grid>.copy())
# e.g.
#   generate_model_template("housing", "xgb", param_grid=xgb_large_default_grid.copy())
#
# Models per dataset, in order (grid variable prefix in parentheses where it
# differs from the model name):
#   xgb, mlp, resnet, s1dcnn, tabnet, gate, fttransformer,
#   categoryembedding (catembed), gandalf, node, autoint, tabtransformer, catboost
#
# Datasets, in order, with the grid size each one used:
#   housing    -> *_large_default_grid
#   iris       -> *_small_default_grid (except xgb and mlp, which used the large grids)
#   titanic    -> *_small_default_grid
#   adult      -> *_small_default_grid
#   heloc      -> *_large_default_grid
#   covertype  -> *_large_default_grid
#   creditcard -> *_large_default_grid
#   diabetes   -> *_large_default_grid
templatesfull = []



In [39]:
# Single-run lists: one creditcard run each.
# Note: dict.copy() is shallow, so only the top level of each grid is duplicated here.
templates1 = [
    generate_model_template(
        "creditcard", "categoryembedding", param_grid=catembed_large_default_grid.copy()
    ),
]

templates2 = [
    generate_model_template(
        "creditcard", "gandalf", param_grid=gandalf_large_default_grid.copy()
    ),
]

templates3 = [
    generate_model_template(
        "creditcard", "fttransformer", param_grid=fttransformer_large_default_grid.copy()
    ),
]

# (model name, large default grid) pairs, in the order the runs are queued.
_large_grid_by_model = (
    ("xgb", xgb_large_default_grid),
    ("mlp", mlp_large_default_grid),
    ("resnet", resnet_large_default_grid),
    ("s1dcnn", s1dcnn_large_default_grid),
    ("tabnet", tabnet_large_default_grid),
    ("gate", gate_large_default_grid),
    ("fttransformer", fttransformer_large_default_grid),
    ("categoryembedding", catembed_large_default_grid),
    ("gandalf", gandalf_large_default_grid),
    ("node", node_large_default_grid),
    ("autoint", autoint_large_default_grid),
    ("tabtransformer", tabtransformer_large_default_grid),
    ("catboost", catboost_large_default_grid),
)

# Every model on creditcard first, then every model on diabetes.
templates4 = [
    generate_model_template(dataset, model, param_grid=grid.copy())
    for dataset in ("creditcard", "diabetes")
    for model, grid in _large_grid_by_model
]

In [40]:
# Display the single-run template list to check the generated structure.
templates1

[{'dataset': 'creditcard',
  'model': 'categoryembedding',
  'best_params': {},
  'param_grid': {'outer_params': {'hyperopt_evals': 1,
    'auto_lr_find': True,
    'max_epochs': 1000,
    'val_size': 0.15,
    'early_stopping_patience': 5},
   'batch_size': [1024],
   'optimizer_fn': {'Adam': {'weight_decay': [0.0], 'learning_rate': [0.001]}},
   'scheduler_fn': {'ReduceLROnPlateau': {'factor': [0.1], 'patience': [5]}}}}]

# smart allocation

In [49]:
import pandas as pd

# Load the previously recorded results.
df = pd.read_csv(r"../output/DEFAULT_FINAL.csv")

# One row per distinct (dataset, model, run_time) triple, plus a
# "<dataset>/<model>" key column named "k".
existing_combinations = (
    df[["dataset", "model", "run_time"]]
    .drop_duplicates()
    .assign(k=lambda frame: frame["dataset"] + "/" + frame["model"])
)

# Map each key to its run_time; if a key occurs more than once, the last row wins.
result_dict = dict(zip(existing_combinations["k"], existing_combinations["run_time"]))
result_dict

{'titanic/xgb': 0.8589644432067871,
 'titanic/catboost': 31.50035524368286,
 'titanic/s1dcnn': 1.7213973999023438,
 'titanic/mlp': 0.6242845058441162,
 'titanic/tabnet': 43.0797176361084,
 'titanic/gate': 261.26929807662964,
 'titanic/fttransformer': 49.21467804908752,
 'titanic/categoryembedding': 15.77493143081665,
 'titanic/gandalf': 23.48309540748596,
 'titanic/autoint': 17.96108341217041,
 'titanic/tabtransformer': 40.36361908912659,
 'housing/xgb': 3.364003419876098,
 'housing/mlp': 45.612706422805786,
 'housing/s1dcnn': 5.777416467666626,
 'housing/tabnet': 319.87358140945435,
 'housing/gate': 1054.847452878952,
 'housing/fttransformer': 432.6749892234802,
 'housing/categoryembedding': 156.21004390716553,
 'housing/gandalf': 154.9490053653717,
 'housing/autoint': 125.7169153690338,
 'housing/tabtransformer': 58.195149421691895,
 'housing/catboost': 19.411662817001343,
 'iris/xgb': 1.4646930694580078,
 'iris/mlp': 0.0967371463775634,
 'iris/s1dcnn': 0.2426009178161621,
 'iris/tab

In [50]:
# "<dataset>/<model>" keys for the runs in templates4, in the same order.
initial_queue = ["/".join((entry["dataset"], entry["model"])) for entry in templates4]
initial_queue

['creditcard/xgb',
 'creditcard/mlp',
 'creditcard/resnet',
 'creditcard/s1dcnn',
 'creditcard/tabnet',
 'creditcard/gate',
 'creditcard/fttransformer',
 'creditcard/categoryembedding',
 'creditcard/gandalf',
 'creditcard/node',
 'creditcard/autoint',
 'creditcard/tabtransformer',
 'creditcard/catboost',
 'diabetes/xgb',
 'diabetes/mlp',
 'diabetes/resnet',
 'diabetes/s1dcnn',
 'diabetes/tabnet',
 'diabetes/gate',
 'diabetes/fttransformer',
 'diabetes/categoryembedding',
 'diabetes/gandalf',
 'diabetes/node',
 'diabetes/autoint',
 'diabetes/tabtransformer',
 'diabetes/catboost']

In [51]:
# Recorded run times restricted to the queued combinations. Iteration follows
# result_dict, so queued keys that have no recorded run time are simply absent.
initial_queue_weight = {
    combo: run_time
    for combo, run_time in result_dict.items()
    if combo in initial_queue
}
initial_queue_weight

{'creditcard/xgb': 313.9121091365814,
 'diabetes/xgb': 355.15988636016846,
 'creditcard/mlp': 77.6291835308075,
 'diabetes/mlp': 58.441378355026245,
 'diabetes/resnet': 3681.2359352111816,
 'diabetes/s1dcnn': 36.27701234817505,
 'diabetes/tabnet': 453.4024243354797,
 'diabetes/gate': 1246.7368049621582,
 'creditcard/resnet': 2291.049815416336,
 'creditcard/s1dcnn': 128.48831725120544,
 'creditcard/tabnet': 1305.791773557663,
 'diabetes/fttransformer': 2329.688283681869,
 'diabetes/categoryembedding': 233.2397403717041,
 'diabetes/gandalf': 295.1254608631134,
 'diabetes/autoint': 254.42786955833435,
 'creditcard/gate': 3787.559681653976,
 'diabetes/tabtransformer': 2395.721166610718,
 'diabetes/catboost': 353.6942434310913,
 'creditcard/autoint': 513.1119918823242,
 'creditcard/tabtransformer': 459.1066381931305,
 'creditcard/catboost': 83.85805225372314}

In [44]:
# Wrap the run list under a "runs" key.
# NOTE(review): `runs_dict` is not what gets serialized below -- the bare
# `templates1` list is dumped. Confirm which layout the config reader expects.
runs_dict = dict(runs=templates1)

# Write the template list as block-style YAML, keeping key insertion order.
with open("../configuration/experiment_runs1.yml", mode="w") as yaml_file:
    yaml.dump(templates1, yaml_file, default_flow_style=False, sort_keys=False)

In [45]:
# Wrap the run list under a "runs" key.
# NOTE(review): `runs_dict` is not what gets serialized below -- the bare
# `templates2` list is dumped. Confirm which layout the config reader expects.
runs_dict = dict(runs=templates2)

# Write the template list as block-style YAML, keeping key insertion order.
with open("../configuration/experiment_runs2.yml", mode="w") as yaml_file:
    yaml.dump(templates2, yaml_file, default_flow_style=False, sort_keys=False)

In [46]:
# Wrap the run list under a "runs" key.
# NOTE(review): `runs_dict` is not what gets serialized below -- the bare
# `templates3` list is dumped. Confirm which layout the config reader expects.
runs_dict = dict(runs=templates3)

# Write the template list as block-style YAML, keeping key insertion order.
with open("../configuration/experiment_runs3.yml", mode="w") as yaml_file:
    yaml.dump(templates3, yaml_file, default_flow_style=False, sort_keys=False)