In [1]:
import os
import optuna
import numpy as np
import pandas as pd
import warnings
from two_class_nested_cv import NestedCVOptimizer

# Silence every warning category for the rest of the session so the long
# optimisation logs stay readable.
# NOTE(review): this also hides deprecation/convergence warnings - consider
# narrowing the filter to specific categories or modules.
warnings.filterwarnings('ignore')

  from .autonotebook import tqdm as notebook_tqdm


In [2]:
def nested_cv(X, y, groups, positive_class="void", n_outer_folds=5,
              n_inner_folds=3, n_trials=50, random_state=42):
    """
    Run nested cross-validation and return the optimizer's results table.

    Builds a ``NestedCVOptimizer``, runs it, prints a short summary of the
    best model, and returns ``optimizer.get_results_dataframe()``.

    Parameters
    ----------
    X, y, groups :
        Features, labels and group identifiers; forwarded unchanged to
        ``NestedCVOptimizer``.
    positive_class : str, default "void"
        Label treated as the positive class by the optimizer.
    n_outer_folds : int, default 5
        Forwarded as ``n_outer_folds``.
    n_inner_folds : int, default 3
        Forwarded as ``n_inner_folds``.
    n_trials : int, default 50
        Forwarded as ``n_trials`` (presumably the number of tuning trials
        per model - confirm against ``NestedCVOptimizer``).
    random_state : int, default 42
        Forwarded as ``random_state``.

    Returns
    -------
    The object returned by ``optimizer.get_results_dataframe()``.

    Raises
    ------
    KeyError
        If the summary returned by ``run_nested_cv()`` lacks one of the keys
        ``'best_model'``, ``'best_f1_positive'`` or ``'best_accuracy'``.
    """
    # Initialize and run optimizer
    optimizer = NestedCVOptimizer(
        X=X,
        y=y,
        groups=groups,
        positive_class=positive_class,
        n_outer_folds=n_outer_folds,
        n_inner_folds=n_inner_folds,
        n_trials=n_trials,
        random_state=random_state
    )

    print("\nRunning nested cross-validation...")
    summaries = optimizer.run_nested_cv()

    # Display summary. The bar-chart emoji is written as an escape so the
    # source survives being saved or exported with a non-UTF-8 encoding.
    print("\n\U0001F4CA RESULTS SUMMARY:")
    print(f"Best performing model: {summaries['best_model'].upper()}")
    print(f"Best F1 (positive): {summaries['best_f1_positive']:.4f}")
    print(f"Best accuracy: {summaries['best_accuracy']:.4f}")

    return optimizer.get_results_dataframe()

In [3]:
# Feature CSVs to evaluate: one per (1s..5s, 'no' / '0.5' / '0.8') combination,
# ordered by the leading number first and the trailing tag second.
files = [
    f'two_class_raw_{seconds}s_{suffix}.csv'
    for seconds in range(1, 6)
    for suffix in ('no', '0.5', '0.8')
]

# Directory that holds the feature CSVs listed above.
base_path = '/home/edumaba/Public/MPhil_Thesis/Code/wear_uropatch/feature_datasets/subject_based_norm/feature_set_2'

1. Loop through all files.
2. Perform nested cross-validation on each file.
3. Store the results in the format shown below.

![Output format](/home/edumaba/Public/MPhil_Thesis/Code/wear_uropatch/output_format.png)


In [4]:
# Run nested cross-validation on every feature file, write each result table
# to CSV, and keep the tables in memory keyed by experiment name.
output_dir = '/home/edumaba/Public/MPhil_Thesis/Code/wear_uropatch/sb_norm_analysis/two_class/nested_cv_results/feature_set_2'
# to_csv does not create missing folders; ensure the target exists up front so
# a long optimisation run cannot fail only at the save step.
os.makedirs(output_dir, exist_ok=True)

all_results = {}
for file in files:
    data_path = os.path.join(base_path, file)
    # Drop the timing columns without mutating in place.
    features = pd.read_csv(data_path).drop(
        columns=['center_time', 'start_time', 'end_time']
    )

    # 'two_class_raw_<a>_<b>.csv' -> '<a>_<b>', e.g. '1s_no' or '3s_0.5'
    # (presumably window length and overlap - confirm against the dataset docs).
    size_tag, overlap_tag = os.path.splitext(file)[0].split('_')[-2:]
    exp_name = f"{size_tag}_{overlap_tag}"
    print(f"Nested cross-validation for {exp_name}")

    X = features.drop(columns=['label', 'experiment_id'])
    y = features['label']
    groups = features['experiment_id']

    results_df = nested_cv(X, y, groups)
    # Previously the dict was created but never filled.
    all_results[exp_name] = results_df

    # Save to csv (file name unchanged from the original run).
    results_df.to_csv(
        os.path.join(output_dir, f'all_metrics_nested_cv_{exp_name}_zwei.csv')
    )
    


[I 2025-09-01 15:46:11,168] A new study created in memory with name: no-name-f775d019-cca1-4598-81c9-3c688a331823


Nested cross-validation for 1s_no
Positive class 'void' is encoded as: 1
Label mapping: {'non-void': np.int64(0), 'void': np.int64(1)}

Running nested cross-validation...
Starting Binary Nested Cross-Validation with separate optimization for each model...
Positive class: 'void' (encoded as 1)

OUTER FOLD 1/5
Train size: 2004, Test size: 408
Class distribution in test set: {'non-void': np.int64(226), 'void': np.int64(182)}

--- Optimizing RF ---


[I 2025-09-01 15:46:12,477] Trial 0 finished with value: 0.5855703850995854 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.5855703850995854.
[I 2025-09-01 15:46:14,030] Trial 1 finished with value: 0.5862348311678786 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.5862348311678786.
[I 2025-09-01 15:46:24,443] Trial 2 finished with value: 0.5848938682947935 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.5862348311678786.
[I 2025-09-01 15:46:35,999] Trial 3 finished with value: 0.5767940828091817 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 398, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 3, 'max_features': None, 'bootstrap': True}
Best rf F1 score (positive class): 0.6140


[I 2025-09-01 15:52:50,596] A new study created in memory with name: no-name-37d86293-86bb-4693-9ed7-cf5ac43199a1


rf test accuracy: 0.6887
rf test F1 (positive): 0.6558

--- Optimizing XGB ---


[I 2025-09-01 15:52:53,518] Trial 0 finished with value: 0.5296677801537175 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5296677801537175.
[I 2025-09-01 15:52:55,193] Trial 1 finished with value: 0.5103492384280561 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.5296677801537175.
[I 2025-09-01 15:52:56,650] Trial 2 finished with value: 0.5473883666890901 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 146, 'max_depth': 6, 'learning_rate': 0.04955817146053165, 'subsample': 0.9438808931823901, 'colsample_bytree': 0.7496279102241226, 'min_child_weight': 5, 'gamma': 3.688904122873095, 'reg_alpha': 1.5180037003938782, 'reg_lambda': 1.839206620815206}
Best xgb F1 score (positive class): 0.5702


[I 2025-09-01 15:54:29,740] A new study created in memory with name: no-name-199f2c45-6df5-4295-8ec2-3d81b30956b5
[I 2025-09-01 15:54:29,787] Trial 0 finished with value: 0.5360280492947073 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5360280492947073.


xgb test accuracy: 0.6789
xgb test F1 (positive): 0.6289

--- Optimizing DT ---


[I 2025-09-01 15:54:30,347] Trial 1 finished with value: 0.4932709647590133 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.5360280492947073.
[I 2025-09-01 15:54:30,391] Trial 2 finished with value: 0.6145835604077119 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.6145835604077119.
[I 2025-09-01 15:54:30,420] Trial 3 finished with value: 0.6248878248185149 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.6248878248185149.
[I 2025-09-01 15:54:30,446] Trial 4 finished with value: 0.6288879378804252 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_

Best dt params: {'criterion': 'entropy', 'max_depth': 2, 'min_samples_split': 4, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6376
dt test accuracy: 0.6471
dt test F1 (positive): 0.5414

OUTER FOLD 2/5
Train size: 1939, Test size: 473
Class distribution in test set: {'non-void': np.int64(241), 'void': np.int64(232)}

--- Optimizing RF ---


[I 2025-09-01 15:54:35,318] Trial 0 finished with value: 0.5620493377631628 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.5620493377631628.
[I 2025-09-01 15:54:36,711] Trial 1 finished with value: 0.5957192675420864 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.5957192675420864.
[I 2025-09-01 15:54:45,574] Trial 2 finished with value: 0.5462705866175828 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.5957192675420864.
[I 2025-09-01 15:54:56,528] Trial 3 finished with value: 0.5478735095149011 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 415, 'max_depth': 3, 'min_samples_split': 18, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'bootstrap': False}
Best rf F1 score (positive class): 0.5975


[I 2025-09-01 15:57:31,082] A new study created in memory with name: no-name-92757ea2-dcd7-4c74-a284-7a48075e0d15


rf test accuracy: 0.6702
rf test F1 (positive): 0.6406

--- Optimizing XGB ---


[I 2025-09-01 15:57:35,418] Trial 0 finished with value: 0.5311621228772999 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5311621228772999.
[I 2025-09-01 15:57:37,424] Trial 1 finished with value: 0.5452027665786862 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 1 with value: 0.5452027665786862.
[I 2025-09-01 15:57:39,671] Trial 2 finished with value: 0.5323403865992559 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 394, 'max_depth': 4, 'learning_rate': 0.14214333793545983, 'subsample': 0.8131257183514556, 'colsample_bytree': 0.6200076270075697, 'min_child_weight': 7, 'gamma': 3.4129256212255425, 'reg_alpha': 1.7042965114014081, 'reg_lambda': 1.1773668981242087}
Best xgb F1 score (positive class): 0.5618


[I 2025-09-01 15:59:49,772] A new study created in memory with name: no-name-c0e07df6-1057-4d51-b033-d895efb8dce0
[I 2025-09-01 15:59:49,824] Trial 0 finished with value: 0.5007220333475164 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5007220333475164.


xgb test accuracy: 0.5877
xgb test F1 (positive): 0.5278

--- Optimizing DT ---


[I 2025-09-01 15:59:50,352] Trial 1 finished with value: 0.4968166902579077 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.5007220333475164.
[I 2025-09-01 15:59:50,400] Trial 2 finished with value: 0.5826043014728539 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.5826043014728539.
[I 2025-09-01 15:59:50,431] Trial 3 finished with value: 0.6204843298021657 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.6204843298021657.
[I 2025-09-01 15:59:50,458] Trial 4 finished with value: 0.40571499830759095 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max

Best dt params: {'criterion': 'entropy', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 4, 'max_features': 'log2', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6589
dt test accuracy: 0.6448
dt test F1 (positive): 0.6957

OUTER FOLD 3/5
Train size: 1818, Test size: 594
Class distribution in test set: {'non-void': np.int64(436), 'void': np.int64(158)}

--- Optimizing RF ---


[I 2025-09-01 15:59:54,777] Trial 0 finished with value: 0.6579248735136446 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6579248735136446.
[I 2025-09-01 15:59:56,226] Trial 1 finished with value: 0.6610389202010576 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6610389202010576.
[I 2025-09-01 16:00:05,127] Trial 2 finished with value: 0.6501210765509239 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6610389202010576.
[I 2025-09-01 16:00:15,064] Trial 3 finished with value: 0.6382824823641374 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 224, 'max_depth': 3, 'min_samples_split': 16, 'min_samples_leaf': 3, 'max_features': 'sqrt', 'bootstrap': False}
Best rf F1 score (positive class): 0.6642


[I 2025-09-01 16:02:01,991] A new study created in memory with name: no-name-5ba0b86e-6002-46ae-bfc3-3d32231bc830


rf test accuracy: 0.7340
rf test F1 (positive): 0.5269

--- Optimizing XGB ---


[I 2025-09-01 16:02:05,775] Trial 0 finished with value: 0.6292421497458909 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.6292421497458909.
[I 2025-09-01 16:02:07,785] Trial 1 finished with value: 0.6220444291761719 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.6292421497458909.
[I 2025-09-01 16:02:09,781] Trial 2 finished with value: 0.6169556981143196 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 165, 'max_depth': 11, 'learning_rate': 0.026411465232795833, 'subsample': 0.9777543984480053, 'colsample_bytree': 0.6468562615498967, 'min_child_weight': 3, 'gamma': 4.722168057481616, 'reg_alpha': 1.632393267947069, 'reg_lambda': 0.5029437330178884}
Best xgb F1 score (positive class): 0.6598


[I 2025-09-01 16:04:47,622] A new study created in memory with name: no-name-586aafa8-d298-4c15-9213-0b8d3fbc9f31
[I 2025-09-01 16:04:47,670] Trial 0 finished with value: 0.5677187173130378 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5677187173130378.


xgb test accuracy: 0.6852
xgb test F1 (positive): 0.4762

--- Optimizing DT ---


[I 2025-09-01 16:04:48,178] Trial 1 finished with value: 0.5423094573711374 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.5677187173130378.
[I 2025-09-01 16:04:48,223] Trial 2 finished with value: 0.6299642153155918 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.6299642153155918.
[I 2025-09-01 16:04:48,253] Trial 3 finished with value: 0.6706697840786259 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.6706697840786259.
[I 2025-09-01 16:04:48,281] Trial 4 finished with value: 0.6468815589361322 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_

Best dt params: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 13, 'min_samples_leaf': 7, 'max_features': None, 'splitter': 'random'}
Best dt F1 score (positive class): 0.6859
dt test accuracy: 0.5084
dt test F1 (positive): 0.4729

OUTER FOLD 4/5
Train size: 1842, Test size: 570
Class distribution in test set: {'non-void': np.int64(341), 'void': np.int64(229)}

--- Optimizing RF ---


[I 2025-09-01 16:04:51,752] Trial 0 finished with value: 0.5835464609621909 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.5835464609621909.
[I 2025-09-01 16:04:53,212] Trial 1 finished with value: 0.6099986770024118 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6099986770024118.
[I 2025-09-01 16:05:02,119] Trial 2 finished with value: 0.5761878396278992 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6099986770024118.
[I 2025-09-01 16:05:12,219] Trial 3 finished with value: 0.569560419074407 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_features

Best rf params: {'n_estimators': 318, 'max_depth': 3, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_features': 'sqrt', 'bootstrap': True}
Best rf F1 score (positive class): 0.6223


[I 2025-09-01 16:07:22,463] A new study created in memory with name: no-name-6e1358f7-5ed7-4a79-89a1-fc49f24b124c


rf test accuracy: 0.6860
rf test F1 (positive): 0.5536

--- Optimizing XGB ---


[I 2025-09-01 16:07:26,125] Trial 0 finished with value: 0.5548817005900556 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5548817005900556.
[I 2025-09-01 16:07:28,359] Trial 1 finished with value: 0.5404049445865302 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.5548817005900556.
[I 2025-09-01 16:07:30,511] Trial 2 finished with value: 0.5591002692620236 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 264, 'max_depth': 7, 'learning_rate': 0.1631273578473762, 'subsample': 0.6351627961488784, 'colsample_bytree': 0.7824936169233744, 'min_child_weight': 1, 'gamma': 2.3565648626755773, 'reg_alpha': 1.234794556911147, 'reg_lambda': 1.4166201428873948}
Best xgb F1 score (positive class): 0.5734


[I 2025-09-01 16:10:10,886] A new study created in memory with name: no-name-31fe006d-5fa4-46a6-92f2-ee2d3951efb2
[I 2025-09-01 16:10:10,933] Trial 0 finished with value: 0.4511785892835934 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.4511785892835934.


xgb test accuracy: 0.6737
xgb test F1 (positive): 0.5027

--- Optimizing DT ---


[I 2025-09-01 16:10:11,478] Trial 1 finished with value: 0.48549390137443527 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 1 with value: 0.48549390137443527.
[I 2025-09-01 16:10:11,523] Trial 2 finished with value: 0.528687872929795 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.528687872929795.
[I 2025-09-01 16:10:11,553] Trial 3 finished with value: 0.6130881841193268 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.6130881841193268.
[I 2025-09-01 16:10:11,580] Trial 4 finished with value: 0.40628741473786706 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max

Best dt params: {'criterion': 'gini', 'max_depth': 4, 'min_samples_split': 16, 'min_samples_leaf': 10, 'max_features': 'log2', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6541
dt test accuracy: 0.6825
dt test F1 (positive): 0.6057

OUTER FOLD 5/5
Train size: 2045, Test size: 367
Class distribution in test set: {'non-void': np.int64(202), 'void': np.int64(165)}

--- Optimizing RF ---


[I 2025-09-01 16:10:15,298] Trial 0 finished with value: 0.5868867634555232 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.5868867634555232.
[I 2025-09-01 16:10:16,840] Trial 1 finished with value: 0.6100344961637489 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6100344961637489.
[I 2025-09-01 16:10:27,214] Trial 2 finished with value: 0.5634703656575074 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6100344961637489.
[I 2025-09-01 16:10:39,307] Trial 3 finished with value: 0.5627993899763667 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 424, 'max_depth': 3, 'min_samples_split': 18, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}
Best rf F1 score (positive class): 0.6109


[I 2025-09-01 16:13:32,348] A new study created in memory with name: no-name-5532aa95-b521-4a7b-8dbd-b04da48c944b


rf test accuracy: 0.7003
rf test F1 (positive): 0.6746

--- Optimizing XGB ---


[I 2025-09-01 16:13:36,595] Trial 0 finished with value: 0.5460858380333918 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5460858380333918.
[I 2025-09-01 16:13:38,844] Trial 1 finished with value: 0.554887657570601 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 1 with value: 0.554887657570601.
[I 2025-09-01 16:13:40,980] Trial 2 finished with value: 0.5512974113545309 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.65

Best xgb params: {'n_estimators': 110, 'max_depth': 12, 'learning_rate': 0.17370220706835007, 'subsample': 0.8624266177504052, 'colsample_bytree': 0.8735024117681786, 'min_child_weight': 3, 'gamma': 3.4044599281828924, 'reg_alpha': 0.3398051739804243, 'reg_lambda': 0.8963814323766668}
Best xgb F1 score (positive class): 0.5797


[I 2025-09-01 16:15:32,287] A new study created in memory with name: no-name-147f5d44-63f5-4442-acaf-6e0c94b8b108
[I 2025-09-01 16:15:32,339] Trial 0 finished with value: 0.49724594197200656 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.49724594197200656.


xgb test accuracy: 0.6730
xgb test F1 (positive): 0.6591

--- Optimizing DT ---


[I 2025-09-01 16:15:32,949] Trial 1 finished with value: 0.49463235294117647 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.49724594197200656.
[I 2025-09-01 16:15:33,006] Trial 2 finished with value: 0.5523621333130814 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.5523621333130814.
[I 2025-09-01 16:15:33,054] Trial 3 finished with value: 0.47168380095324364 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.5523621333130814.
[I 2025-09-01 16:15:33,091] Trial 4 finished with value: 0.4106879612896274 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'm

Best dt params: {'criterion': 'gini', 'max_depth': 1, 'min_samples_split': 17, 'min_samples_leaf': 8, 'max_features': 'log2', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6413
dt test accuracy: 0.6730
dt test F1 (positive): 0.6809

BINARY NESTED CROSS-VALIDATION RESULTS SUMMARY
Positive class: 'void'

RF Results:
----------------------------------------
accuracy          : 0.6958 ± 0.0239
f1_positive       : 0.6103 ± 0.0657
precision_positive: 0.6279 ± 0.0735
recall_positive   : 0.5993 ± 0.0831
f1_macro          : 0.6758 ± 0.0166
Individual fold accuracies: ['0.6887', '0.6702', '0.7340', '0.6860', '0.7003']
Individual fold F1 (pos): ['0.6558', '0.6406', '0.5269', '0.5536', '0.6746']

XGB Results:
----------------------------------------
accuracy          : 0.6597 ± 0.0405
f1_positive       : 0.5589 ± 0.0805
precision_positive: 0.5894 ± 0.0928
recall_positive   : 0.5462 ± 0.1151
f1_macro          : 0.6364 ± 0.0383
Individual fold accuracies: ['0.6789', '0.5877', '0

[I 2025-09-01 16:15:37,360] Trial 0 finished with value: 0.5816683457952762 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.5816683457952762.
[I 2025-09-01 16:15:39,623] Trial 1 finished with value: 0.6166707502418883 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6166707502418883.
[I 2025-09-01 16:15:59,405] Trial 2 finished with value: 0.5815136106275346 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6166707502418883.
[I 2025-09-01 16:16:25,284] Trial 3 finished with value: 0.5687053409161186 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 415, 'max_depth': 3, 'min_samples_split': 18, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'bootstrap': False}
Best rf F1 score (positive class): 0.6184


[I 2025-09-01 16:21:30,291] A new study created in memory with name: no-name-fa7a0314-cc44-428a-907e-d329e076f9e1


rf test accuracy: 0.6202
rf test F1 (positive): 0.4388

--- Optimizing XGB ---


[I 2025-09-01 16:21:36,669] Trial 0 finished with value: 0.5148766749754529 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5148766749754529.
[I 2025-09-01 16:21:39,555] Trial 1 finished with value: 0.4927142456769589 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.5148766749754529.
[I 2025-09-01 16:21:43,070] Trial 2 finished with value: 0.5137369062503218 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 196, 'max_depth': 12, 'learning_rate': 0.019372166284625944, 'subsample': 0.6926653108768327, 'colsample_bytree': 0.6397536670461723, 'min_child_weight': 5, 'gamma': 4.519424811177247, 'reg_alpha': 1.8119479751257943, 'reg_lambda': 1.6821099117249774}
Best xgb F1 score (positive class): 0.5646


[I 2025-09-01 16:26:48,274] A new study created in memory with name: no-name-bdaed543-711c-436f-be81-654d34c3e802
[I 2025-09-01 16:26:48,352] Trial 0 finished with value: 0.4968491431923121 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.4968491431923121.


xgb test accuracy: 0.6384
xgb test F1 (positive): 0.4335

--- Optimizing DT ---


[I 2025-09-01 16:26:49,558] Trial 1 finished with value: 0.5190706805469033 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 1 with value: 0.5190706805469033.
[I 2025-09-01 16:26:49,639] Trial 2 finished with value: 0.5891200520818717 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.5891200520818717.
[I 2025-09-01 16:26:49,684] Trial 3 finished with value: 0.6209783458816114 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.6209783458816114.
[I 2025-09-01 16:26:49,724] Trial 4 finished with value: 0.6475788723028252 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_

Best dt params: {'criterion': 'entropy', 'max_depth': 2, 'min_samples_split': 17, 'min_samples_leaf': 3, 'max_features': None, 'splitter': 'best'}
Best dt F1 score (positive class): 0.6637
dt test accuracy: 0.6495
dt test F1 (positive): 0.6634

OUTER FOLD 2/5
Train size: 3819, Test size: 949
Class distribution in test set: {'non-void': np.int64(587), 'void': np.int64(362)}

--- Optimizing RF ---


[I 2025-09-01 16:27:02,934] Trial 0 finished with value: 0.6100119082506091 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6100119082506091.
[I 2025-09-01 16:27:05,024] Trial 1 finished with value: 0.6299240738343318 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6299240738343318.
[I 2025-09-01 16:27:24,678] Trial 2 finished with value: 0.611465291519753 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6299240738343318.
[I 2025-09-01 16:27:50,307] Trial 3 finished with value: 0.6023581412700236 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_features

Best rf params: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}
Best rf F1 score (positive class): 0.6299


[I 2025-09-01 16:35:26,326] A new study created in memory with name: no-name-cb992203-06d9-498f-8dde-c26707e9549a


rf test accuracy: 0.7176
rf test F1 (positive): 0.6278

--- Optimizing XGB ---


[I 2025-09-01 16:35:32,845] Trial 0 finished with value: 0.5845920761764729 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5845920761764729.
[I 2025-09-01 16:35:35,863] Trial 1 finished with value: 0.5825049584522256 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.5845920761764729.
[I 2025-09-01 16:35:39,483] Trial 2 finished with value: 0.5845732934117808 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 331, 'max_depth': 6, 'learning_rate': 0.012413189635294229, 'subsample': 0.7243929286862649, 'colsample_bytree': 0.7300733288106989, 'min_child_weight': 8, 'gamma': 3.1877873567760657, 'reg_alpha': 1.774425485152653, 'reg_lambda': 0.9444298503238986}
Best xgb F1 score (positive class): 0.6205


[I 2025-09-01 16:41:19,559] A new study created in memory with name: no-name-2f52747c-f7ed-4d23-8476-dea95b8965b0
[I 2025-09-01 16:41:19,640] Trial 0 finished with value: 0.5463494093464566 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5463494093464566.


xgb test accuracy: 0.6438
xgb test F1 (positive): 0.5266

--- Optimizing DT ---


[I 2025-09-01 16:41:20,890] Trial 1 finished with value: 0.5094999826611751 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.5463494093464566.
[I 2025-09-01 16:41:20,971] Trial 2 finished with value: 0.5824730798660552 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.5824730798660552.
[I 2025-09-01 16:41:21,016] Trial 3 finished with value: 0.6270035619987663 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.6270035619987663.
[I 2025-09-01 16:41:21,055] Trial 4 finished with value: 0.6394230088782717 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_

Best dt params: {'criterion': 'entropy', 'max_depth': 3, 'min_samples_split': 14, 'min_samples_leaf': 10, 'max_features': 'log2', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6491
dt test accuracy: 0.7313
dt test F1 (positive): 0.6483

OUTER FOLD 3/5
Train size: 3855, Test size: 913
Class distribution in test set: {'non-void': np.int64(503), 'void': np.int64(410)}

--- Optimizing RF ---


[I 2025-09-01 16:41:28,418] Trial 0 finished with value: 0.5923470326446384 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.5923470326446384.
[I 2025-09-01 16:41:30,640] Trial 1 finished with value: 0.5970913844018283 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.5970913844018283.
[I 2025-09-01 16:41:50,662] Trial 2 finished with value: 0.5930922605465568 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.5970913844018283.
[I 2025-09-01 16:42:15,969] Trial 3 finished with value: 0.5828754398621049 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 198, 'max_depth': 3, 'min_samples_split': 14, 'min_samples_leaf': 7, 'max_features': None, 'bootstrap': False}
Best rf F1 score (positive class): 0.6295


[I 2025-09-01 16:47:27,792] A new study created in memory with name: no-name-5ba4cba4-66df-4fab-a512-d98054d71336


rf test accuracy: 0.6922
rf test F1 (positive): 0.7153

--- Optimizing XGB ---


[I 2025-09-01 16:47:34,652] Trial 0 finished with value: 0.5838376568215596 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5838376568215596.
[I 2025-09-01 16:47:38,235] Trial 1 finished with value: 0.5775976584487222 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.5838376568215596.
[I 2025-09-01 16:47:41,505] Trial 2 finished with value: 0.5742120336086306 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 298, 'max_depth': 4, 'learning_rate': 0.01036190622392575, 'subsample': 0.6073248792362046, 'colsample_bytree': 0.9848658569074349, 'min_child_weight': 7, 'gamma': 0.4805348372562509, 'reg_alpha': 0.008911233051175853, 'reg_lambda': 0.8703147058466669}
Best xgb F1 score (positive class): 0.5927


[I 2025-09-01 16:51:42,125] A new study created in memory with name: no-name-07ce4bc1-0a4a-46f7-8b98-6161ef8e2bae
[I 2025-09-01 16:51:42,208] Trial 0 finished with value: 0.5393525625981256 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5393525625981256.


xgb test accuracy: 0.7130
xgb test F1 (positive): 0.7207

--- Optimizing DT ---


[I 2025-09-01 16:51:43,417] Trial 1 finished with value: 0.5327326115425642 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.5393525625981256.
[I 2025-09-01 16:51:43,498] Trial 2 finished with value: 0.5408191664278093 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.5408191664278093.
[I 2025-09-01 16:51:43,544] Trial 3 finished with value: 0.6086686311507384 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.6086686311507384.
[I 2025-09-01 16:51:43,582] Trial 4 finished with value: 0.6253855264581447 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_

Best dt params: {'criterion': 'entropy', 'max_depth': 2, 'min_samples_split': 17, 'min_samples_leaf': 5, 'max_features': None, 'splitter': 'best'}
Best dt F1 score (positive class): 0.6563
dt test accuracy: 0.6835
dt test F1 (positive): 0.7124

OUTER FOLD 4/5
Train size: 4086, Test size: 682
Class distribution in test set: {'non-void': np.int64(378), 'void': np.int64(304)}

--- Optimizing RF ---


[I 2025-09-01 16:51:57,990] Trial 0 finished with value: 0.5657886848513628 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.5657886848513628.
[I 2025-09-01 16:52:00,272] Trial 1 finished with value: 0.6066925376898441 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6066925376898441.
[I 2025-09-01 16:52:21,589] Trial 2 finished with value: 0.586435041600568 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6066925376898441.
[I 2025-09-01 16:52:48,885] Trial 3 finished with value: 0.5790846866565452 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_features

Best rf params: {'n_estimators': 313, 'max_depth': 3, 'min_samples_split': 10, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'bootstrap': True}
Best rf F1 score (positive class): 0.6141


[I 2025-09-01 16:57:27,207] A new study created in memory with name: no-name-52aca87c-25f8-4729-b338-6d29d2feba83


rf test accuracy: 0.7581
rf test F1 (positive): 0.7273

--- Optimizing XGB ---


[I 2025-09-01 16:57:33,842] Trial 0 finished with value: 0.5420144677493041 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5420144677493041.
[I 2025-09-01 16:57:36,886] Trial 1 finished with value: 0.5373674765021664 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.5420144677493041.
[I 2025-09-01 16:57:40,171] Trial 2 finished with value: 0.5551636764293129 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 192, 'max_depth': 3, 'learning_rate': 0.01291994187790851, 'subsample': 0.90452928021914, 'colsample_bytree': 0.9710403588505682, 'min_child_weight': 9, 'gamma': 1.3360449211014016, 'reg_alpha': 0.6700120618244569, 'reg_lambda': 0.5935755430736293}
Best xgb F1 score (positive class): 0.5945


[I 2025-09-01 17:00:27,523] A new study created in memory with name: no-name-c0113afa-21d6-4f1b-b4ee-4ba32dfde809
[I 2025-09-01 17:00:27,611] Trial 0 finished with value: 0.4809203076518344 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.4809203076518344.


xgb test accuracy: 0.7243
xgb test F1 (positive): 0.6667

--- Optimizing DT ---


[I 2025-09-01 17:00:28,945] Trial 1 finished with value: 0.49517424921445713 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 1 with value: 0.49517424921445713.
[I 2025-09-01 17:00:29,028] Trial 2 finished with value: 0.5416628024862505 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.5416628024862505.
[I 2025-09-01 17:00:29,077] Trial 3 finished with value: 0.6208859343219725 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.6208859343219725.
[I 2025-09-01 17:00:29,116] Trial 4 finished with value: 0.399089257164761 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max

Best dt params: {'criterion': 'entropy', 'max_depth': 3, 'min_samples_split': 11, 'min_samples_leaf': 4, 'max_features': None, 'splitter': 'random'}
Best dt F1 score (positive class): 0.6514
dt test accuracy: 0.7214
dt test F1 (positive): 0.7246

OUTER FOLD 5/5
Train size: 3534, Test size: 1234
Class distribution in test set: {'non-void': np.int64(858), 'void': np.int64(376)}

--- Optimizing RF ---


[I 2025-09-01 17:00:33,588] Trial 0 finished with value: 0.6183759165796224 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6183759165796224.
[I 2025-09-01 17:00:35,656] Trial 1 finished with value: 0.6552686878577539 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6552686878577539.
[I 2025-09-01 17:00:53,747] Trial 2 finished with value: 0.6221068802062364 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6552686878577539.
[I 2025-09-01 17:01:16,129] Trial 3 finished with value: 0.6127267910831693 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 438, 'max_depth': 4, 'min_samples_split': 19, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}
Best rf F1 score (positive class): 0.6571


[I 2025-09-01 17:06:00,196] A new study created in memory with name: no-name-94c723f0-0521-406e-8bd0-2d58f66220de


rf test accuracy: 0.7504
rf test F1 (positive): 0.6342

--- Optimizing XGB ---


[I 2025-09-01 17:06:06,189] Trial 0 finished with value: 0.5930748531628791 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5930748531628791.
[I 2025-09-01 17:06:09,624] Trial 1 finished with value: 0.5663374624815164 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.5930748531628791.
[I 2025-09-01 17:06:12,599] Trial 2 finished with value: 0.5864498361725629 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 297, 'max_depth': 3, 'learning_rate': 0.012081460388966592, 'subsample': 0.9520528248401178, 'colsample_bytree': 0.7344817072933508, 'min_child_weight': 10, 'gamma': 2.194061536947019, 'reg_alpha': 0.09610931064597383, 'reg_lambda': 1.2624893067189227}
Best xgb F1 score (positive class): 0.6449


[I 2025-09-01 17:09:28,621] A new study created in memory with name: no-name-722e96af-06fa-4de3-9530-4ec494daee48
[I 2025-09-01 17:09:28,696] Trial 0 finished with value: 0.5369649075430586 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5369649075430586.


xgb test accuracy: 0.7350
xgb test F1 (positive): 0.6065

--- Optimizing DT ---


[I 2025-09-01 17:09:29,857] Trial 1 finished with value: 0.5447131822989798 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 1 with value: 0.5447131822989798.
[I 2025-09-01 17:09:29,932] Trial 2 finished with value: 0.5978807179177547 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.5978807179177547.
[I 2025-09-01 17:09:29,974] Trial 3 finished with value: 0.6767496441242974 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.6767496441242974.
[I 2025-09-01 17:09:30,011] Trial 4 finished with value: 0.6539821885788483 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_

Best dt params: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6767
dt test accuracy: 0.7196
dt test F1 (positive): 0.6288

BINARY NESTED CROSS-VALIDATION RESULTS SUMMARY
Positive class: 'void'

RF Results:
----------------------------------------
accuracy          : 0.7077 ± 0.0556
f1_positive       : 0.6287 ± 0.1154
precision_positive: 0.6507 ± 0.0662
recall_positive   : 0.6475 ± 0.2027
f1_macro          : 0.6887 ± 0.0678
Individual fold accuracies: ['0.6202', '0.7176', '0.6922', '0.7581', '0.7504']
Individual fold F1 (pos): ['0.4388', '0.6278', '0.7153', '0.7273', '0.6342']

XGB Results:
----------------------------------------
accuracy          : 0.6909 ± 0.0462
f1_positive       : 0.5908 ± 0.1137
precision_positive: 0.6514 ± 0.1145
recall_positive   : 0.5858 ± 0.1957
f1_macro          : 0.6673 ± 0.0609
Individual fold accuracies: ['0.6384', '0.6438', '

[I 2025-09-01 17:09:34,287] A new study created in memory with name: no-name-acf710bc-7622-4901-a905-27f9d4d0f0d2


Nested cross-validation for 1s_0.8
Positive class 'void' is encoded as: 1
Label mapping: {'non-void': np.int64(0), 'void': np.int64(1)}

Running nested cross-validation...
Starting Binary Nested Cross-Validation with separate optimization for each model...
Positive class: 'void' (encoded as 1)

OUTER FOLD 1/5
Train size: 10211, Test size: 1636
Class distribution in test set: {'non-void': np.int64(828), 'void': np.int64(808)}

--- Optimizing RF ---


[I 2025-09-01 17:09:39,551] Trial 0 finished with value: 0.5084354653439057 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.5084354653439057.
[I 2025-09-01 17:09:44,370] Trial 1 finished with value: 0.5739099903239686 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.5739099903239686.
[I 2025-09-01 17:10:39,255] Trial 2 finished with value: 0.5032852601561542 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.5739099903239686.
[I 2025-09-01 17:11:56,757] Trial 3 finished with value: 0.4884114592715227 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 417, 'max_depth': 3, 'min_samples_split': 18, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}
Best rf F1 score (positive class): 0.5745


[I 2025-09-01 17:25:54,650] A new study created in memory with name: no-name-1ab249a3-4ebf-4957-a14c-f0cad09bb492


rf test accuracy: 0.7366
rf test F1 (positive): 0.7113

--- Optimizing XGB ---


[I 2025-09-01 17:26:04,459] Trial 0 finished with value: 0.4931490933554072 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.4931490933554072.
[I 2025-09-01 17:26:09,012] Trial 1 finished with value: 0.488262663882864 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.4931490933554072.
[I 2025-09-01 17:26:13,815] Trial 2 finished with value: 0.49584991078591295 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 126, 'max_depth': 3, 'learning_rate': 0.03163393826748552, 'subsample': 0.9943435740037196, 'colsample_bytree': 0.8384389352084881, 'min_child_weight': 6, 'gamma': 1.050778051161564, 'reg_alpha': 1.1608090420507118, 'reg_lambda': 0.007160938008408918}
Best xgb F1 score (positive class): 0.5502


[I 2025-09-01 17:30:46,859] A new study created in memory with name: no-name-674d5cac-7ee1-4db1-b154-fb40b4e954b6
[I 2025-09-01 17:30:47,049] Trial 0 finished with value: 0.46910435197048383 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.46910435197048383.


xgb test accuracy: 0.7133
xgb test F1 (positive): 0.6648

--- Optimizing DT ---


[I 2025-09-01 17:30:50,576] Trial 1 finished with value: 0.45504113091001325 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.46910435197048383.
[I 2025-09-01 17:30:50,766] Trial 2 finished with value: 0.5447601338841217 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.5447601338841217.
[I 2025-09-01 17:30:50,861] Trial 3 finished with value: 0.5024524769216879 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.5447601338841217.
[I 2025-09-01 17:30:50,936] Trial 4 finished with value: 0.6377318614166159 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'ma

Best dt params: {'criterion': 'entropy', 'max_depth': 3, 'min_samples_split': 14, 'min_samples_leaf': 10, 'max_features': 'log2', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6418
dt test accuracy: 0.7286
dt test F1 (positive): 0.7168

OUTER FOLD 2/5
Train size: 9640, Test size: 2207
Class distribution in test set: {'non-void': np.int64(1174), 'void': np.int64(1033)}

--- Optimizing RF ---


[I 2025-09-01 17:31:08,562] Trial 0 finished with value: 0.568605253216251 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.568605253216251.
[I 2025-09-01 17:31:13,134] Trial 1 finished with value: 0.6054679280186327 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6054679280186327.
[I 2025-09-01 17:32:05,419] Trial 2 finished with value: 0.585824715099844 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6054679280186327.
[I 2025-09-01 17:33:23,003] Trial 3 finished with value: 0.5762218724342536 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_features':

Best rf params: {'n_estimators': 419, 'max_depth': 4, 'min_samples_split': 19, 'min_samples_leaf': 10, 'max_features': None, 'bootstrap': False}
Best rf F1 score (positive class): 0.6271


[I 2025-09-01 17:53:58,059] A new study created in memory with name: no-name-c27620fd-1e1f-4e79-8e83-aa6a71491841


rf test accuracy: 0.6298
rf test F1 (positive): 0.5716

--- Optimizing XGB ---


[I 2025-09-01 17:54:07,082] Trial 0 finished with value: 0.5256503468098098 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5256503468098098.
[I 2025-09-01 17:54:11,227] Trial 1 finished with value: 0.5206388655865556 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.5256503468098098.
[I 2025-09-01 17:54:16,051] Trial 2 finished with value: 0.5263384945277183 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 266, 'max_depth': 3, 'learning_rate': 0.020190037401322067, 'subsample': 0.960579097750231, 'colsample_bytree': 0.9576891450069979, 'min_child_weight': 6, 'gamma': 2.514848677974388, 'reg_alpha': 0.34934665523130604, 'reg_lambda': 0.6632478859799472}
Best xgb F1 score (positive class): 0.6173


[I 2025-09-01 17:58:33,937] A new study created in memory with name: no-name-a150858e-1147-450b-b49e-46f6f0622d7e
[I 2025-09-01 17:58:34,113] Trial 0 finished with value: 0.5615866539810419 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5615866539810419.


xgb test accuracy: 0.6099
xgb test F1 (positive): 0.5368

--- Optimizing DT ---


[I 2025-09-01 17:58:37,569] Trial 1 finished with value: 0.5071863066158863 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.5615866539810419.
[I 2025-09-01 17:58:37,754] Trial 2 finished with value: 0.6096264545944888 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.6096264545944888.
[I 2025-09-01 17:58:37,845] Trial 3 finished with value: 0.6560199343226651 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.6560199343226651.
[I 2025-09-01 17:58:37,916] Trial 4 finished with value: 0.6466543898922504 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_

Best dt params: {'criterion': 'gini', 'max_depth': 3, 'min_samples_split': 16, 'min_samples_leaf': 8, 'max_features': 'sqrt', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6671
dt test accuracy: 0.6362
dt test F1 (positive): 0.5897

OUTER FOLD 3/5
Train size: 8679, Test size: 3168
Class distribution in test set: {'non-void': np.int64(1908), 'void': np.int64(1260)}

--- Optimizing RF ---


[I 2025-09-01 17:58:53,611] Trial 0 finished with value: 0.576374941029015 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.576374941029015.
[I 2025-09-01 17:58:57,715] Trial 1 finished with value: 0.632437336702044 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.632437336702044.
[I 2025-09-01 17:59:43,492] Trial 2 finished with value: 0.595406584606016 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.632437336702044.
[I 2025-09-01 18:00:50,370] Trial 3 finished with value: 0.5667311217749641 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_features': No

Best rf params: {'n_estimators': 237, 'max_depth': 3, 'min_samples_split': 19, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': True}
Best rf F1 score (positive class): 0.6347


[I 2025-09-01 20:14:39,712] A new study created in memory with name: no-name-ad7075a1-bb14-4477-badf-b71c34e3b494


rf test accuracy: 0.6985
rf test F1 (positive): 0.6110

--- Optimizing XGB ---


[I 2025-09-01 20:14:50,109] Trial 0 finished with value: 0.5342521089612837 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5342521089612837.
[I 2025-09-01 20:14:54,330] Trial 1 finished with value: 0.5437850534736687 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 1 with value: 0.5437850534736687.
[I 2025-09-01 20:14:59,310] Trial 2 finished with value: 0.5446140062700389 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 68, 'max_depth': 3, 'learning_rate': 0.048126082755685855, 'subsample': 0.9003042006104494, 'colsample_bytree': 0.9110507805327926, 'min_child_weight': 7, 'gamma': 3.986294386497451, 'reg_alpha': 0.7315366699670792, 'reg_lambda': 0.20718943397744516}
Best xgb F1 score (positive class): 0.6315


[I 2025-09-01 20:18:16,541] A new study created in memory with name: no-name-eaaf8bac-ede7-4d67-89dc-835100dcd07c
[I 2025-09-01 20:18:16,702] Trial 0 finished with value: 0.5202223488290251 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5202223488290251.


xgb test accuracy: 0.6878
xgb test F1 (positive): 0.5860

--- Optimizing DT ---


[I 2025-09-01 20:18:19,818] Trial 1 finished with value: 0.5334166466717888 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 1 with value: 0.5334166466717888.
[I 2025-09-01 20:18:19,980] Trial 2 finished with value: 0.5960514732813916 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.5960514732813916.
[I 2025-09-01 20:18:20,064] Trial 3 finished with value: 0.560389068758336 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.5960514732813916.
[I 2025-09-01 20:18:20,130] Trial 4 finished with value: 0.6726956366813411 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_f

Best dt params: {'criterion': 'entropy', 'max_depth': 2, 'min_samples_split': 19, 'min_samples_leaf': 2, 'max_features': 'log2', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6754
dt test accuracy: 0.6370
dt test F1 (positive): 0.6420

OUTER FOLD 4/5
Train size: 10007, Test size: 1840
Class distribution in test set: {'non-void': np.int64(1220), 'void': np.int64(620)}

--- Optimizing RF ---


[I 2025-09-01 20:18:48,520] Trial 0 finished with value: 0.5719172862745551 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.5719172862745551.
[I 2025-09-01 20:18:55,789] Trial 1 finished with value: 0.6045434372331518 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6045434372331518.
[I 2025-09-01 20:19:49,263] Trial 2 finished with value: 0.5781057520034522 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6045434372331518.
[I 2025-09-01 20:21:37,427] Trial 3 finished with value: 0.5712968318962716 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 190, 'max_depth': 3, 'min_samples_split': 19, 'min_samples_leaf': 1, 'max_features': 'sqrt', 'bootstrap': True}
Best rf F1 score (positive class): 0.6169


[I 2025-09-01 21:10:44,340] A new study created in memory with name: no-name-92f88b94-bc1e-413e-93ae-48e7b71fc862


rf test accuracy: 0.7261
rf test F1 (positive): 0.6141

--- Optimizing XGB ---


[I 2025-09-01 21:10:54,743] Trial 0 finished with value: 0.552175716692865 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.552175716692865.
[I 2025-09-01 21:10:59,055] Trial 1 finished with value: 0.5509124486491203 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.552175716692865.
[I 2025-09-01 21:11:04,178] Trial 2 finished with value: 0.5442476280208278 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.655

Best xgb params: {'n_estimators': 167, 'max_depth': 3, 'learning_rate': 0.01795915643952162, 'subsample': 0.8226078268995918, 'colsample_bytree': 0.7969055582218567, 'min_child_weight': 1, 'gamma': 0.8082316153291789, 'reg_alpha': 0.4786203435816153, 'reg_lambda': 1.6869581236230655}
Best xgb F1 score (positive class): 0.6232


[I 2025-09-01 21:15:22,748] A new study created in memory with name: no-name-693099ec-4e0c-4375-85a1-6c9dc0021355
[I 2025-09-01 21:15:22,942] Trial 0 finished with value: 0.5281440025788252 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5281440025788252.


xgb test accuracy: 0.7168
xgb test F1 (positive): 0.5868

--- Optimizing DT ---


[I 2025-09-01 21:15:26,712] Trial 1 finished with value: 0.5148156256691611 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.5281440025788252.
[I 2025-09-01 21:15:26,900] Trial 2 finished with value: 0.6084518160832421 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.6084518160832421.
[I 2025-09-01 21:15:26,996] Trial 3 finished with value: 0.6480662063925515 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.6480662063925515.
[I 2025-09-01 21:15:27,070] Trial 4 finished with value: 0.6400254506539329 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_

Best dt params: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 9, 'min_samples_leaf': 10, 'max_features': None, 'splitter': 'random'}
Best dt F1 score (positive class): 0.6764
dt test accuracy: 0.7815
dt test F1 (positive): 0.7000

OUTER FOLD 5/5
Train size: 8851, Test size: 2996
Class distribution in test set: {'non-void': np.int64(1936), 'void': np.int64(1060)}

--- Optimizing RF ---


[I 2025-09-01 21:15:44,322] Trial 0 finished with value: 0.5426306092287527 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.5426306092287527.
[I 2025-09-01 21:15:48,566] Trial 1 finished with value: 0.5790600789383596 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.5790600789383596.
[I 2025-09-01 21:16:35,841] Trial 2 finished with value: 0.5885478789398991 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 2 with value: 0.5885478789398991.
[I 2025-09-01 21:17:43,641] Trial 3 finished with value: 0.5707826847751938 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 285, 'max_depth': 4, 'min_samples_split': 10, 'min_samples_leaf': 10, 'max_features': None, 'bootstrap': False}
Best rf F1 score (positive class): 0.6201


[I 2025-09-01 21:52:28,190] A new study created in memory with name: no-name-0b18e72a-93e7-41c6-87d5-5ab352137e60


rf test accuracy: 0.6809
rf test F1 (positive): 0.6114

--- Optimizing XGB ---


[I 2025-09-01 21:52:36,451] Trial 0 finished with value: 0.5630650083140413 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5630650083140413.
[I 2025-09-01 21:52:40,298] Trial 1 finished with value: 0.5508199838227886 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.5630650083140413.
[I 2025-09-01 21:52:44,478] Trial 2 finished with value: 0.5716274437923478 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 316, 'max_depth': 3, 'learning_rate': 0.019552915646991496, 'subsample': 0.7117376635580034, 'colsample_bytree': 0.7301906662915154, 'min_child_weight': 8, 'gamma': 4.938499284681214, 'reg_alpha': 1.0549651822564483, 'reg_lambda': 1.027938490805031}
Best xgb F1 score (positive class): 0.6039


[I 2025-09-01 21:56:45,620] A new study created in memory with name: no-name-2f8f2db6-2828-453e-8e80-9d7e24edf033
[I 2025-09-01 21:56:45,787] Trial 0 finished with value: 0.5189558627789921 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5189558627789921.


xgb test accuracy: 0.7313
xgb test F1 (positive): 0.6710

--- Optimizing DT ---


[I 2025-09-01 21:56:48,885] Trial 1 finished with value: 0.5007216714054153 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.5189558627789921.
[I 2025-09-01 21:56:49,049] Trial 2 finished with value: 0.4798251966394346 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 0 with value: 0.5189558627789921.
[I 2025-09-01 21:56:49,131] Trial 3 finished with value: 0.4919746444083017 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 0 with value: 0.5189558627789921.
[I 2025-09-01 21:56:49,194] Trial 4 finished with value: 0.6432483548161221 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_

Best dt params: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_features': 'sqrt', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6432
dt test accuracy: 0.6973
dt test F1 (positive): 0.6518

BINARY NESTED CROSS-VALIDATION RESULTS SUMMARY
Positive class: 'void'

RF Results:
----------------------------------------
accuracy          : 0.6944 ± 0.0423
f1_positive       : 0.6239 ± 0.0520
precision_positive: 0.6296 ± 0.0892
recall_positive   : 0.6272 ± 0.0689
f1_macro          : 0.6822 ± 0.0411
Individual fold accuracies: ['0.7366', '0.6298', '0.6985', '0.7261', '0.6809']
Individual fold F1 (pos): ['0.7113', '0.5716', '0.6110', '0.6141', '0.6114']

XGB Results:
----------------------------------------
accuracy          : 0.6918 ± 0.0484
f1_positive       : 0.6091 ± 0.0574
precision_positive: 0.6360 ± 0.0857
recall_positive   : 0.5971 ± 0.1080
f1_macro          : 0.6765 ± 0.0475
Individual fold accuracies: ['0.7133', '0.6099',

[I 2025-09-01 21:57:01,257] Trial 0 finished with value: 0.6216896725371303 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6216896725371303.
[I 2025-09-01 21:57:02,430] Trial 1 finished with value: 0.6394986449864498 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6394986449864498.
[I 2025-09-01 21:57:07,210] Trial 2 finished with value: 0.6217689090254369 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6394986449864498.
[I 2025-09-01 21:57:12,015] Trial 3 finished with value: 0.6020720085871368 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 249, 'max_depth': 4, 'min_samples_split': 12, 'min_samples_leaf': 2, 'max_features': 'log2', 'bootstrap': False}
Best rf F1 score (positive class): 0.6497


[I 2025-09-01 21:58:31,504] A new study created in memory with name: no-name-276ddd62-1d22-451b-b9bd-dac3b82baa08


rf test accuracy: 0.5762
rf test F1 (positive): 0.5294

--- Optimizing XGB ---


[I 2025-09-01 21:58:33,521] Trial 0 finished with value: 0.5866622796270476 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5866622796270476.
[I 2025-09-01 21:58:35,212] Trial 1 finished with value: 0.5917136832750477 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 1 with value: 0.5917136832750477.
[I 2025-09-01 21:58:36,499] Trial 2 finished with value: 0.6034765365161842 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 360, 'max_depth': 8, 'learning_rate': 0.07630490127156113, 'subsample': 0.7282977034916852, 'colsample_bytree': 0.8231118187966076, 'min_child_weight': 2, 'gamma': 0.532819126765206, 'reg_alpha': 0.4921365627044161, 'reg_lambda': 0.8450621800641857}
Best xgb F1 score (positive class): 0.6100


[I 2025-09-01 22:00:06,314] A new study created in memory with name: no-name-e5808132-4eb5-4c68-a716-9929b83c89f2
[I 2025-09-01 22:00:06,348] Trial 0 finished with value: 0.4967468257240615 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.4967468257240615.


xgb test accuracy: 0.5497
xgb test F1 (positive): 0.4769

--- Optimizing DT ---


[I 2025-09-01 22:00:06,618] Trial 1 finished with value: 0.4848575842491825 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.4967468257240615.
[I 2025-09-01 22:00:06,651] Trial 2 finished with value: 0.6273137361444195 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.6273137361444195.
[I 2025-09-01 22:00:06,676] Trial 3 finished with value: 0.664345065272211 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.664345065272211.
[I 2025-09-01 22:00:06,698] Trial 4 finished with value: 0.6709981869877456 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_fe

Best dt params: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_features': 'sqrt', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6710
dt test accuracy: 0.5894
dt test F1 (positive): 0.6076

OUTER FOLD 2/5
Train size: 920, Test size: 269
Class distribution in test set: {'non-void': np.int64(198), 'void': np.int64(71)}

--- Optimizing RF ---


[I 2025-09-01 22:00:09,706] Trial 0 finished with value: 0.6156858102576132 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6156858102576132.
[I 2025-09-01 22:00:10,842] Trial 1 finished with value: 0.626165072617426 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.626165072617426.
[I 2025-09-01 22:00:15,025] Trial 2 finished with value: 0.6202196627216675 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.626165072617426.
[I 2025-09-01 22:00:19,255] Trial 3 finished with value: 0.6115145596192272 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_features':

Best rf params: {'n_estimators': 307, 'max_depth': 4, 'min_samples_split': 15, 'min_samples_leaf': 4, 'max_features': None, 'bootstrap': True}
Best rf F1 score (positive class): 0.6324


[I 2025-09-01 22:01:57,780] A new study created in memory with name: no-name-cb4f912c-96d1-46dc-a8d9-a065aa787612


rf test accuracy: 0.7732
rf test F1 (positive): 0.5793

--- Optimizing XGB ---


[I 2025-09-01 22:02:00,461] Trial 0 finished with value: 0.5848812772701346 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5848812772701346.
[I 2025-09-01 22:02:02,190] Trial 1 finished with value: 0.5792478116703011 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.5848812772701346.
[I 2025-09-01 22:02:03,725] Trial 2 finished with value: 0.5850295801148543 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 467, 'max_depth': 10, 'learning_rate': 0.012219811160283485, 'subsample': 0.7218520073542559, 'colsample_bytree': 0.7705413902968903, 'min_child_weight': 2, 'gamma': 4.6041885418822, 'reg_alpha': 1.9949396569619464, 'reg_lambda': 1.245098664363596}
Best xgb F1 score (positive class): 0.6237


[I 2025-09-01 22:04:07,229] A new study created in memory with name: no-name-0d76dc9e-8dc2-412a-a565-ca862bc09b25
[I 2025-09-01 22:04:07,265] Trial 0 finished with value: 0.517636293653962 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.517636293653962.


xgb test accuracy: 0.7955
xgb test F1 (positive): 0.6099

--- Optimizing DT ---


[I 2025-09-01 22:04:07,521] Trial 1 finished with value: 0.4735549065962082 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.517636293653962.
[I 2025-09-01 22:04:07,552] Trial 2 finished with value: 0.5978870755974928 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.5978870755974928.
[I 2025-09-01 22:04:07,576] Trial 3 finished with value: 0.6529197192470988 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.6529197192470988.
[I 2025-09-01 22:04:07,598] Trial 4 finished with value: 0.6829156109561202 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_f

Best dt params: {'criterion': 'entropy', 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 7, 'max_features': 'log2', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6843
dt test accuracy: 0.7546
dt test F1 (positive): 0.6163

OUTER FOLD 3/5
Train size: 909, Test size: 280
Class distribution in test set: {'non-void': np.int64(158), 'void': np.int64(122)}

--- Optimizing RF ---


[I 2025-09-01 22:04:10,606] Trial 0 finished with value: 0.5631411818735566 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.5631411818735566.
[I 2025-09-01 22:04:11,740] Trial 1 finished with value: 0.6148094474274732 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6148094474274732.
[I 2025-09-01 22:04:15,812] Trial 2 finished with value: 0.6132946859903381 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6148094474274732.
[I 2025-09-01 22:04:19,931] Trial 3 finished with value: 0.5930920206695919 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 456, 'max_depth': 3, 'min_samples_split': 18, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'bootstrap': False}
Best rf F1 score (positive class): 0.6196


[I 2025-09-01 22:05:51,224] A new study created in memory with name: no-name-6c3aadfd-3b42-4d50-b170-b63670f338ff


rf test accuracy: 0.6786
rf test F1 (positive): 0.5872

--- Optimizing XGB ---


[I 2025-09-01 22:05:53,554] Trial 0 finished with value: 0.5395335766524653 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5395335766524653.
[I 2025-09-01 22:05:55,332] Trial 1 finished with value: 0.5405040887645464 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 1 with value: 0.5405040887645464.
[I 2025-09-01 22:05:56,839] Trial 2 finished with value: 0.5496755457663872 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 462, 'max_depth': 7, 'learning_rate': 0.15921728208236582, 'subsample': 0.8302077581968994, 'colsample_bytree': 0.7358910134170531, 'min_child_weight': 2, 'gamma': 4.518293128819064, 'reg_alpha': 1.7076233962472063, 'reg_lambda': 1.2004823295027718}
Best xgb F1 score (positive class): 0.6046


[I 2025-09-01 22:07:18,224] A new study created in memory with name: no-name-bc9cfc9c-515a-452e-91aa-35027e35bd73
[I 2025-09-01 22:07:18,255] Trial 0 finished with value: 0.5777862660215601 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5777862660215601.


xgb test accuracy: 0.6786
xgb test F1 (positive): 0.6250

--- Optimizing DT ---


[I 2025-09-01 22:07:18,471] Trial 1 finished with value: 0.49577306533021814 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.5777862660215601.
[I 2025-09-01 22:07:18,504] Trial 2 finished with value: 0.48256724809916296 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 0 with value: 0.5777862660215601.
[I 2025-09-01 22:07:18,538] Trial 3 finished with value: 0.6083102567228278 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.6083102567228278.
[I 2025-09-01 22:07:18,571] Trial 4 finished with value: 0.6615092422136115 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'ma

Best dt params: {'criterion': 'entropy', 'max_depth': 2, 'min_samples_split': 17, 'min_samples_leaf': 3, 'max_features': None, 'splitter': 'best'}
Best dt F1 score (positive class): 0.6655
dt test accuracy: 0.6286
dt test F1 (positive): 0.6312

OUTER FOLD 4/5
Train size: 896, Test size: 293
Class distribution in test set: {'non-void': np.int64(186), 'void': np.int64(107)}

--- Optimizing RF ---


[I 2025-09-01 22:07:23,024] Trial 0 finished with value: 0.5884120764637609 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.5884120764637609.
[I 2025-09-01 22:07:24,177] Trial 1 finished with value: 0.608757653258932 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.608757653258932.
[I 2025-09-01 22:07:28,421] Trial 2 finished with value: 0.5922438247264051 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.608757653258932.
[I 2025-09-01 22:07:32,610] Trial 3 finished with value: 0.589570219302546 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_features': 

Best rf params: {'n_estimators': 241, 'max_depth': 4, 'min_samples_split': 19, 'min_samples_leaf': 4, 'max_features': None, 'bootstrap': True}
Best rf F1 score (positive class): 0.6174


[I 2025-09-01 22:09:10,154] A new study created in memory with name: no-name-92a850e1-852f-4aed-9f97-632fc838dd68


rf test accuracy: 0.7372
rf test F1 (positive): 0.7027

--- Optimizing XGB ---


[I 2025-09-01 22:09:12,301] Trial 0 finished with value: 0.5747973288498 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5747973288498.
[I 2025-09-01 22:09:14,110] Trial 1 finished with value: 0.5815333014473215 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 1 with value: 0.5815333014473215.
[I 2025-09-01 22:09:15,581] Trial 2 finished with value: 0.5710357073653123 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.655797

Best xgb params: {'n_estimators': 366, 'max_depth': 4, 'learning_rate': 0.021698698484948094, 'subsample': 0.8337377980053566, 'colsample_bytree': 0.7811766287781392, 'min_child_weight': 7, 'gamma': 4.172117642877876, 'reg_alpha': 1.98313311919638, 'reg_lambda': 1.006407233424485}
Best xgb F1 score (positive class): 0.6085


[I 2025-09-01 22:11:03,710] A new study created in memory with name: no-name-7ae323f4-c697-4a19-a04a-bf9d09d692c2
[I 2025-09-01 22:11:03,741] Trial 0 finished with value: 0.5310111384145786 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5310111384145786.


xgb test accuracy: 0.7338
xgb test F1 (positive): 0.6880

--- Optimizing DT ---


[I 2025-09-01 22:11:03,979] Trial 1 finished with value: 0.5540176002849041 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 1 with value: 0.5540176002849041.
[I 2025-09-01 22:11:04,009] Trial 2 finished with value: 0.589564937013555 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.589564937013555.
[I 2025-09-01 22:11:04,034] Trial 3 finished with value: 0.6007391057810665 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.6007391057810665.
[I 2025-09-01 22:11:04,055] Trial 4 finished with value: 0.6705284143872964 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_fe

Best dt params: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_features': 'sqrt', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6705
dt test accuracy: 0.6826
dt test F1 (positive): 0.6690

OUTER FOLD 5/5
Train size: 993, Test size: 196
Class distribution in test set: {'non-void': np.int64(110), 'void': np.int64(86)}

--- Optimizing RF ---


[I 2025-09-01 22:11:06,999] Trial 0 finished with value: 0.5404824825585846 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.5404824825585846.
[I 2025-09-01 22:11:08,289] Trial 1 finished with value: 0.5675597376931368 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.5675597376931368.
[I 2025-09-01 22:11:13,219] Trial 2 finished with value: 0.5549504593261485 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.5675597376931368.
[I 2025-09-01 22:11:18,081] Trial 3 finished with value: 0.5554724457834352 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 271, 'max_depth': 4, 'min_samples_split': 16, 'min_samples_leaf': 3, 'max_features': None, 'bootstrap': True}
Best rf F1 score (positive class): 0.5839


[I 2025-09-01 22:13:27,324] A new study created in memory with name: no-name-22f8d8a8-7a05-481e-8ac8-a432c337c2c3


rf test accuracy: 0.7347
rf test F1 (positive): 0.7143

--- Optimizing XGB ---


[I 2025-09-01 22:13:29,985] Trial 0 finished with value: 0.5082409349715312 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5082409349715312.
[I 2025-09-01 22:13:31,643] Trial 1 finished with value: 0.5056534752244762 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.5082409349715312.
[I 2025-09-01 22:13:33,137] Trial 2 finished with value: 0.49677149677149673 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0

Best xgb params: {'n_estimators': 285, 'max_depth': 3, 'learning_rate': 0.018540549595890975, 'subsample': 0.7642493335137185, 'colsample_bytree': 0.7989851903953397, 'min_child_weight': 3, 'gamma': 4.718114863309929, 'reg_alpha': 1.6518382317576705, 'reg_lambda': 0.7764158782475581}
Best xgb F1 score (positive class): 0.5616


[I 2025-09-01 22:15:23,409] A new study created in memory with name: no-name-a0048468-23b2-4e33-829d-0d9621bdb33a
[I 2025-09-01 22:15:23,441] Trial 0 finished with value: 0.5170520536374195 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5170520536374195.


xgb test accuracy: 0.7449
xgb test F1 (positive): 0.7159

--- Optimizing DT ---


[I 2025-09-01 22:15:23,702] Trial 1 finished with value: 0.5092030806316521 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.5170520536374195.
[I 2025-09-01 22:15:23,733] Trial 2 finished with value: 0.5264786900765024 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.5264786900765024.
[I 2025-09-01 22:15:23,756] Trial 3 finished with value: 0.605372263144204 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.605372263144204.
[I 2025-09-01 22:15:23,779] Trial 4 finished with value: 0.4021077792264233 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_fe

Best dt params: {'criterion': 'entropy', 'max_depth': 2, 'min_samples_split': 17, 'min_samples_leaf': 6, 'max_features': None, 'splitter': 'best'}
Best dt F1 score (positive class): 0.6451
dt test accuracy: 0.7194
dt test F1 (positive): 0.6961

BINARY NESTED CROSS-VALIDATION RESULTS SUMMARY
Positive class: 'void'

RF Results:
----------------------------------------
accuracy          : 0.7000 Â± 0.0770
f1_positive       : 0.6226 Â± 0.0816
precision_positive: 0.6552 Â± 0.0771
recall_positive   : 0.6254 Â± 0.1787
f1_macro          : 0.6826 Â± 0.0684
Individual fold accuracies: ['0.5762', '0.7732', '0.6786', '0.7372', '0.7347']
Individual fold F1 (pos): ['0.5294', '0.5793', '0.5872', '0.7027', '0.7143']

XGB Results:
----------------------------------------
accuracy          : 0.7005 Â± 0.0940
f1_positive       : 0.6232 Â± 0.0927
precision_positive: 0.6615 Â± 0.0651
recall_positive   : 0.6210 Â± 0.1735
f1_macro          : 0.6837 Â± 0.0846
Individual fold accuracies: ['0.5497', '0.7955', '

[I 2025-09-01 22:15:27,063] Trial 0 finished with value: 0.556364577894247 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.556364577894247.
[I 2025-09-01 22:15:28,624] Trial 1 finished with value: 0.5739874847380184 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.5739874847380184.
[I 2025-09-01 22:15:38,328] Trial 2 finished with value: 0.5444329683949597 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.5739874847380184.
[I 2025-09-01 22:15:49,617] Trial 3 finished with value: 0.5512592365145186 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_features'

Best rf params: {'n_estimators': 494, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'bootstrap': False}
Best rf F1 score (positive class): 0.5784


[I 2025-09-01 22:18:32,563] A new study created in memory with name: no-name-c3976ccd-1b93-4e2b-a8a7-5457e025ef93


rf test accuracy: 0.7424
rf test F1 (positive): 0.7273

--- Optimizing XGB ---


[I 2025-09-01 22:18:36,086] Trial 0 finished with value: 0.546381973553231 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.546381973553231.
[I 2025-09-01 22:18:38,070] Trial 1 finished with value: 0.5519545382051992 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 1 with value: 0.5519545382051992.
[I 2025-09-01 22:18:40,041] Trial 2 finished with value: 0.5397826030178972 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.65

Best xgb params: {'n_estimators': 146, 'max_depth': 4, 'learning_rate': 0.04323444823345436, 'subsample': 0.9577459972399921, 'colsample_bytree': 0.7182053332288235, 'min_child_weight': 6, 'gamma': 2.5338812843583347, 'reg_alpha': 1.3288245506198855, 'reg_lambda': 1.9699624612235909}
Best xgb F1 score (positive class): 0.5642


[I 2025-09-01 22:21:06,506] A new study created in memory with name: no-name-acd9bf89-fe42-4035-8333-7fd3741f9253
[I 2025-09-01 22:21:06,559] Trial 0 finished with value: 0.4773089144770561 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.4773089144770561.


xgb test accuracy: 0.7036
xgb test F1 (positive): 0.6728

--- Optimizing DT ---


[I 2025-09-01 22:21:07,101] Trial 1 finished with value: 0.49569579350480547 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 1 with value: 0.49569579350480547.
[I 2025-09-01 22:21:07,150] Trial 2 finished with value: 0.5920354819846452 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.5920354819846452.
[I 2025-09-01 22:21:07,180] Trial 3 finished with value: 0.6154540439257268 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.6154540439257268.
[I 2025-09-01 22:21:07,207] Trial 4 finished with value: 0.6373822027573288 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'ma

Best dt params: {'criterion': 'entropy', 'max_depth': 3, 'min_samples_split': 14, 'min_samples_leaf': 6, 'max_features': 'log2', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6405
dt test accuracy: 0.7091
dt test F1 (positive): 0.7075

OUTER FOLD 2/5
Train size: 1861, Test size: 505
Class distribution in test set: {'non-void': np.int64(297), 'void': np.int64(208)}

--- Optimizing RF ---


[I 2025-09-01 22:21:11,492] Trial 0 finished with value: 0.6221924188579013 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6221924188579013.
[I 2025-09-01 22:21:12,978] Trial 1 finished with value: 0.6807363468110949 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6807363468110949.
[I 2025-09-01 22:21:21,777] Trial 2 finished with value: 0.5963631369594253 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6807363468110949.
[I 2025-09-01 22:21:31,860] Trial 3 finished with value: 0.5868169196617282 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 494, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'bootstrap': False}
Best rf F1 score (positive class): 0.6808


[I 2025-09-01 22:24:01,640] A new study created in memory with name: no-name-42315839-b6d0-469f-8033-afb9af5d220b


rf test accuracy: 0.6040
rf test F1 (positive): 0.5122

--- Optimizing XGB ---


[I 2025-09-01 22:24:04,779] Trial 0 finished with value: 0.5727192693988846 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5727192693988846.
[I 2025-09-01 22:24:06,680] Trial 1 finished with value: 0.5913582462593465 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 1 with value: 0.5913582462593465.
[I 2025-09-01 22:24:08,478] Trial 2 finished with value: 0.5925758387822917 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 227, 'max_depth': 3, 'learning_rate': 0.01354211332106492, 'subsample': 0.6486562332328204, 'colsample_bytree': 0.6266755778334098, 'min_child_weight': 3, 'gamma': 3.371390927687933, 'reg_alpha': 0.4585345105947977, 'reg_lambda': 1.641620451128217}
Best xgb F1 score (positive class): 0.6176


[I 2025-09-01 22:26:10,514] A new study created in memory with name: no-name-d28d8740-a29b-4a7b-b142-8c83cb609967
[I 2025-09-01 22:26:10,561] Trial 0 finished with value: 0.5392074640668186 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5392074640668186.


xgb test accuracy: 0.5822
xgb test F1 (positive): 0.5104

--- Optimizing DT ---


[I 2025-09-01 22:26:11,033] Trial 1 finished with value: 0.5112073101315504 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.5392074640668186.
[I 2025-09-01 22:26:11,081] Trial 2 finished with value: 0.6105137111368842 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.6105137111368842.
[I 2025-09-01 22:26:11,112] Trial 3 finished with value: 0.6873187957465438 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.6873187957465438.
[I 2025-09-01 22:26:11,139] Trial 4 finished with value: 0.681875047458786 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_f

Best dt params: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6873
dt test accuracy: 0.6059
dt test F1 (positive): 0.5739

OUTER FOLD 3/5
Train size: 1790, Test size: 576
Class distribution in test set: {'non-void': np.int64(335), 'void': np.int64(241)}

--- Optimizing RF ---


[I 2025-09-01 22:26:14,733] Trial 0 finished with value: 0.6113216836110197 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6113216836110197.
[I 2025-09-01 22:26:16,223] Trial 1 finished with value: 0.6508747930350718 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6508747930350718.
[I 2025-09-01 22:26:24,846] Trial 2 finished with value: 0.6066091268276703 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6508747930350718.
[I 2025-09-01 22:26:34,564] Trial 3 finished with value: 0.6121377467731183 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 272, 'max_depth': 4, 'min_samples_split': 13, 'min_samples_leaf': 9, 'max_features': None, 'bootstrap': True}
Best rf F1 score (positive class): 0.6560


[I 2025-09-01 22:29:48,773] A new study created in memory with name: no-name-7f70d78c-58c7-4967-b8e4-4d3b54a34e76


rf test accuracy: 0.6962
rf test F1 (positive): 0.6331

--- Optimizing XGB ---


[I 2025-09-01 22:29:51,700] Trial 0 finished with value: 0.5702890262253061 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5702890262253061.
[I 2025-09-01 22:29:53,643] Trial 1 finished with value: 0.5799409591278245 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 1 with value: 0.5799409591278245.
[I 2025-09-01 22:29:55,322] Trial 2 finished with value: 0.5853588493308489 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 338, 'max_depth': 6, 'learning_rate': 0.08416899945837078, 'subsample': 0.990732927896814, 'colsample_bytree': 0.9084011427123242, 'min_child_weight': 10, 'gamma': 4.063596822468214, 'reg_alpha': 0.7253870931798736, 'reg_lambda': 1.6225258680005281}
Best xgb F1 score (positive class): 0.6243


[I 2025-09-01 22:32:29,915] A new study created in memory with name: no-name-a6342252-8923-4f11-8855-b51e54166001
[I 2025-09-01 22:32:29,962] Trial 0 finished with value: 0.5236065845384429 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5236065845384429.


xgb test accuracy: 0.6823
xgb test F1 (positive): 0.5924

--- Optimizing DT ---


[I 2025-09-01 22:32:30,474] Trial 1 finished with value: 0.5164898659146243 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.5236065845384429.
[I 2025-09-01 22:32:30,517] Trial 2 finished with value: 0.6391166708504169 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.6391166708504169.
[I 2025-09-01 22:32:30,547] Trial 3 finished with value: 0.6013585950936277 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.6391166708504169.
[I 2025-09-01 22:32:30,573] Trial 4 finished with value: 0.4198995447474183 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_

Best dt params: {'criterion': 'gini', 'max_depth': 1, 'min_samples_split': 17, 'min_samples_leaf': 8, 'max_features': 'log2', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6775
dt test accuracy: 0.6649
dt test F1 (positive): 0.6252

OUTER FOLD 4/5
Train size: 1999, Test size: 367
Class distribution in test set: {'non-void': np.int64(237), 'void': np.int64(130)}

--- Optimizing RF ---


[I 2025-09-01 22:32:33,903] Trial 0 finished with value: 0.5806496317125874 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.5806496317125874.
[I 2025-09-01 22:32:35,501] Trial 1 finished with value: 0.5957078851002237 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.5957078851002237.
[I 2025-09-01 22:32:45,344] Trial 2 finished with value: 0.6028720264192021 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 2 with value: 0.6028720264192021.
[I 2025-09-01 22:32:56,783] Trial 3 finished with value: 0.6007972557868174 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 407, 'max_depth': 3, 'min_samples_split': 19, 'min_samples_leaf': 5, 'max_features': None, 'bootstrap': True}
Best rf F1 score (positive class): 0.6325


[I 2025-09-01 22:40:02,654] A new study created in memory with name: no-name-75fe41f1-82fb-4ae1-add1-b32727502963


rf test accuracy: 0.7629
rf test F1 (positive): 0.6947

--- Optimizing XGB ---


[I 2025-09-01 22:40:06,133] Trial 0 finished with value: 0.5678537860401588 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5678537860401588.
[I 2025-09-01 22:40:08,444] Trial 1 finished with value: 0.5756377505482747 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 1 with value: 0.5756377505482747.
[I 2025-09-01 22:40:10,349] Trial 2 finished with value: 0.5820666841501057 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 468, 'max_depth': 6, 'learning_rate': 0.012150726268889755, 'subsample': 0.7771242812353383, 'colsample_bytree': 0.9117536135814382, 'min_child_weight': 7, 'gamma': 4.971509633507085, 'reg_alpha': 1.7988274148811394, 'reg_lambda': 1.7062436610349576}
Best xgb F1 score (positive class): 0.6092


[I 2025-09-01 22:43:52,160] A new study created in memory with name: no-name-1b5dadf4-112f-44a8-a6da-42239abae83d
[I 2025-09-01 22:43:52,211] Trial 0 finished with value: 0.5232373007682605 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5232373007682605.


xgb test accuracy: 0.7684
xgb test F1 (positive): 0.6792

--- Optimizing DT ---


[I 2025-09-01 22:43:52,751] Trial 1 finished with value: 0.512213326545574 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.5232373007682605.
[I 2025-09-01 22:43:52,799] Trial 2 finished with value: 0.5335095896094048 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.5335095896094048.
[I 2025-09-01 22:43:52,830] Trial 3 finished with value: 0.48159457250111526 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.5335095896094048.
[I 2025-09-01 22:43:52,857] Trial 4 finished with value: 0.5702897791999884 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_

Best dt params: {'criterion': 'gini', 'max_depth': 1, 'min_samples_split': 17, 'min_samples_leaf': 8, 'max_features': 'log2', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6521
dt test accuracy: 0.7548
dt test F1 (positive): 0.6918

OUTER FOLD 5/5
Train size: 1809, Test size: 557
Class distribution in test set: {'non-void': np.int64(362), 'void': np.int64(195)}

--- Optimizing RF ---


[I 2025-09-01 22:43:56,852] Trial 0 finished with value: 0.5888788306264034 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.5888788306264034.
[I 2025-09-01 22:43:58,459] Trial 1 finished with value: 0.6178482942633886 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6178482942633886.
[I 2025-09-01 22:44:07,603] Trial 2 finished with value: 0.5991512046414007 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6178482942633886.
[I 2025-09-01 22:44:17,842] Trial 3 finished with value: 0.5970409413411958 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 214, 'max_depth': 3, 'min_samples_split': 12, 'min_samples_leaf': 4, 'max_features': None, 'bootstrap': True}
Best rf F1 score (positive class): 0.6532


[I 2025-09-01 22:48:15,015] A new study created in memory with name: no-name-b342e43f-428f-418e-932c-5da1094fd72a


rf test accuracy: 0.7594
rf test F1 (positive): 0.6884

--- Optimizing XGB ---


[I 2025-09-01 22:48:18,429] Trial 0 finished with value: 0.5806198569173809 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5806198569173809.
[I 2025-09-01 22:48:20,886] Trial 1 finished with value: 0.5766697435060201 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.5806198569173809.
[I 2025-09-01 22:48:22,635] Trial 2 finished with value: 0.5777400467675651 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 467, 'max_depth': 10, 'learning_rate': 0.012219811160283485, 'subsample': 0.7218520073542559, 'colsample_bytree': 0.7705413902968903, 'min_child_weight': 2, 'gamma': 4.6041885418822, 'reg_alpha': 1.9949396569619464, 'reg_lambda': 1.245098664363596}
Best xgb F1 score (positive class): 0.6221


[I 2025-09-01 22:51:09,189] A new study created in memory with name: no-name-89c553b6-57fe-41e6-b400-91924f8f8401
[I 2025-09-01 22:51:09,235] Trial 0 finished with value: 0.5166803819376412 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5166803819376412.


xgb test accuracy: 0.7792
xgb test F1 (positive): 0.6917

--- Optimizing DT ---


[I 2025-09-01 22:51:09,731] Trial 1 finished with value: 0.5266061043664187 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 1 with value: 0.5266061043664187.
[I 2025-09-01 22:51:09,776] Trial 2 finished with value: 0.5915868540536975 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.5915868540536975.
[I 2025-09-01 22:51:09,805] Trial 3 finished with value: 0.6182382296867174 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.6182382296867174.
[I 2025-09-01 22:51:09,831] Trial 4 finished with value: 0.6553129002916839 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_

Best dt params: {'criterion': 'entropy', 'max_depth': 2, 'min_samples_split': 16, 'min_samples_leaf': 3, 'max_features': None, 'splitter': 'best'}
Best dt F1 score (positive class): 0.6684
dt test accuracy: 0.7540
dt test F1 (positive): 0.6935

BINARY NESTED CROSS-VALIDATION RESULTS SUMMARY
Positive class: 'void'

RF Results:
----------------------------------------
accuracy          : 0.7130 Â± 0.0665
f1_positive       : 0.6511 Â± 0.0847
precision_positive: 0.6426 Â± 0.0942
recall_positive   : 0.6659 Â± 0.1066
f1_macro          : 0.7029 Â± 0.0685
Individual fold accuracies: ['0.7424', '0.6040', '0.6962', '0.7629', '0.7594']
Individual fold F1 (pos): ['0.7273', '0.5122', '0.6331', '0.6947', '0.6884']

XGB Results:
----------------------------------------
accuracy          : 0.7031 Â± 0.0792
f1_positive       : 0.6293 Â± 0.0771
precision_positive: 0.6479 Â± 0.0982
recall_positive   : 0.6164 Â± 0.0809
f1_macro          : 0.6898 Â± 0.0754
Individual fold accuracies: ['0.7036', '0.5822', '

[I 2025-09-01 22:51:15,797] A new study created in memory with name: no-name-6e8b46d6-c4dc-49cb-b235-963c2d4708f9



OUTER FOLD 1/5
Train size: 4891, Test size: 936
Class distribution in test set: {'non-void': np.int64(545), 'void': np.int64(391)}

--- Optimizing RF ---


[I 2025-09-01 22:51:18,382] Trial 0 finished with value: 0.6293173892834716 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6293173892834716.
[I 2025-09-01 22:51:21,109] Trial 1 finished with value: 0.6553459504493552 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6553459504493552.
[I 2025-09-01 22:51:47,105] Trial 2 finished with value: 0.6041458250301533 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6553459504493552.
[I 2025-09-01 22:52:21,040] Trial 3 finished with value: 0.5812519867548165 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 368, 'max_depth': 4, 'min_samples_split': 10, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'bootstrap': False}
Best rf F1 score (positive class): 0.6592


[I 2025-09-01 22:58:42,614] A new study created in memory with name: no-name-069efe49-c8ee-4ae9-85ad-17ecf216b253


rf test accuracy: 0.6068
rf test F1 (positive): 0.5040

--- Optimizing XGB ---


[I 2025-09-01 22:58:48,133] Trial 0 finished with value: 0.5620910200860618 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5620910200860618.
[I 2025-09-01 22:58:51,047] Trial 1 finished with value: 0.5544534705487901 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.5620910200860618.
[I 2025-09-01 22:58:53,938] Trial 2 finished with value: 0.553330176564328 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.6

Best xgb params: {'n_estimators': 180, 'max_depth': 3, 'learning_rate': 0.01602665567338633, 'subsample': 0.7045562334691738, 'colsample_bytree': 0.6571668560147156, 'min_child_weight': 9, 'gamma': 0.11614066779852206, 'reg_alpha': 1.941389610975628, 'reg_lambda': 0.3073507478757792}
Best xgb F1 score (positive class): 0.6387


[I 2025-09-01 23:02:58,268] A new study created in memory with name: no-name-3cb112fe-774c-4aec-9be4-cfdcc362c6f2
[I 2025-09-01 23:02:58,364] Trial 0 finished with value: 0.5450394992668574 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5450394992668574.


xgb test accuracy: 0.6015
xgb test F1 (positive): 0.5187

--- Optimizing DT ---


[I 2025-09-01 23:02:59,837] Trial 1 finished with value: 0.518974769456921 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.5450394992668574.
[I 2025-09-01 23:02:59,934] Trial 2 finished with value: 0.6147430539769602 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.6147430539769602.
[I 2025-09-01 23:02:59,988] Trial 3 finished with value: 0.6112420144853714 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.6147430539769602.
[I 2025-09-01 23:03:00,034] Trial 4 finished with value: 0.6292098737657109 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_f

Best dt params: {'criterion': 'gini', 'max_depth': 3, 'min_samples_split': 14, 'min_samples_leaf': 5, 'max_features': 'log2', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6389
dt test accuracy: 0.6506
dt test F1 (positive): 0.5948

OUTER FOLD 2/5
Train size: 4413, Test size: 1414
Class distribution in test set: {'non-void': np.int64(770), 'void': np.int64(644)}

--- Optimizing RF ---


[I 2025-09-01 23:03:07,499] Trial 0 finished with value: 0.6101516786148978 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6101516786148978.
[I 2025-09-01 23:03:10,153] Trial 1 finished with value: 0.636161466787917 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.636161466787917.
[I 2025-09-01 23:03:33,885] Trial 2 finished with value: 0.6132740069452531 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.636161466787917.
[I 2025-09-01 23:04:05,103] Trial 3 finished with value: 0.5980730528860723 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_features':

Best rf params: {'n_estimators': 380, 'max_depth': 3, 'min_samples_split': 14, 'min_samples_leaf': 5, 'max_features': None, 'bootstrap': False}
Best rf F1 score (positive class): 0.6797


[I 2025-09-01 23:15:58,030] A new study created in memory with name: no-name-5ae221cb-af90-48e2-86de-3bfb61809088


rf test accuracy: 0.6351
rf test F1 (positive): 0.6569

--- Optimizing XGB ---


[I 2025-09-01 23:16:02,973] Trial 0 finished with value: 0.5940478334069962 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5940478334069962.
[I 2025-09-01 23:16:05,556] Trial 1 finished with value: 0.5838896290464404 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.5940478334069962.
[I 2025-09-01 23:16:08,357] Trial 2 finished with value: 0.59849965535115 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.65

Best xgb params: {'n_estimators': 358, 'max_depth': 3, 'learning_rate': 0.01027383898668611, 'subsample': 0.7001689852647316, 'colsample_bytree': 0.9374041860940409, 'min_child_weight': 2, 'gamma': 2.420567028593851, 'reg_alpha': 0.6616579190221874, 'reg_lambda': 1.2806309176921558}
Best xgb F1 score (positive class): 0.6405


[I 2025-09-01 23:20:20,536] A new study created in memory with name: no-name-b52b9804-3eb2-4e28-be5a-eefd0145c480
[I 2025-09-01 23:20:20,621] Trial 0 finished with value: 0.5145162724856699 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5145162724856699.


xgb test accuracy: 0.6513
xgb test F1 (positive): 0.6290

--- Optimizing DT ---


[I 2025-09-01 23:20:21,969] Trial 1 finished with value: 0.5056374100493523 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.5145162724856699.
[I 2025-09-01 23:20:22,057] Trial 2 finished with value: 0.6215390137916005 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.6215390137916005.
[I 2025-09-01 23:20:22,106] Trial 3 finished with value: 0.6652480809724332 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.6652480809724332.
[I 2025-09-01 23:20:22,147] Trial 4 finished with value: 0.6601719048175775 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_

Best dt params: {'criterion': 'gini', 'max_depth': 1, 'min_samples_split': 17, 'min_samples_leaf': 8, 'max_features': 'log2', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6815
dt test accuracy: 0.6195
dt test F1 (positive): 0.6061

OUTER FOLD 3/5
Train size: 4745, Test size: 1082
Class distribution in test set: {'non-void': np.int64(556), 'void': np.int64(526)}

--- Optimizing RF ---


[I 2025-09-01 23:20:29,558] Trial 0 finished with value: 0.5490808962821979 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.5490808962821979.
[I 2025-09-01 23:20:32,257] Trial 1 finished with value: 0.5814910563908158 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.5814910563908158.
[I 2025-09-01 23:20:57,294] Trial 2 finished with value: 0.5731882609471549 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.5814910563908158.
[I 2025-09-01 23:21:29,905] Trial 3 finished with value: 0.5632495227815424 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 494, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'bootstrap': False}
Best rf F1 score (positive class): 0.5852


[I 2025-09-01 23:27:28,640] A new study created in memory with name: no-name-f42ce6ee-e643-4075-854f-1382c4242b5d


rf test accuracy: 0.7579
rf test F1 (positive): 0.7277

--- Optimizing XGB ---


[I 2025-09-01 23:27:33,942] Trial 0 finished with value: 0.5382351544652355 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5382351544652355.
[I 2025-09-01 23:27:36,698] Trial 1 finished with value: 0.5274199498073017 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.5382351544652355.
[I 2025-09-01 23:27:39,806] Trial 2 finished with value: 0.5489890731527286 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 401, 'max_depth': 8, 'learning_rate': 0.019929485293110217, 'subsample': 0.9165361913165876, 'colsample_bytree': 0.7881312976766603, 'min_child_weight': 9, 'gamma': 4.753544988276152, 'reg_alpha': 0.7254592099636309, 'reg_lambda': 1.3350419570831598}
Best xgb F1 score (positive class): 0.5715


[I 2025-09-01 23:33:15,867] A new study created in memory with name: no-name-f52ea377-daf1-467a-a3b5-102c3757a8a5
[I 2025-09-01 23:33:15,959] Trial 0 finished with value: 0.5141560547775095 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5141560547775095.


xgb test accuracy: 0.6590
xgb test F1 (positive): 0.5877

--- Optimizing DT ---


[I 2025-09-01 23:33:17,461] Trial 1 finished with value: 0.4889710674905314 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.5141560547775095.
[I 2025-09-01 23:33:17,555] Trial 2 finished with value: 0.552365261217359 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.552365261217359.
[I 2025-09-01 23:33:17,607] Trial 3 finished with value: 0.5599946277705042 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.5599946277705042.
[I 2025-09-01 23:33:17,650] Trial 4 finished with value: 0.6461679540321791 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_fe

Best dt params: {'criterion': 'entropy', 'max_depth': 3, 'min_samples_split': 14, 'min_samples_leaf': 10, 'max_features': 'log2', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6526
dt test accuracy: 0.7597
dt test F1 (positive): 0.7619

OUTER FOLD 4/5
Train size: 4865, Test size: 962
Class distribution in test set: {'non-void': np.int64(508), 'void': np.int64(454)}

--- Optimizing RF ---


[I 2025-09-01 23:33:26,318] Trial 0 finished with value: 0.5669977924679213 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.5669977924679213.
[I 2025-09-01 23:33:28,998] Trial 1 finished with value: 0.6217739621776094 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6217739621776094.
[I 2025-09-01 23:33:54,039] Trial 2 finished with value: 0.5962615673953835 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6217739621776094.
[I 2025-09-01 23:34:27,508] Trial 3 finished with value: 0.5775884409545139 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 276, 'max_depth': 3, 'min_samples_split': 15, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}
Best rf F1 score (positive class): 0.6245


[I 2025-09-01 23:39:47,511] A new study created in memory with name: no-name-4c50c9cf-82de-4d36-938c-eb17ef486b32


rf test accuracy: 0.7505
rf test F1 (positive): 0.7248

--- Optimizing XGB ---


[I 2025-09-01 23:39:53,153] Trial 0 finished with value: 0.5687213569638382 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5687213569638382.
[I 2025-09-01 23:39:55,910] Trial 1 finished with value: 0.5423236763582328 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.5687213569638382.
[I 2025-09-01 23:39:58,664] Trial 2 finished with value: 0.552893760320499 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.6

Best xgb params: {'n_estimators': 84, 'max_depth': 3, 'learning_rate': 0.039173194051155505, 'subsample': 0.8528449636166299, 'colsample_bytree': 0.8754006721464518, 'min_child_weight': 2, 'gamma': 0.6155467087603368, 'reg_alpha': 0.410669417840048, 'reg_lambda': 0.5732501707247072}
Best xgb F1 score (positive class): 0.6264


[I 2025-09-01 23:42:24,980] A new study created in memory with name: no-name-f6c29cce-6e9b-41e8-a1b8-8abe573da36a
[I 2025-09-01 23:42:25,074] Trial 0 finished with value: 0.5573866472718163 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5573866472718163.


xgb test accuracy: 0.7360
xgb test F1 (positive): 0.6998

--- Optimizing DT ---


[I 2025-09-01 23:42:26,540] Trial 1 finished with value: 0.49748612739706255 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.5573866472718163.
[I 2025-09-01 23:42:26,638] Trial 2 finished with value: 0.5900346065460175 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.5900346065460175.
[I 2025-09-01 23:42:26,692] Trial 3 finished with value: 0.6389323581753655 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.6389323581753655.
[I 2025-09-01 23:42:26,736] Trial 4 finished with value: 0.6569614266487399 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max

Best dt params: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_features': 'sqrt', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6570
dt test accuracy: 0.7214
dt test F1 (positive): 0.6763

OUTER FOLD 5/5
Train size: 4394, Test size: 1433
Class distribution in test set: {'non-void': np.int64(1059), 'void': np.int64(374)}

--- Optimizing RF ---


[I 2025-09-01 23:42:36,424] Trial 0 finished with value: 0.6216701558065746 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6216701558065746.
[I 2025-09-01 23:42:39,010] Trial 1 finished with value: 0.631839824677703 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.631839824677703.
[I 2025-09-01 23:43:03,109] Trial 2 finished with value: 0.6370768153937271 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 2 with value: 0.6370768153937271.
[I 2025-09-01 23:43:34,668] Trial 3 finished with value: 0.6315587518078997 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_features'

Best rf params: {'n_estimators': 60, 'max_depth': 5, 'min_samples_split': 18, 'min_samples_leaf': 5, 'max_features': 'log2', 'bootstrap': True}
Best rf F1 score (positive class): 0.6469
rf test accuracy: 0.7962
rf test F1 (positive): 0.6524

--- Optimizing XGB ---


[I 2025-09-01 23:48:58,929] Trial 0 finished with value: 0.596049077108741 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.596049077108741.
[I 2025-09-01 23:49:02,551] Trial 1 finished with value: 0.593198837397409 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.596049077108741.
[I 2025-09-01 23:49:05,916] Trial 2 finished with value: 0.5887899805876219 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.6557

Best xgb params: {'n_estimators': 430, 'max_depth': 3, 'learning_rate': 0.013311477933563892, 'subsample': 0.9102397600868964, 'colsample_bytree': 0.6610248354839828, 'min_child_weight': 9, 'gamma': 1.0317634644804474, 'reg_alpha': 0.47249014449227733, 'reg_lambda': 0.9356853227116683}
Best xgb F1 score (positive class): 0.6495


[I 2025-09-01 23:54:11,628] A new study created in memory with name: no-name-55b72877-533c-4bea-b1d4-33b4d28c4c76
[I 2025-09-01 23:54:11,718] Trial 0 finished with value: 0.523579882320112 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.523579882320112.


xgb test accuracy: 0.7872
xgb test F1 (positive): 0.6276

--- Optimizing DT ---


[I 2025-09-01 23:54:13,004] Trial 1 finished with value: 0.5302766643099255 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 1 with value: 0.5302766643099255.
[I 2025-09-01 23:54:13,104] Trial 2 finished with value: 0.6217323608852742 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.6217323608852742.
[I 2025-09-01 23:54:13,155] Trial 3 finished with value: 0.5854491015848303 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.6217323608852742.
[I 2025-09-01 23:54:13,195] Trial 4 finished with value: 0.6769497968484383 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_

Best dt params: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_features': 'sqrt', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6769
dt test accuracy: 0.7634
dt test F1 (positive): 0.6405

BINARY NESTED CROSS-VALIDATION RESULTS SUMMARY
Positive class: 'void'

RF Results:
----------------------------------------
accuracy          : 0.7093 Â± 0.0831
f1_positive       : 0.6532 Â± 0.0907
precision_positive: 0.6508 Â± 0.1203
recall_positive   : 0.6679 Â± 0.1127
f1_macro          : 0.6960 Â± 0.0789
Individual fold accuracies: ['0.6068', '0.6351', '0.7579', '0.7505', '0.7962']
Individual fold F1 (pos): ['0.5040', '0.6569', '0.7277', '0.7248', '0.6524']

XGB Results:
----------------------------------------
accuracy          : 0.6870 Â± 0.0738
f1_positive       : 0.6126 Â± 0.0662
precision_positive: 0.6358 Â± 0.0960
recall_positive   : 0.6005 Â± 0.0867
f1_macro          : 0.6719 Â± 0.0633
Individual fold accuracies: ['0.6015', '0.6513',

[I 2025-09-01 23:54:20,457] Trial 0 finished with value: 0.6306919708096957 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6306919708096957.
[I 2025-09-01 23:54:21,433] Trial 1 finished with value: 0.6395072965786358 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6395072965786358.
[I 2025-09-01 23:54:24,209] Trial 2 finished with value: 0.6083516483516483 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6395072965786358.
[I 2025-09-01 23:54:26,754] Trial 3 finished with value: 0.628612785064398 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_features

Best rf params: {'n_estimators': 238, 'max_depth': 4, 'min_samples_split': 19, 'min_samples_leaf': 6, 'max_features': 'log2', 'bootstrap': False}
Best rf F1 score (positive class): 0.6518


[I 2025-09-01 23:55:22,676] A new study created in memory with name: no-name-bc2eb33b-2ae0-446c-8084-563a6e65dc6b


rf test accuracy: 0.7485
rf test F1 (positive): 0.5981

--- Optimizing XGB ---


[I 2025-09-01 23:55:24,389] Trial 0 finished with value: 0.5919376512157432 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5919376512157432.
[I 2025-09-01 23:55:26,551] Trial 1 finished with value: 0.6134367256259079 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 1 with value: 0.6134367256259079.
[I 2025-09-01 23:55:27,899] Trial 2 finished with value: 0.6182358698959008 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 281, 'max_depth': 8, 'learning_rate': 0.011711509955524094, 'subsample': 0.8430179407605753, 'colsample_bytree': 0.6682096494749166, 'min_child_weight': 1, 'gamma': 4.7444276862666666, 'reg_alpha': 1.9312640661491187, 'reg_lambda': 1.6167946962329223}
Best xgb F1 score (positive class): 0.6391


[I 2025-09-01 23:56:55,426] A new study created in memory with name: no-name-98c66323-06c2-4693-b5f8-adf8678ac16e
[I 2025-09-01 23:56:55,453] Trial 0 finished with value: 0.6187010107181169 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.6187010107181169.
[I 2025-09-01 23:56:55,600] Trial 1 finished with value: 0.5758929080405293 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.6187010107181169.
[I 2025-09-01 23:56:55,625] Trial 2 finished with value: 0.5997935105909894 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 0 with value: 0.6187010107181169.


xgb test accuracy: 0.7427
xgb test F1 (positive): 0.5600

--- Optimizing DT ---


[I 2025-09-01 23:56:55,647] Trial 3 finished with value: 0.6127077223851417 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 0 with value: 0.6187010107181169.
[I 2025-09-01 23:56:55,669] Trial 4 finished with value: 0.6336260187919264 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 4 with value: 0.6336260187919264.
[I 2025-09-01 23:56:55,689] Trial 5 finished with value: 0.6032595609033197 and parameters: {'criterion': 'gini', 'max_depth': 19, 'min_samples_split': 19, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'splitter': 'random'}. Best is trial 4 with value: 0.6336260187919264.
[I 2025-09-01 23:56:55,716] Trial 6 finished with value: 0.583185805659518 and parameters: {'criterion': 'gini', 'max_depth': 17, 'min_samples_split': 8, 'min_samples_leaf': 3, 'ma

Best dt params: {'criterion': 'gini', 'max_depth': 3, 'min_samples_split': 14, 'min_samples_leaf': 8, 'max_features': 'log2', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6621
dt test accuracy: 0.7076
dt test F1 (positive): 0.5833

OUTER FOLD 2/5
Train size: 627, Test size: 162
Class distribution in test set: {'non-void': np.int64(107), 'void': np.int64(55)}

--- Optimizing RF ---


[I 2025-09-01 23:56:58,050] Trial 0 finished with value: 0.7027274223624347 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.7027274223624347.
[I 2025-09-01 23:56:59,004] Trial 1 finished with value: 0.7023439425722752 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 0 with value: 0.7027274223624347.
[I 2025-09-01 23:57:01,719] Trial 2 finished with value: 0.6864426063945387 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 0 with value: 0.7027274223624347.
[I 2025-09-01 23:57:04,241] Trial 3 finished with value: 0.7012701789819938 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 170, 'max_depth': 20, 'min_samples_split': 10, 'min_samples_leaf': 2, 'max_features': 'log2', 'bootstrap': True}
Best rf F1 score (positive class): 0.7147


[I 2025-09-01 23:58:04,775] A new study created in memory with name: no-name-fcbdee7c-5791-4a40-80f4-8bcfb4adfff3


rf test accuracy: 0.6420
rf test F1 (positive): 0.5606

--- Optimizing XGB ---


[I 2025-09-01 23:58:06,666] Trial 0 finished with value: 0.6797554074241358 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.6797554074241358.
[I 2025-09-01 23:58:08,225] Trial 1 finished with value: 0.6460552916818901 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.6797554074241358.
[I 2025-09-01 23:58:09,612] Trial 2 finished with value: 0.6710849550152869 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 220, 'max_depth': 4, 'learning_rate': 0.01490480262138383, 'subsample': 0.8429869347789518, 'colsample_bytree': 0.6425899051092601, 'min_child_weight': 2, 'gamma': 3.9789018179273223, 'reg_alpha': 1.6575862542719724, 'reg_lambda': 0.1699716371289243}
Best xgb F1 score (positive class): 0.7152


[I 2025-09-01 23:59:28,549] A new study created in memory with name: no-name-436b86bb-0375-4155-bcde-cd498eeb04e6
[I 2025-09-01 23:59:28,579] Trial 0 finished with value: 0.5900871058765795 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5900871058765795.
[I 2025-09-01 23:59:28,729] Trial 1 finished with value: 0.5817318546337759 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.5900871058765795.


xgb test accuracy: 0.6543
xgb test F1 (positive): 0.5821

--- Optimizing DT ---


[I 2025-09-01 23:59:28,754] Trial 2 finished with value: 0.5993110127945162 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.5993110127945162.
[I 2025-09-01 23:59:28,775] Trial 3 finished with value: 0.7059911929091487 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.7059911929091487.
[I 2025-09-01 23:59:28,796] Trial 4 finished with value: 0.6902696182314689 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.7059911929091487.
[I 2025-09-01 23:59:28,815] Trial 5 finished with value: 0.6115768463073853 and parameters: {'criterion': 'gini', 'max_depth': 19, 'min_samples_split': 19, 'min_samples_leaf': 6, 'max_

Best dt params: {'criterion': 'gini', 'max_depth': 4, 'min_samples_split': 6, 'min_samples_leaf': 1, 'max_features': 'sqrt', 'splitter': 'best'}
Best dt F1 score (positive class): 0.7232
dt test accuracy: 0.6296
dt test F1 (positive): 0.6000

OUTER FOLD 3/5
Train size: 653, Test size: 136
Class distribution in test set: {'non-void': np.int64(79), 'void': np.int64(57)}

--- Optimizing RF ---


[I 2025-09-01 23:59:31,339] Trial 0 finished with value: 0.5864560377182086 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.5864560377182086.
[I 2025-09-01 23:59:32,340] Trial 1 finished with value: 0.572241655832987 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 0 with value: 0.5864560377182086.
[I 2025-09-01 23:59:35,300] Trial 2 finished with value: 0.612064947260478 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 2 with value: 0.612064947260478.
[I 2025-09-01 23:59:38,034] Trial 3 finished with value: 0.6122065889954713 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_features':

Best rf params: {'n_estimators': 116, 'max_depth': 3, 'min_samples_split': 11, 'min_samples_leaf': 10, 'max_features': None, 'bootstrap': False}
Best rf F1 score (positive class): 0.6444


[I 2025-09-02 00:01:10,677] A new study created in memory with name: no-name-9b6988a6-ba68-4bd1-af47-4dd343d763ce


rf test accuracy: 0.7941
rf test F1 (positive): 0.7742

--- Optimizing XGB ---


[I 2025-09-02 00:01:12,442] Trial 0 finished with value: 0.5325658551380393 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5325658551380393.
[I 2025-09-02 00:01:13,957] Trial 1 finished with value: 0.573682625715146 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 1 with value: 0.573682625715146.
[I 2025-09-02 00:01:15,362] Trial 2 finished with value: 0.5685520445605977 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.65

Best xgb params: {'n_estimators': 397, 'max_depth': 11, 'learning_rate': 0.013722315372926532, 'subsample': 0.6518394607057804, 'colsample_bytree': 0.8396100645838735, 'min_child_weight': 8, 'gamma': 4.9839999699394335, 'reg_alpha': 1.8101679144546727, 'reg_lambda': 0.5811072779217145}
Best xgb F1 score (positive class): 0.6052


[I 2025-09-02 00:02:40,954] A new study created in memory with name: no-name-3de1c2e2-8df2-4f9a-afc2-78a5e8bd2b66
[I 2025-09-02 00:02:40,983] Trial 0 finished with value: 0.526108568303639 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.526108568303639.
[I 2025-09-02 00:02:41,148] Trial 1 finished with value: 0.5575606625802852 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 1 with value: 0.5575606625802852.


xgb test accuracy: 0.8015
xgb test F1 (positive): 0.7731

--- Optimizing DT ---


[I 2025-09-02 00:02:41,173] Trial 2 finished with value: 0.5121678911085392 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 1 with value: 0.5575606625802852.
[I 2025-09-02 00:02:41,195] Trial 3 finished with value: 0.5314026669448356 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 1 with value: 0.5575606625802852.
[I 2025-09-02 00:02:41,215] Trial 4 finished with value: 0.5968898608073866 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 4 with value: 0.5968898608073866.
[I 2025-09-02 00:02:41,234] Trial 5 finished with value: 0.46406653746770027 and parameters: {'criterion': 'gini', 'max_depth': 19, 'min_samples_split': 19, 'min_samples_leaf': 6, 'max

Best dt params: {'criterion': 'entropy', 'max_depth': 2, 'min_samples_split': 11, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}
Best dt F1 score (positive class): 0.6654
dt test accuracy: 0.7794
dt test F1 (positive): 0.7619

OUTER FOLD 4/5
Train size: 615, Test size: 174
Class distribution in test set: {'non-void': np.int64(100), 'void': np.int64(74)}

--- Optimizing RF ---


[I 2025-09-02 00:02:44,784] Trial 0 finished with value: 0.614021164021164 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.614021164021164.
[I 2025-09-02 00:02:45,760] Trial 1 finished with value: 0.6344933202997719 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6344933202997719.
[I 2025-09-02 00:02:48,424] Trial 2 finished with value: 0.6180005212558676 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6344933202997719.
[I 2025-09-02 00:02:50,795] Trial 3 finished with value: 0.606097854126528 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_features':

Best rf params: {'n_estimators': 126, 'max_depth': 5, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': 'log2', 'bootstrap': False}
Best rf F1 score (positive class): 0.6431
rf test accuracy: 0.7241
rf test F1 (positive): 0.6883

--- Optimizing XGB ---


[I 2025-09-02 00:03:37,975] Trial 0 finished with value: 0.5523510971786835 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5523510971786835.
[I 2025-09-02 00:03:39,449] Trial 1 finished with value: 0.5503687836933923 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.5523510971786835.
[I 2025-09-02 00:03:40,628] Trial 2 finished with value: 0.5930112278845513 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 467, 'max_depth': 4, 'learning_rate': 0.010605682997532787, 'subsample': 0.6359197517401444, 'colsample_bytree': 0.6076295758343705, 'min_child_weight': 10, 'gamma': 3.7515598807230637, 'reg_alpha': 1.630262725233122, 'reg_lambda': 1.6080855663491742}
Best xgb F1 score (positive class): 0.6237


[I 2025-09-02 00:05:12,535] A new study created in memory with name: no-name-f4a30d80-cc0f-4599-a2b4-3f6c7031fde2
[I 2025-09-02 00:05:12,564] Trial 0 finished with value: 0.5117362838436686 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5117362838436686.
[I 2025-09-02 00:05:12,703] Trial 1 finished with value: 0.5060001597810139 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.5117362838436686.
[I 2025-09-02 00:05:12,727] Trial 2 finished with value: 0.6235717356778717 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.6235717356778717.


xgb test accuracy: 0.7529
xgb test F1 (positive): 0.7261

--- Optimizing DT ---


[I 2025-09-02 00:05:12,748] Trial 3 finished with value: 0.551856821102932 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.6235717356778717.
[I 2025-09-02 00:05:12,771] Trial 4 finished with value: 0.6452109274444301 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 4 with value: 0.6452109274444301.
[I 2025-09-02 00:05:12,791] Trial 5 finished with value: 0.5474080003989666 and parameters: {'criterion': 'gini', 'max_depth': 19, 'min_samples_split': 19, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'splitter': 'random'}. Best is trial 4 with value: 0.6452109274444301.
[I 2025-09-02 00:05:12,817] Trial 6 finished with value: 0.5170616622355156 and parameters: {'criterion': 'gini', 'max_depth': 17, 'min_samples_split': 8, 'min_samples_leaf': 3, 'ma

Best dt params: {'criterion': 'gini', 'max_depth': 3, 'min_samples_split': 14, 'min_samples_leaf': 5, 'max_features': 'log2', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6644
dt test accuracy: 0.7299
dt test F1 (positive): 0.7152

OUTER FOLD 5/5
Train size: 643, Test size: 146
Class distribution in test set: {'non-void': np.int64(69), 'void': np.int64(77)}

--- Optimizing RF ---


[I 2025-09-02 00:05:15,051] Trial 0 finished with value: 0.6026552868658132 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6026552868658132.
[I 2025-09-02 00:05:16,063] Trial 1 finished with value: 0.6218956482114376 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6218956482114376.
[I 2025-09-02 00:05:18,972] Trial 2 finished with value: 0.5970001361099768 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6218956482114376.
[I 2025-09-02 00:05:21,719] Trial 3 finished with value: 0.5959987459667015 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 378, 'max_depth': 3, 'min_samples_split': 18, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}
Best rf F1 score (positive class): 0.6263


[I 2025-09-02 00:06:27,331] A new study created in memory with name: no-name-8433f8e2-9e4d-4e87-96dd-ec27e181d431


rf test accuracy: 0.6918
rf test F1 (positive): 0.6667

--- Optimizing XGB ---


[I 2025-09-02 00:06:29,157] Trial 0 finished with value: 0.5275432201536004 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5275432201536004.
[I 2025-09-02 00:06:30,616] Trial 1 finished with value: 0.549648382559775 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 1 with value: 0.549648382559775.
[I 2025-09-02 00:06:31,925] Trial 2 finished with value: 0.6006606226720079 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.65

Best xgb params: {'n_estimators': 422, 'max_depth': 6, 'learning_rate': 0.013722315372926532, 'subsample': 0.7713117135047077, 'colsample_bytree': 0.740371877443526, 'min_child_weight': 3, 'gamma': 4.980236776874211, 'reg_alpha': 0.8198179033349909, 'reg_lambda': 1.3026296376062052}
Best xgb F1 score (positive class): 0.6183


[I 2025-09-02 00:07:59,782] A new study created in memory with name: no-name-5eb69436-6e4e-42d9-a210-be7eeaf86513
[I 2025-09-02 00:07:59,809] Trial 0 finished with value: 0.5418793444331772 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5418793444331772.
[I 2025-09-02 00:07:59,964] Trial 1 finished with value: 0.5792940509610475 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 1 with value: 0.5792940509610475.


xgb test accuracy: 0.6849
xgb test F1 (positive): 0.6567

--- Optimizing DT ---


[I 2025-09-02 00:07:59,994] Trial 2 finished with value: 0.564263671551121 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 1 with value: 0.5792940509610475.
[I 2025-09-02 00:08:00,019] Trial 3 finished with value: 0.5844384707287933 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.5844384707287933.
[I 2025-09-02 00:08:00,039] Trial 4 finished with value: 0.6179152348224513 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 4 with value: 0.6179152348224513.
[I 2025-09-02 00:08:00,056] Trial 5 finished with value: 0.5367063351186125 and parameters: {'criterion': 'gini', 'max_depth': 19, 'min_samples_split': 19, 'min_samples_leaf': 6, 'max_f

Best dt params: {'criterion': 'entropy', 'max_depth': 4, 'min_samples_split': 12, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}
Best dt F1 score (positive class): 0.6749
dt test accuracy: 0.6507
dt test F1 (positive): 0.6047

BINARY NESTED CROSS-VALIDATION RESULTS SUMMARY
Positive class: 'void'

RF Results:
----------------------------------------
accuracy          : 0.7201 Â± 0.0575
f1_positive       : 0.6576 Â± 0.0830
precision_positive: 0.6632 Â± 0.1109
recall_positive   : 0.6698 Â± 0.1202
f1_macro          : 0.7080 Â± 0.0588
Individual fold accuracies: ['0.7485', '0.6420', '0.7941', '0.7241', '0.6918']
Individual fold F1 (pos): ['0.5981', '0.5606', '0.7742', '0.6883', '0.6667']

XGB Results:
----------------------------------------
accuracy          : 0.7273 Â± 0.0581
f1_positive       : 0.6596 Â± 0.0912
precision_positive: 0.6789 Â± 0.1089
recall_positive   : 0.6649 Â± 0.1426
f1_macro          : 0.7129 Â± 0.0612
Individual fold accuracies: ['0.7427', '0.6543', '

[I 2025-09-02 00:08:04,500] Trial 0 finished with value: 0.6300620014302704 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6300620014302704.
[I 2025-09-02 00:08:05,773] Trial 1 finished with value: 0.6532806374911638 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6532806374911638.
[I 2025-09-02 00:08:11,899] Trial 2 finished with value: 0.654888527005172 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 2 with value: 0.654888527005172.
[I 2025-09-02 00:08:18,455] Trial 3 finished with value: 0.6483924506373594 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_features'

Best rf params: {'n_estimators': 447, 'max_depth': 3, 'min_samples_split': 9, 'min_samples_leaf': 7, 'max_features': None, 'bootstrap': True}
Best rf F1 score (positive class): 0.6910


[I 2025-09-02 00:13:09,656] A new study created in memory with name: no-name-c8a6ae8a-8d62-4c7d-9f86-691c25ec57bf


rf test accuracy: 0.5270
rf test F1 (positive): 0.4878

--- Optimizing XGB ---


[I 2025-09-02 00:13:12,422] Trial 0 finished with value: 0.5977757687533843 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5977757687533843.
[I 2025-09-02 00:13:14,207] Trial 1 finished with value: 0.60802813869201 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 1 with value: 0.60802813869201.
[I 2025-09-02 00:13:15,770] Trial 2 finished with value: 0.5942173884096531 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.6557

Best xgb params: {'n_estimators': 161, 'max_depth': 11, 'learning_rate': 0.051536500549364414, 'subsample': 0.8310728434128972, 'colsample_bytree': 0.9636703693123553, 'min_child_weight': 4, 'gamma': 2.9870313353299833, 'reg_alpha': 1.9148024888438644, 'reg_lambda': 0.8294134059272851}
Best xgb F1 score (positive class): 0.6316


[I 2025-09-02 00:15:22,310] A new study created in memory with name: no-name-7b30ba38-38b1-4b70-a5ee-8f9d61b9e3d2
[I 2025-09-02 00:15:22,351] Trial 0 finished with value: 0.4948139561465692 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.4948139561465692.


xgb test accuracy: 0.4910
xgb test F1 (positive): 0.3957

--- Optimizing DT ---


[I 2025-09-02 00:15:22,673] Trial 1 finished with value: 0.5287455673758865 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 1 with value: 0.5287455673758865.
[I 2025-09-02 00:15:22,710] Trial 2 finished with value: 0.5860085059951147 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.5860085059951147.
[I 2025-09-02 00:15:22,736] Trial 3 finished with value: 0.6240556574546176 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.6240556574546176.
[I 2025-09-02 00:15:22,759] Trial 4 finished with value: 0.3888516157888852 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_

Best dt params: {'criterion': 'entropy', 'max_depth': 2, 'min_samples_split': 8, 'min_samples_leaf': 10, 'max_features': None, 'splitter': 'best'}
Best dt F1 score (positive class): 0.6771
dt test accuracy: 0.5270
dt test F1 (positive): 0.4724

OUTER FOLD 2/5
Train size: 1173, Test size: 387
Class distribution in test set: {'non-void': np.int64(295), 'void': np.int64(92)}

--- Optimizing RF ---


[I 2025-09-02 00:15:27,590] Trial 0 finished with value: 0.6578497472100836 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6578497472100836.
[I 2025-09-02 00:15:28,861] Trial 1 finished with value: 0.6876359051181044 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6876359051181044.
[I 2025-09-02 00:15:34,307] Trial 2 finished with value: 0.6665762578949002 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6876359051181044.
[I 2025-09-02 00:15:40,067] Trial 3 finished with value: 0.6642757215924042 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 354, 'max_depth': 3, 'min_samples_split': 19, 'min_samples_leaf': 8, 'max_features': None, 'bootstrap': False}
Best rf F1 score (positive class): 0.6969


[I 2025-09-02 00:19:06,247] A new study created in memory with name: no-name-53cea81d-af2e-4ad5-8d7b-ab15e357f5ac


rf test accuracy: 0.6977
rf test F1 (positive): 0.5745

--- Optimizing XGB ---


[I 2025-09-02 00:19:08,786] Trial 0 finished with value: 0.6268732380465377 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.6268732380465377.
[I 2025-09-02 00:19:10,468] Trial 1 finished with value: 0.6081345329819886 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.6268732380465377.
[I 2025-09-02 00:19:12,177] Trial 2 finished with value: 0.6148287461155264 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 483, 'max_depth': 6, 'learning_rate': 0.012334908058927596, 'subsample': 0.9767468597751854, 'colsample_bytree': 0.8204561954021153, 'min_child_weight': 5, 'gamma': 4.98368075374295, 'reg_alpha': 1.7375863699933205, 'reg_lambda': 1.7310883983441585}
Best xgb F1 score (positive class): 0.6947


[I 2025-09-02 00:21:28,598] A new study created in memory with name: no-name-46393296-7ab8-4d3c-a3ab-e1a84bc966ae
[I 2025-09-02 00:21:28,637] Trial 0 finished with value: 0.5795173983468668 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5795173983468668.


xgb test accuracy: 0.7442
xgb test F1 (positive): 0.5308

--- Optimizing DT ---


[I 2025-09-02 00:21:28,939] Trial 1 finished with value: 0.5687602907756011 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.5795173983468668.
[I 2025-09-02 00:21:28,976] Trial 2 finished with value: 0.6210584531435522 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.6210584531435522.
[I 2025-09-02 00:21:29,002] Trial 3 finished with value: 0.6366591688157873 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.6366591688157873.
[I 2025-09-02 00:21:29,026] Trial 4 finished with value: 0.6745371338456444 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_

Best dt params: {'criterion': 'entropy', 'max_depth': 4, 'min_samples_split': 16, 'min_samples_leaf': 7, 'max_features': 'log2', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6801
dt test accuracy: 0.7313
dt test F1 (positive): 0.5873

OUTER FOLD 3/5
Train size: 1320, Test size: 240
Class distribution in test set: {'non-void': np.int64(126), 'void': np.int64(114)}

--- Optimizing RF ---


[I 2025-09-02 00:21:32,103] Trial 0 finished with value: 0.6030586598023455 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6030586598023455.
[I 2025-09-02 00:21:33,409] Trial 1 finished with value: 0.6444790048506511 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6444790048506511.
[I 2025-09-02 00:21:39,706] Trial 2 finished with value: 0.6201076907052608 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6444790048506511.
[I 2025-09-02 00:21:46,247] Trial 3 finished with value: 0.6249689531947669 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 394, 'max_depth': 3, 'min_samples_split': 18, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}
Best rf F1 score (positive class): 0.6463


[I 2025-09-02 00:23:46,027] A new study created in memory with name: no-name-805edd54-dfc9-4fd4-a502-da5b5424fef0


rf test accuracy: 0.6625
rf test F1 (positive): 0.5759

--- Optimizing XGB ---


[I 2025-09-02 00:23:48,732] Trial 0 finished with value: 0.5827609918613703 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5827609918613703.
[I 2025-09-02 00:23:50,519] Trial 1 finished with value: 0.5828939984641739 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 1 with value: 0.5828939984641739.
[I 2025-09-02 00:23:52,262] Trial 2 finished with value: 0.5994049039376769 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 448, 'max_depth': 5, 'learning_rate': 0.014595740084542603, 'subsample': 0.7646944513303342, 'colsample_bytree': 0.7278922423975088, 'min_child_weight': 7, 'gamma': 4.591516909721552, 'reg_alpha': 1.9991183681841573, 'reg_lambda': 1.1495662000362536}
Best xgb F1 score (positive class): 0.6265


[I 2025-09-02 00:25:50,402] A new study created in memory with name: no-name-ded1f497-6d3d-4e78-9933-bf07aba7b993
[I 2025-09-02 00:25:50,440] Trial 0 finished with value: 0.5504630854813253 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5504630854813253.


xgb test accuracy: 0.6583
xgb test F1 (positive): 0.5941

--- Optimizing DT ---


[I 2025-09-02 00:25:50,789] Trial 1 finished with value: 0.5221586960056027 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.5504630854813253.
[I 2025-09-02 00:25:50,827] Trial 2 finished with value: 0.55839575989663 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.55839575989663.
[I 2025-09-02 00:25:50,853] Trial 3 finished with value: 0.6566389568052159 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.6566389568052159.
[I 2025-09-02 00:25:50,876] Trial 4 finished with value: 0.6204626432119004 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_feat

Best dt params: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 13, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6578
dt test accuracy: 0.6458
dt test F1 (positive): 0.5550

OUTER FOLD 4/5
Train size: 1178, Test size: 382
Class distribution in test set: {'non-void': np.int64(223), 'void': np.int64(159)}

--- Optimizing RF ---


[I 2025-09-02 00:25:54,101] Trial 0 finished with value: 0.6205294341206634 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6205294341206634.
[I 2025-09-02 00:25:55,360] Trial 1 finished with value: 0.6514600234439376 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6514600234439376.
[I 2025-09-02 00:26:00,635] Trial 2 finished with value: 0.6018714657797937 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6514600234439376.
[I 2025-09-02 00:26:05,998] Trial 3 finished with value: 0.6183258768484682 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 469, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'bootstrap': False}
Best rf F1 score (positive class): 0.6538


[I 2025-09-02 00:27:48,226] A new study created in memory with name: no-name-bff5bc40-35e8-4c58-a5d4-ed7aa28ce62a


rf test accuracy: 0.6937
rf test F1 (positive): 0.6686

--- Optimizing XGB ---


[I 2025-09-02 00:27:50,768] Trial 0 finished with value: 0.5853369259207613 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5853369259207613.
[I 2025-09-02 00:27:52,599] Trial 1 finished with value: 0.5489007220488702 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.5853369259207613.
[I 2025-09-02 00:27:54,804] Trial 2 finished with value: 0.5763326410522672 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 299, 'max_depth': 3, 'learning_rate': 0.013809176019878846, 'subsample': 0.6577780577663715, 'colsample_bytree': 0.6465255811631712, 'min_child_weight': 3, 'gamma': 4.9908772787626186, 'reg_alpha': 1.2826122543957705, 'reg_lambda': 1.3752224749575765}
Best xgb F1 score (positive class): 0.6403


[I 2025-09-02 00:29:19,837] A new study created in memory with name: no-name-a929b0c9-26c4-4822-adff-eb91e29c891c
[I 2025-09-02 00:29:19,874] Trial 0 finished with value: 0.5396891118250566 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5396891118250566.


xgb test accuracy: 0.6937
xgb test F1 (positive): 0.6777

--- Optimizing DT ---


[I 2025-09-02 00:29:20,154] Trial 1 finished with value: 0.5076473985569171 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.5396891118250566.
[I 2025-09-02 00:29:20,191] Trial 2 finished with value: 0.603417181385261 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.603417181385261.
[I 2025-09-02 00:29:20,217] Trial 3 finished with value: 0.5358761315815567 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.603417181385261.
[I 2025-09-02 00:29:20,240] Trial 4 finished with value: 0.6491180288568755 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_fea

Best dt params: {'criterion': 'gini', 'max_depth': 1, 'min_samples_split': 9, 'min_samples_leaf': 4, 'max_features': 'log2', 'splitter': 'random'}
Best dt F1 score (positive class): 0.6502
dt test accuracy: 0.5969
dt test F1 (positive): 0.6500

OUTER FOLD 5/5
Train size: 1231, Test size: 329
Class distribution in test set: {'non-void': np.int64(170), 'void': np.int64(159)}

--- Optimizing RF ---


[I 2025-09-02 00:29:23,313] Trial 0 finished with value: 0.5428387630894491 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.5428387630894491.
[I 2025-09-02 00:29:24,625] Trial 1 finished with value: 0.5852861151431378 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.5852861151431378.
[I 2025-09-02 00:29:30,469] Trial 2 finished with value: 0.552553055193933 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.5852861151431378.
[I 2025-09-02 00:29:36,499] Trial 3 finished with value: 0.5572251190594757 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_features

Best rf params: {'n_estimators': 135, 'max_depth': 3, 'min_samples_split': 14, 'min_samples_leaf': 10, 'max_features': None, 'bootstrap': False}
Best rf F1 score (positive class): 0.6434


[I 2025-09-02 00:31:40,142] A new study created in memory with name: no-name-d222b205-62ae-42f5-83b7-bb5dd42a4403


rf test accuracy: 0.7781
rf test F1 (positive): 0.7978

--- Optimizing XGB ---


[I 2025-09-02 00:31:42,749] Trial 0 finished with value: 0.5445692729200226 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5445692729200226.
[I 2025-09-02 00:31:44,561] Trial 1 finished with value: 0.5333214619057397 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.5445692729200226.
[I 2025-09-02 00:31:46,157] Trial 2 finished with value: 0.5571532637121003 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 476, 'max_depth': 9, 'learning_rate': 0.029323105618991638, 'subsample': 0.6071847502459278, 'colsample_bytree': 0.9924283304357214, 'min_child_weight': 7, 'gamma': 4.865188803848123, 'reg_alpha': 1.2481670543447305, 'reg_lambda': 0.07959921215402954}
Best xgb F1 score (positive class): 0.5764


[I 2025-09-02 00:33:31,476] A new study created in memory with name: no-name-0848c828-8add-4054-a47d-62f7a9492172
[I 2025-09-02 00:33:31,516] Trial 0 finished with value: 0.47051675977181384 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.47051675977181384.


xgb test accuracy: 0.7538
xgb test F1 (positive): 0.7216

--- Optimizing DT ---


[I 2025-09-02 00:33:31,862] Trial 1 finished with value: 0.43579108019631513 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.47051675977181384.
[I 2025-09-02 00:33:31,898] Trial 2 finished with value: 0.4901775211372735 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.4901775211372735.
[I 2025-09-02 00:33:31,923] Trial 3 finished with value: 0.5811974851636407 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.5811974851636407.
[I 2025-09-02 00:33:31,947] Trial 4 finished with value: 0.6164337137788465 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'ma

Best dt params: {'criterion': 'entropy', 'max_depth': 2, 'min_samples_split': 17, 'min_samples_leaf': 3, 'max_features': None, 'splitter': 'best'}
Best dt F1 score (positive class): 0.6516
dt test accuracy: 0.7781
dt test F1 (positive): 0.7978

BINARY NESTED CROSS-VALIDATION RESULTS SUMMARY
Positive class: 'void'

RF Results:
----------------------------------------
accuracy          : 0.6718 Â± 0.0915
f1_positive       : 0.6209 Â± 0.1177
precision_positive: 0.6125 Â± 0.1156
recall_positive   : 0.6804 Â± 0.2219
f1_macro          : 0.6620 Â± 0.0910
Individual fold accuracies: ['0.5270', '0.6977', '0.6625', '0.6937', '0.7781']
Individual fold F1 (pos): ['0.4878', '0.5745', '0.5759', '0.6686', '0.7978']

XGB Results:
----------------------------------------
accuracy          : 0.6682 Â± 0.1064
f1_positive       : 0.5840 Â± 0.1286
precision_positive: 0.6223 Â± 0.1232
recall_positive   : 0.5750 Â± 0.1751
f1_macro          : 0.6497 Â± 0.1028
Individual fold accuracies: ['0.4910', '0.7442', '

[I 2025-09-02 00:33:38,356] Trial 0 finished with value: 0.6624743406296915 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6624743406296915.
[I 2025-09-02 00:33:40,293] Trial 1 finished with value: 0.6816401031694336 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6816401031694336.
[I 2025-09-02 00:33:55,882] Trial 2 finished with value: 0.6498145004087279 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6816401031694336.
[I 2025-09-02 00:34:15,158] Trial 3 finished with value: 0.6375260353400812 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 187, 'max_depth': 4, 'min_samples_split': 15, 'min_samples_leaf': 5, 'max_features': 'log2', 'bootstrap': True}
Best rf F1 score (positive class): 0.6869


[I 2025-09-02 00:37:37,595] A new study created in memory with name: no-name-beb04b96-56fd-4692-bfd8-1a3f1bb3541e


rf test accuracy: 0.6162
rf test F1 (positive): 0.5523

--- Optimizing XGB ---


[I 2025-09-02 00:37:41,554] Trial 0 finished with value: 0.6344189594221445 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.6344189594221445.
[I 2025-09-02 00:37:43,819] Trial 1 finished with value: 0.6101661603608365 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.6344189594221445.
[I 2025-09-02 00:37:46,337] Trial 2 finished with value: 0.6305288149368206 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 322, 'max_depth': 7, 'learning_rate': 0.0380476508590428, 'subsample': 0.8142937359963967, 'colsample_bytree': 0.7038210687659125, 'min_child_weight': 4, 'gamma': 3.865243379334843, 'reg_alpha': 1.8116734212404515, 'reg_lambda': 1.1707309681753792}
Best xgb F1 score (positive class): 0.6558


[I 2025-09-02 00:41:08,316] A new study created in memory with name: no-name-fb091fda-0f28-492b-a87b-b95063364804
[I 2025-09-02 00:41:08,403] Trial 0 finished with value: 0.5557229512336864 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5557229512336864.


xgb test accuracy: 0.6232
xgb test F1 (positive): 0.5417

--- Optimizing DT ---


[I 2025-09-02 00:41:09,306] Trial 1 finished with value: 0.48417985362684207 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.5557229512336864.
[I 2025-09-02 00:41:09,375] Trial 2 finished with value: 0.5233201394465417 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 0 with value: 0.5557229512336864.
[I 2025-09-02 00:41:09,415] Trial 3 finished with value: 0.6843674796074054 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.6843674796074054.
[I 2025-09-02 00:41:09,449] Trial 4 finished with value: 0.6558961252805199 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max

Best dt params: {'criterion': 'gini', 'max_depth': 3, 'min_samples_split': 7, 'min_samples_leaf': 5, 'max_features': None, 'splitter': 'random'}
Best dt F1 score (positive class): 0.6923
dt test accuracy: 0.6625
dt test F1 (positive): 0.6240

OUTER FOLD 2/5
Train size: 3255, Test size: 635
Class distribution in test set: {'non-void': np.int64(359), 'void': np.int64(276)}

--- Optimizing RF ---


[I 2025-09-02 00:41:15,172] Trial 0 finished with value: 0.6265956776599277 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6265956776599277.
[I 2025-09-02 00:41:17,316] Trial 1 finished with value: 0.6530093035996919 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6530093035996919.
[I 2025-09-02 00:41:34,597] Trial 2 finished with value: 0.6308402313048074 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6530093035996919.
[I 2025-09-02 00:41:56,305] Trial 3 finished with value: 0.6265504843136884 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}
Best rf F1 score (positive class): 0.6530


[I 2025-09-02 00:46:01,356] A new study created in memory with name: no-name-dac9ddbc-31b1-4918-89a2-95de5f5079dc


rf test accuracy: 0.7008
rf test F1 (positive): 0.6667

--- Optimizing XGB ---


[I 2025-09-02 00:46:05,732] Trial 0 finished with value: 0.6155755467495905 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.6155755467495905.
[I 2025-09-02 00:46:08,357] Trial 1 finished with value: 0.6257685688532343 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 1 with value: 0.6257685688532343.
[I 2025-09-02 00:46:10,768] Trial 2 finished with value: 0.6105350965526138 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 90, 'max_depth': 11, 'learning_rate': 0.07407914089939316, 'subsample': 0.8932717448732964, 'colsample_bytree': 0.647431934053385, 'min_child_weight': 1, 'gamma': 1.9205393339580246, 'reg_alpha': 0.20106670485807218, 'reg_lambda': 1.8547177136123283}
Best xgb F1 score (positive class): 0.6340


[I 2025-09-02 00:49:19,466] A new study created in memory with name: no-name-4778bdf2-2a89-4bac-a0a5-d787727fda3e
[I 2025-09-02 00:49:19,536] Trial 0 finished with value: 0.5607216402888547 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5607216402888547.


xgb test accuracy: 0.6394
xgb test F1 (positive): 0.5903

--- Optimizing DT ---


[I 2025-09-02 00:49:20,485] Trial 1 finished with value: 0.5688313426769854 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 1 with value: 0.5688313426769854.
[I 2025-09-02 00:49:20,555] Trial 2 finished with value: 0.5661376056503982 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 1 with value: 0.5688313426769854.
[I 2025-09-02 00:49:20,595] Trial 3 finished with value: 0.5046557745193455 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 1 with value: 0.5688313426769854.
[I 2025-09-02 00:49:20,629] Trial 4 finished with value: 0.5975308510442164 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_

Best dt params: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 16, 'min_samples_leaf': 9, 'max_features': None, 'splitter': 'best'}
Best dt F1 score (positive class): 0.6848
dt test accuracy: 0.6803
dt test F1 (positive): 0.6710

OUTER FOLD 3/5
Train size: 3053, Test size: 837
Class distribution in test set: {'non-void': np.int64(460), 'void': np.int64(377)}

--- Optimizing RF ---


[I 2025-09-02 00:49:33,436] Trial 0 finished with value: 0.5838091658017037 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.5838091658017037.
[I 2025-09-02 00:49:35,544] Trial 1 finished with value: 0.633058355259069 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.633058355259069.
[I 2025-09-02 00:49:51,535] Trial 2 finished with value: 0.6056027242282758 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.633058355259069.
[I 2025-09-02 00:50:11,160] Trial 3 finished with value: 0.5915587548410184 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_features':

Best rf params: {'n_estimators': 381, 'max_depth': 3, 'min_samples_split': 5, 'min_samples_leaf': 10, 'max_features': None, 'bootstrap': False}
Best rf F1 score (positive class): 0.6665


[I 2025-09-02 00:58:08,809] A new study created in memory with name: no-name-79e86df9-3af0-403d-a8bb-8fcbfbee44db


rf test accuracy: 0.6153
rf test F1 (positive): 0.4806

--- Optimizing XGB ---


[I 2025-09-02 00:58:12,789] Trial 0 finished with value: 0.5872659853263495 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5872659853263495.
[I 2025-09-02 00:58:15,176] Trial 1 finished with value: 0.5634534102172895 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.5872659853263495.
[I 2025-09-02 00:58:17,634] Trial 2 finished with value: 0.5995594455731305 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 308, 'max_depth': 3, 'learning_rate': 0.012233786724800038, 'subsample': 0.940087495052042, 'colsample_bytree': 0.6568367512072792, 'min_child_weight': 8, 'gamma': 2.550653888377429, 'reg_alpha': 1.8052169864032344, 'reg_lambda': 1.533484488932477}
Best xgb F1 score (positive class): 0.6371


[I 2025-09-02 01:01:23,966] A new study created in memory with name: no-name-74b22040-fa13-4828-bab1-4ae1d6a5cb7c
[I 2025-09-02 01:01:24,029] Trial 0 finished with value: 0.48730871189101904 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.48730871189101904.


xgb test accuracy: 0.6750
xgb test F1 (positive): 0.5763

--- Optimizing DT ---


[I 2025-09-02 01:01:24,817] Trial 1 finished with value: 0.5298129868714442 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 1 with value: 0.5298129868714442.
[I 2025-09-02 01:01:24,881] Trial 2 finished with value: 0.6088025985612854 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.6088025985612854.
[I 2025-09-02 01:01:24,919] Trial 3 finished with value: 0.6568060060547581 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.6568060060547581.
[I 2025-09-02 01:01:24,952] Trial 4 finished with value: 0.6485415994780598 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_

Best dt params: {'criterion': 'gini', 'max_depth': 3, 'min_samples_split': 11, 'min_samples_leaf': 3, 'max_features': None, 'splitter': 'best'}
Best dt F1 score (positive class): 0.6761
dt test accuracy: 0.6153
dt test F1 (positive): 0.4806

OUTER FOLD 4/5
Train size: 3089, Test size: 801
Class distribution in test set: {'non-void': np.int64(501), 'void': np.int64(300)}

--- Optimizing RF ---


[I 2025-09-02 01:01:35,397] Trial 0 finished with value: 0.6253926995144683 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6253926995144683.
[I 2025-09-02 01:01:37,420] Trial 1 finished with value: 0.6262752542104769 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6262752542104769.
[I 2025-09-02 01:01:52,912] Trial 2 finished with value: 0.6314514612512735 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 2 with value: 0.6314514612512735.
[I 2025-09-02 01:02:11,592] Trial 3 finished with value: 0.6200283811068555 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 445, 'max_depth': 10, 'min_samples_split': 14, 'min_samples_leaf': 2, 'max_features': 'sqrt', 'bootstrap': False}
Best rf F1 score (positive class): 0.6408


[I 2025-09-02 01:04:56,420] A new study created in memory with name: no-name-91f82de5-4020-4503-9e4b-ce68ca8edd12


rf test accuracy: 0.7603
rf test F1 (positive): 0.7225

--- Optimizing XGB ---


[I 2025-09-02 01:05:00,654] Trial 0 finished with value: 0.5970174912592795 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5970174912592795.
[I 2025-09-02 01:05:03,074] Trial 1 finished with value: 0.5902276678726115 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.5970174912592795.
[I 2025-09-02 01:05:05,533] Trial 2 finished with value: 0.605256982981917 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.6

Best xgb params: {'n_estimators': 229, 'max_depth': 3, 'learning_rate': 0.011094598354660047, 'subsample': 0.8751687485453679, 'colsample_bytree': 0.8426745672785929, 'min_child_weight': 2, 'gamma': 2.1829907027427176, 'reg_alpha': 0.8151976277110418, 'reg_lambda': 1.0960170876202544}
Best xgb F1 score (positive class): 0.6265


[I 2025-09-02 01:08:10,017] A new study created in memory with name: no-name-87fecf2c-7fb2-4bdd-8cf3-bf0a0b194164
[I 2025-09-02 01:08:10,085] Trial 0 finished with value: 0.5704907253876326 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5704907253876326.


xgb test accuracy: 0.7765
xgb test F1 (positive): 0.7578

--- Optimizing DT ---


[I 2025-09-02 01:08:10,919] Trial 1 finished with value: 0.4971361526768736 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.5704907253876326.
[I 2025-09-02 01:08:10,984] Trial 2 finished with value: 0.5273261435808325 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 0 with value: 0.5704907253876326.
[I 2025-09-02 01:08:11,023] Trial 3 finished with value: 0.5969581414830714 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.5969581414830714.
[I 2025-09-02 01:08:11,055] Trial 4 finished with value: 0.6315894192249396 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_

Best dt params: {'criterion': 'gini', 'max_depth': 5, 'min_samples_split': 7, 'min_samples_leaf': 10, 'max_features': None, 'splitter': 'best'}
Best dt F1 score (positive class): 0.6411


[I 2025-09-02 01:08:19,969] A new study created in memory with name: no-name-0a6218e0-65d9-477e-833b-c95cf84eb4dc


dt test accuracy: 0.6954
dt test F1 (positive): 0.6139

OUTER FOLD 5/5
Train size: 2987, Test size: 903
Class distribution in test set: {'non-void': np.int64(563), 'void': np.int64(340)}

--- Optimizing RF ---


[I 2025-09-02 01:08:21,726] Trial 0 finished with value: 0.5545128903488006 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.5545128903488006.
[I 2025-09-02 01:08:23,765] Trial 1 finished with value: 0.6201833151391113 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6201833151391113.
[I 2025-09-02 01:08:39,455] Trial 2 finished with value: 0.5430151084190455 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6201833151391113.
[I 2025-09-02 01:08:58,878] Trial 3 finished with value: 0.5321758880879135 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 467, 'max_depth': 3, 'min_samples_split': 14, 'min_samples_leaf': 8, 'max_features': None, 'bootstrap': False}
Best rf F1 score (positive class): 0.6228


[I 2025-09-02 01:18:32,666] A new study created in memory with name: no-name-05fc326f-2b3c-4743-abe1-4dcb9983dd69


rf test accuracy: 0.7608
rf test F1 (positive): 0.7313

--- Optimizing XGB ---


[I 2025-09-02 01:18:36,748] Trial 0 finished with value: 0.5290841593315977 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5290841593315977.
[I 2025-09-02 01:18:39,041] Trial 1 finished with value: 0.5213187474081433 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.5290841593315977.
[I 2025-09-02 01:18:41,518] Trial 2 finished with value: 0.5402583325834968 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 237, 'max_depth': 3, 'learning_rate': 0.015971276731317242, 'subsample': 0.9750065620989762, 'colsample_bytree': 0.8701985937888853, 'min_child_weight': 8, 'gamma': 1.6669718330637786, 'reg_alpha': 0.7001050188182057, 'reg_lambda': 0.24430644980453542}
Best xgb F1 score (positive class): 0.5919


[I 2025-09-02 01:21:08,444] A new study created in memory with name: no-name-a5d5e29a-1020-4c92-afbc-d0abe6c4bb70
[I 2025-09-02 01:21:08,509] Trial 0 finished with value: 0.5414377445651162 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5414377445651162.


xgb test accuracy: 0.7641
xgb test F1 (positive): 0.6835

--- Optimizing DT ---


[I 2025-09-02 01:21:09,348] Trial 1 finished with value: 0.49434970311258813 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.5414377445651162.
[I 2025-09-02 01:21:09,411] Trial 2 finished with value: 0.4832831979123789 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 0 with value: 0.5414377445651162.
[I 2025-09-02 01:21:09,449] Trial 3 finished with value: 0.5946421220541319 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.5946421220541319.
[I 2025-09-02 01:21:09,482] Trial 4 finished with value: 0.6659065526784086 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max

Best dt params: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_features': 'sqrt', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6659
dt test accuracy: 0.6224
dt test F1 (positive): 0.6510

BINARY NESTED CROSS-VALIDATION RESULTS SUMMARY
Positive class: 'void'

RF Results:
----------------------------------------
accuracy          : 0.6907 Â± 0.0726
f1_positive       : 0.6307 Â± 0.1101
precision_positive: 0.6239 Â± 0.0231
recall_positive   : 0.6603 Â± 0.2015
f1_macro          : 0.6814 Â± 0.0803
Individual fold accuracies: ['0.6162', '0.7008', '0.6153', '0.7603', '0.7608']
Individual fold F1 (pos): ['0.5523', '0.6667', '0.4806', '0.7225', '0.7313']

XGB Results:
----------------------------------------
accuracy          : 0.6957 Â± 0.0708
f1_positive       : 0.6299 Â± 0.0886
precision_positive: 0.6433 Â± 0.0506
recall_positive   : 0.6375 Â± 0.1831
f1_macro          : 0.6849 Â± 0.0724
Individual fold accuracies: ['0.6232', '0.6394',

[I 2025-09-02 01:21:14,847] Trial 0 finished with value: 0.5971741372241998 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.5971741372241998.
[I 2025-09-02 01:21:15,770] Trial 1 finished with value: 0.6153414304993252 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6153414304993252.
[I 2025-09-02 01:21:17,782] Trial 2 finished with value: 0.5713391222163152 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6153414304993252.
[I 2025-09-02 01:21:19,606] Trial 3 finished with value: 0.5875367633486334 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 92, 'max_depth': 3, 'min_samples_split': 10, 'min_samples_leaf': 1, 'max_features': 'sqrt', 'bootstrap': True}
Best rf F1 score (positive class): 0.6320
rf test accuracy: 0.7417
rf test F1 (positive): 0.7207

--- Optimizing XGB ---


[I 2025-09-02 01:21:56,508] Trial 0 finished with value: 0.5737205947809834 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5737205947809834.
[I 2025-09-02 01:21:58,151] Trial 1 finished with value: 0.5659481183777859 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.5737205947809834.
[I 2025-09-02 01:21:59,246] Trial 2 finished with value: 0.5706363561927305 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 476, 'max_depth': 9, 'learning_rate': 0.02384124679699214, 'subsample': 0.9729161367647149, 'colsample_bytree': 0.8076576013037925, 'min_child_weight': 7, 'gamma': 4.865417857436737, 'reg_alpha': 1.199831273625152, 'reg_lambda': 1.315924369942073}
Best xgb F1 score (positive class): 0.6105


[I 2025-09-02 01:23:12,294] A new study created in memory with name: no-name-b6905d07-fccc-4a2f-bc03-abc02eac30e8
[I 2025-09-02 01:23:12,316] Trial 0 finished with value: 0.5126620798080975 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5126620798080975.
[I 2025-09-02 01:23:12,414] Trial 1 finished with value: 0.47854451628036526 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.5126620798080975.
[I 2025-09-02 01:23:12,436] Trial 2 finished with value: 0.6087516864151447 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.6087516864151447.
[I 2025-09-02 01:23:12,455] Trial 3 finished with value: 0.579164396

xgb test accuracy: 0.6750
xgb test F1 (positive): 0.6422

--- Optimizing DT ---


[I 2025-09-02 01:23:12,514] Trial 6 finished with value: 0.5153769316646102 and parameters: {'criterion': 'gini', 'max_depth': 17, 'min_samples_split': 8, 'min_samples_leaf': 3, 'max_features': None, 'splitter': 'random'}. Best is trial 2 with value: 0.6087516864151447.
[I 2025-09-02 01:23:12,535] Trial 7 finished with value: 0.6435208240577368 and parameters: {'criterion': 'gini', 'max_depth': 1, 'min_samples_split': 17, 'min_samples_leaf': 8, 'max_features': 'log2', 'splitter': 'best'}. Best is trial 7 with value: 0.6435208240577368.
[I 2025-09-02 01:23:12,559] Trial 8 finished with value: 0.5999676610882044 and parameters: {'criterion': 'gini', 'max_depth': 7, 'min_samples_split': 3, 'min_samples_leaf': 4, 'max_features': 'log2', 'splitter': 'best'}. Best is trial 7 with value: 0.6435208240577368.
[I 2025-09-02 01:23:12,579] Trial 9 finished with value: 0.45808306629902873 and parameters: {'criterion': 'entropy', 'max_depth': 16, 'min_samples_split': 12, 'min_samples_leaf': 8, 'max_

Best dt params: {'criterion': 'gini', 'max_depth': 1, 'min_samples_split': 17, 'min_samples_leaf': 8, 'max_features': 'log2', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6435
dt test accuracy: 0.6250
dt test F1 (positive): 0.7020

OUTER FOLD 2/5
Train size: 446, Test size: 137
Class distribution in test set: {'non-void': np.int64(89), 'void': np.int64(48)}

--- Optimizing RF ---


[I 2025-09-02 01:23:14,629] Trial 0 finished with value: 0.6094885687855162 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6094885687855162.
[I 2025-09-02 01:23:15,622] Trial 1 finished with value: 0.6121102004367701 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6121102004367701.
[I 2025-09-02 01:23:17,548] Trial 2 finished with value: 0.6009777334427174 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6121102004367701.
[I 2025-09-02 01:23:19,378] Trial 3 finished with value: 0.6214927826578313 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 476, 'max_depth': 3, 'min_samples_split': 7, 'min_samples_leaf': 4, 'max_features': 'log2', 'bootstrap': False}
Best rf F1 score (positive class): 0.6412


[I 2025-09-02 01:24:17,048] A new study created in memory with name: no-name-953b8e68-148b-4722-a028-f9c67f255554


rf test accuracy: 0.7591
rf test F1 (positive): 0.5926

--- Optimizing XGB ---


[I 2025-09-02 01:24:18,405] Trial 0 finished with value: 0.601416936118699 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.601416936118699.
[I 2025-09-02 01:24:20,652] Trial 1 finished with value: 0.5617924528301886 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.601416936118699.
[I 2025-09-02 01:24:21,702] Trial 2 finished with value: 0.5641782382619471 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.655

Best xgb params: {'n_estimators': 325, 'max_depth': 12, 'learning_rate': 0.0253021606894538, 'subsample': 0.6186458766901913, 'colsample_bytree': 0.6032100349746359, 'min_child_weight': 1, 'gamma': 4.75230560116798, 'reg_alpha': 1.7392421525851762, 'reg_lambda': 1.8276761898046916}
Best xgb F1 score (positive class): 0.6413


[I 2025-09-02 01:25:30,606] A new study created in memory with name: no-name-2559a50b-db6e-4857-98fb-b5c9911e64a0
[I 2025-09-02 01:25:30,629] Trial 0 finished with value: 0.49142400956616655 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.49142400956616655.
[I 2025-09-02 01:25:30,721] Trial 1 finished with value: 0.5118173687872384 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 1 with value: 0.5118173687872384.
[I 2025-09-02 01:25:30,743] Trial 2 finished with value: 0.46899469264994226 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 1 with value: 0.5118173687872384.
[I 2025-09-02 01:25:30,761] Trial 3 finished with value: 0.5963992

xgb test accuracy: 0.7664
xgb test F1 (positive): 0.5897

--- Optimizing DT ---


[I 2025-09-02 01:25:30,821] Trial 6 finished with value: 0.6194161142274349 and parameters: {'criterion': 'gini', 'max_depth': 17, 'min_samples_split': 8, 'min_samples_leaf': 3, 'max_features': None, 'splitter': 'random'}. Best is trial 4 with value: 0.6289762621686511.
[I 2025-09-02 01:25:30,840] Trial 7 finished with value: 0.6189693608574021 and parameters: {'criterion': 'gini', 'max_depth': 1, 'min_samples_split': 17, 'min_samples_leaf': 8, 'max_features': 'log2', 'splitter': 'best'}. Best is trial 4 with value: 0.6289762621686511.
[I 2025-09-02 01:25:30,867] Trial 8 finished with value: 0.5168844450022544 and parameters: {'criterion': 'gini', 'max_depth': 7, 'min_samples_split': 3, 'min_samples_leaf': 4, 'max_features': 'log2', 'splitter': 'best'}. Best is trial 4 with value: 0.6289762621686511.
[I 2025-09-02 01:25:30,886] Trial 9 finished with value: 0.5674651336101352 and parameters: {'criterion': 'entropy', 'max_depth': 16, 'min_samples_split': 12, 'min_samples_leaf': 8, 'max_f

Best dt params: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 19, 'min_samples_leaf': 8, 'max_features': 'log2', 'splitter': 'random'}
Best dt F1 score (positive class): 0.6413
dt test accuracy: 0.6715
dt test F1 (positive): 0.4828

OUTER FOLD 3/5
Train size: 490, Test size: 93
Class distribution in test set: {'non-void': np.int64(43), 'void': np.int64(50)}

--- Optimizing RF ---


[I 2025-09-02 01:25:33,068] Trial 0 finished with value: 0.6033280958265929 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6033280958265929.
[I 2025-09-02 01:25:33,984] Trial 1 finished with value: 0.6045716367967721 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6045716367967721.
[I 2025-09-02 01:25:36,103] Trial 2 finished with value: 0.6193302546243723 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 2 with value: 0.6193302546243723.
[I 2025-09-02 01:25:38,069] Trial 3 finished with value: 0.6164597042828137 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 462, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}
Best rf F1 score (positive class): 0.6422


[I 2025-09-02 01:27:12,770] A new study created in memory with name: no-name-8d53a3c0-3e45-4817-99d3-4c305165e095


rf test accuracy: 0.6774
rf test F1 (positive): 0.6429

--- Optimizing XGB ---


[I 2025-09-02 01:27:14,217] Trial 0 finished with value: 0.600103680914327 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.600103680914327.
[I 2025-09-02 01:27:15,947] Trial 1 finished with value: 0.5801238911677243 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.600103680914327.
[I 2025-09-02 01:27:16,948] Trial 2 finished with value: 0.5835880435959636 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.655

Best xgb params: {'n_estimators': 337, 'max_depth': 7, 'learning_rate': 0.19178540972667618, 'subsample': 0.8809192537925273, 'colsample_bytree': 0.6327381995694799, 'min_child_weight': 1, 'gamma': 0.41793109132985834, 'reg_alpha': 0.34710650187239867, 'reg_lambda': 1.0357647096994267}
Best xgb F1 score (positive class): 0.6167


[I 2025-09-02 01:28:30,456] A new study created in memory with name: no-name-89ab49b3-3474-4d6f-aeb8-71032e6dfdd9
[I 2025-09-02 01:28:30,479] Trial 0 finished with value: 0.47858881641740875 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.47858881641740875.
[I 2025-09-02 01:28:30,589] Trial 1 finished with value: 0.5416928436714001 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 1 with value: 0.5416928436714001.
[I 2025-09-02 01:28:30,612] Trial 2 finished with value: 0.6312315995439765 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.6312315995439765.
[I 2025-09-02 01:28:30,633] Trial 3 finished with value: 0.55672558

xgb test accuracy: 0.5914
xgb test F1 (positive): 0.4865

--- Optimizing DT ---


[I 2025-09-02 01:28:30,670] Trial 5 finished with value: 0.5803478918340603 and parameters: {'criterion': 'gini', 'max_depth': 19, 'min_samples_split': 19, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'splitter': 'random'}. Best is trial 4 with value: 0.6351638995317156.
[I 2025-09-02 01:28:30,696] Trial 6 finished with value: 0.5337896233618159 and parameters: {'criterion': 'gini', 'max_depth': 17, 'min_samples_split': 8, 'min_samples_leaf': 3, 'max_features': None, 'splitter': 'random'}. Best is trial 4 with value: 0.6351638995317156.
[I 2025-09-02 01:28:30,716] Trial 7 finished with value: 0.6144349477682811 and parameters: {'criterion': 'gini', 'max_depth': 1, 'min_samples_split': 17, 'min_samples_leaf': 8, 'max_features': 'log2', 'splitter': 'best'}. Best is trial 4 with value: 0.6351638995317156.
[I 2025-09-02 01:28:30,738] Trial 8 finished with value: 0.5141161500483534 and parameters: {'criterion': 'gini', 'max_depth': 7, 'min_samples_split': 3, 'min_samples_leaf': 4, 'max_fe

Best dt params: {'criterion': 'entropy', 'max_depth': 2, 'min_samples_split': 16, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6558
dt test accuracy: 0.6559
dt test F1 (positive): 0.6444

OUTER FOLD 4/5
Train size: 475, Test size: 108
Class distribution in test set: {'non-void': np.int64(67), 'void': np.int64(41)}

--- Optimizing RF ---


[I 2025-09-02 01:28:32,742] Trial 0 finished with value: 0.6554285714285715 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6554285714285715.
[I 2025-09-02 01:28:33,674] Trial 1 finished with value: 0.6835224811867251 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6835224811867251.
[I 2025-09-02 01:28:35,692] Trial 2 finished with value: 0.6575449755109549 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6835224811867251.
[I 2025-09-02 01:28:37,659] Trial 3 finished with value: 0.6860481059270577 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 247, 'max_depth': 4, 'min_samples_split': 17, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}
Best rf F1 score (positive class): 0.6968


[I 2025-09-02 01:29:35,178] A new study created in memory with name: no-name-8a5b8afb-5605-4dd1-aad4-2476bc7283b0


rf test accuracy: 0.6481
rf test F1 (positive): 0.6346

--- Optimizing XGB ---


[I 2025-09-02 01:29:36,628] Trial 0 finished with value: 0.593758227016099 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.593758227016099.
[I 2025-09-02 01:29:38,371] Trial 1 finished with value: 0.5925759342550946 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.593758227016099.
[I 2025-09-02 01:29:39,361] Trial 2 finished with value: 0.6107109182662627 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.655

Best xgb params: {'n_estimators': 381, 'max_depth': 4, 'learning_rate': 0.019847338137917225, 'subsample': 0.9563624876978447, 'colsample_bytree': 0.8927937416625484, 'min_child_weight': 3, 'gamma': 4.567426695951508, 'reg_alpha': 1.617200145324437, 'reg_lambda': 1.2777192444248844}
Best xgb F1 score (positive class): 0.6687


[I 2025-09-02 01:30:58,379] A new study created in memory with name: no-name-0284043e-da08-49c7-97dd-76d90fc652a4
[I 2025-09-02 01:30:58,402] Trial 0 finished with value: 0.5265641749679714 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5265641749679714.
[I 2025-09-02 01:30:58,504] Trial 1 finished with value: 0.5168959151220792 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.5265641749679714.
[I 2025-09-02 01:30:58,527] Trial 2 finished with value: 0.5074282280572753 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 0 with value: 0.5265641749679714.
[I 2025-09-02 01:30:58,546] Trial 3 finished with value: 0.6729914529

xgb test accuracy: 0.6574
xgb test F1 (positive): 0.6408

--- Optimizing DT ---


[I 2025-09-02 01:30:58,582] Trial 5 finished with value: 0.5558564793917325 and parameters: {'criterion': 'gini', 'max_depth': 19, 'min_samples_split': 19, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'splitter': 'random'}. Best is trial 3 with value: 0.6729914529914529.
[I 2025-09-02 01:30:58,606] Trial 6 finished with value: 0.550460285982674 and parameters: {'criterion': 'gini', 'max_depth': 17, 'min_samples_split': 8, 'min_samples_leaf': 3, 'max_features': None, 'splitter': 'random'}. Best is trial 3 with value: 0.6729914529914529.
[I 2025-09-02 01:30:58,627] Trial 7 finished with value: 0.6324435909400051 and parameters: {'criterion': 'gini', 'max_depth': 1, 'min_samples_split': 17, 'min_samples_leaf': 8, 'max_features': 'log2', 'splitter': 'best'}. Best is trial 3 with value: 0.6729914529914529.
[I 2025-09-02 01:30:58,650] Trial 8 finished with value: 0.451999266400737 and parameters: {'criterion': 'gini', 'max_depth': 7, 'min_samples_split': 3, 'min_samples_leaf': 4, 'max_feat

Best dt params: {'criterion': 'entropy', 'max_depth': 2, 'min_samples_split': 14, 'min_samples_leaf': 8, 'max_features': 'sqrt', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6842
dt test accuracy: 0.6389
dt test F1 (positive): 0.6486

OUTER FOLD 5/5
Train size: 458, Test size: 125
Class distribution in test set: {'non-void': np.int64(81), 'void': np.int64(44)}

--- Optimizing RF ---


[I 2025-09-02 01:31:00,904] Trial 0 finished with value: 0.6652777777777779 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6652777777777779.
[I 2025-09-02 01:31:01,827] Trial 1 finished with value: 0.6592877569602072 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 0 with value: 0.6652777777777779.
[I 2025-09-02 01:31:03,777] Trial 2 finished with value: 0.659822940235039 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 0 with value: 0.6652777777777779.
[I 2025-09-02 01:31:05,594] Trial 3 finished with value: 0.6492653688497013 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_features

Best rf params: {'n_estimators': 137, 'max_depth': 14, 'min_samples_split': 7, 'min_samples_leaf': 4, 'max_features': 'sqrt', 'bootstrap': False}
Best rf F1 score (positive class): 0.6752
rf test accuracy: 0.7680
rf test F1 (positive): 0.6813

--- Optimizing XGB ---


[I 2025-09-02 01:31:50,536] Trial 0 finished with value: 0.6189415847310585 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.6189415847310585.
[I 2025-09-02 01:31:52,198] Trial 1 finished with value: 0.5869331247184886 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.6189415847310585.
[I 2025-09-02 01:31:53,213] Trial 2 finished with value: 0.6201673709503687 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 118, 'max_depth': 8, 'learning_rate': 0.02986829042381973, 'subsample': 0.7599669359815587, 'colsample_bytree': 0.8250122810664506, 'min_child_weight': 1, 'gamma': 4.847256739455992, 'reg_alpha': 1.2143685480664512, 'reg_lambda': 1.3761977960261167}
Best xgb F1 score (positive class): 0.6572


[I 2025-09-02 01:32:59,523] A new study created in memory with name: no-name-65d1da91-7d62-4e20-9eba-a87a232d08e0
[I 2025-09-02 01:32:59,546] Trial 0 finished with value: 0.4782815273800017 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.4782815273800017.
[I 2025-09-02 01:32:59,653] Trial 1 finished with value: 0.5514037406383916 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 1 with value: 0.5514037406383916.
[I 2025-09-02 01:32:59,677] Trial 2 finished with value: 0.4885068532258116 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 1 with value: 0.5514037406383916.
[I 2025-09-02 01:32:59,696] Trial 3 finished with value: 0.5027354498

xgb test accuracy: 0.7600
xgb test F1 (positive): 0.6875

--- Optimizing DT ---


[I 2025-09-02 01:32:59,735] Trial 5 finished with value: 0.5428516642108875 and parameters: {'criterion': 'gini', 'max_depth': 19, 'min_samples_split': 19, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'splitter': 'random'}. Best is trial 4 with value: 0.6593320513879223.
[I 2025-09-02 01:32:59,759] Trial 6 finished with value: 0.5540215625461528 and parameters: {'criterion': 'gini', 'max_depth': 17, 'min_samples_split': 8, 'min_samples_leaf': 3, 'max_features': None, 'splitter': 'random'}. Best is trial 4 with value: 0.6593320513879223.
[I 2025-09-02 01:32:59,779] Trial 7 finished with value: 0.6331114365597125 and parameters: {'criterion': 'gini', 'max_depth': 1, 'min_samples_split': 17, 'min_samples_leaf': 8, 'max_features': 'log2', 'splitter': 'best'}. Best is trial 4 with value: 0.6593320513879223.
[I 2025-09-02 01:32:59,802] Trial 8 finished with value: 0.5275764551269125 and parameters: {'criterion': 'gini', 'max_depth': 7, 'min_samples_split': 3, 'min_samples_leaf': 4, 'max_fe

Best dt params: {'criterion': 'entropy', 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 3, 'max_features': 'log2', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6783
dt test accuracy: 0.7200
dt test F1 (positive): 0.7009

BINARY NESTED CROSS-VALIDATION RESULTS SUMMARY
Positive class: 'void'

RF Results:
----------------------------------------
accuracy          : 0.7189 Â± 0.0531
f1_positive       : 0.6544 Â± 0.0487
precision_positive: 0.6838 Â± 0.1015
recall_positive   : 0.6553 Â± 0.1298
f1_macro          : 0.7045 Â± 0.0432
Individual fold accuracies: ['0.7417', '0.7591', '0.6774', '0.6481', '0.7680']
Individual fold F1 (pos): ['0.7207', '0.5926', '0.6429', '0.6346', '0.6813']

XGB Results:
----------------------------------------
accuracy          : 0.6900 Â± 0.0737
f1_positive       : 0.6093 Â± 0.0769
precision_positive: 0.6663 Â± 0.0954
recall_positive   : 0.6061 Â± 0.1856
f1_macro          : 0.6724 Â± 0.0655
Individual fold accuracies: ['0.6750', '0.7664',

[I 2025-09-02 01:33:02,243] Trial 0 finished with value: 0.5403828373725584 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.5403828373725584.
[I 2025-09-02 01:33:03,385] Trial 1 finished with value: 0.5561258916522075 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.5561258916522075.
[I 2025-09-02 01:33:07,606] Trial 2 finished with value: 0.5482869891795015 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.5561258916522075.
[I 2025-09-02 01:33:11,786] Trial 3 finished with value: 0.5535291969401763 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 85, 'max_depth': 5, 'min_samples_split': 11, 'min_samples_leaf': 3, 'max_features': None, 'bootstrap': True}
Best rf F1 score (positive class): 0.5751


[I 2025-09-02 01:34:33,477] A new study created in memory with name: no-name-3dad1e17-7f43-440e-b179-bf79a98adc46


rf test accuracy: 0.7822
rf test F1 (positive): 0.7135

--- Optimizing XGB ---


[I 2025-09-02 01:34:35,618] Trial 0 finished with value: 0.5648488350207258 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5648488350207258.
[I 2025-09-02 01:34:37,451] Trial 1 finished with value: 0.5556921835298501 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.5648488350207258.
[I 2025-09-02 01:34:38,943] Trial 2 finished with value: 0.5620138478165342 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 255, 'max_depth': 7, 'learning_rate': 0.13102429503540533, 'subsample': 0.6378636106676994, 'colsample_bytree': 0.7899857023931112, 'min_child_weight': 2, 'gamma': 1.0701754259499836, 'reg_alpha': 1.4280808431106862, 'reg_lambda': 0.15119000388643364}
Best xgb F1 score (positive class): 0.5757


[I 2025-09-02 01:36:00,809] A new study created in memory with name: no-name-a46cd77a-e418-4440-974e-55d7c2586702
[I 2025-09-02 01:36:00,841] Trial 0 finished with value: 0.4683793580309397 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.4683793580309397.


xgb test accuracy: 0.7289
xgb test F1 (positive): 0.5612

--- Optimizing DT ---


[I 2025-09-02 01:36:01,055] Trial 1 finished with value: 0.5092203548085901 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 1 with value: 0.5092203548085901.
[I 2025-09-02 01:36:01,085] Trial 2 finished with value: 0.5663217877853519 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.5663217877853519.
[I 2025-09-02 01:36:01,107] Trial 3 finished with value: 0.6061678412555606 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.6061678412555606.
[I 2025-09-02 01:36:01,127] Trial 4 finished with value: 0.6451684405172777 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_

Best dt params: {'criterion': 'gini', 'max_depth': 1, 'min_samples_split': 9, 'min_samples_leaf': 2, 'max_features': 'log2', 'splitter': 'random'}
Best dt F1 score (positive class): 0.6575
dt test accuracy: 0.7289
dt test F1 (positive): 0.6839

OUTER FOLD 2/5
Train size: 964, Test size: 184
Class distribution in test set: {'non-void': np.int64(114), 'void': np.int64(70)}

--- Optimizing RF ---


[I 2025-09-02 01:36:03,891] Trial 0 finished with value: 0.6541241925283927 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6541241925283927.
[I 2025-09-02 01:36:04,998] Trial 1 finished with value: 0.6509883110346271 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 0 with value: 0.6541241925283927.
[I 2025-09-02 01:36:09,201] Trial 2 finished with value: 0.6501534936102306 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 0 with value: 0.6541241925283927.
[I 2025-09-02 01:36:13,393] Trial 3 finished with value: 0.6465567941594642 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 142, 'max_depth': 7, 'min_samples_split': 14, 'min_samples_leaf': 3, 'max_features': 'log2', 'bootstrap': True}
Best rf F1 score (positive class): 0.6743


[I 2025-09-02 01:37:27,109] A new study created in memory with name: no-name-d45a9b58-efc2-4496-8dac-868a01c93f29


rf test accuracy: 0.5870
rf test F1 (positive): 0.3968

--- Optimizing XGB ---


[I 2025-09-02 01:37:29,262] Trial 0 finished with value: 0.6262545926792751 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.6262545926792751.
[I 2025-09-02 01:37:31,043] Trial 1 finished with value: 0.6034950247753016 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.6262545926792751.
[I 2025-09-02 01:37:33,011] Trial 2 finished with value: 0.6115761708770083 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 472, 'max_depth': 10, 'learning_rate': 0.012760440114602511, 'subsample': 0.7079831532336376, 'colsample_bytree': 0.692907634161448, 'min_child_weight': 9, 'gamma': 4.467508854122687, 'reg_alpha': 1.3757398889626218, 'reg_lambda': 1.24743573065857}
Best xgb F1 score (positive class): 0.6560


[I 2025-09-02 01:39:41,514] A new study created in memory with name: no-name-c98e6faa-adfc-405c-a19a-90ad6cc38136
[I 2025-09-02 01:39:41,545] Trial 0 finished with value: 0.5762145262145263 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5762145262145263.


xgb test accuracy: 0.6304
xgb test F1 (positive): 0.4688

--- Optimizing DT ---


[I 2025-09-02 01:39:41,776] Trial 1 finished with value: 0.5185856678665407 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.5762145262145263.
[I 2025-09-02 01:39:41,805] Trial 2 finished with value: 0.6233435156900861 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.6233435156900861.
[I 2025-09-02 01:39:41,827] Trial 3 finished with value: 0.6303673228606737 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.6303673228606737.
[I 2025-09-02 01:39:41,848] Trial 4 finished with value: 0.6246719984093722 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_

Best dt params: {'criterion': 'gini', 'max_depth': 4, 'min_samples_split': 16, 'min_samples_leaf': 10, 'max_features': 'log2', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6656
dt test accuracy: 0.5870
dt test F1 (positive): 0.5476

OUTER FOLD 3/5
Train size: 908, Test size: 240
Class distribution in test set: {'non-void': np.int64(145), 'void': np.int64(95)}

--- Optimizing RF ---


[I 2025-09-02 01:39:44,672] Trial 0 finished with value: 0.5955516261233019 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.5955516261233019.
[I 2025-09-02 01:39:45,876] Trial 1 finished with value: 0.6263566802684534 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6263566802684534.
[I 2025-09-02 01:39:49,967] Trial 2 finished with value: 0.6203918464381107 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6263566802684534.
[I 2025-09-02 01:39:53,951] Trial 3 finished with value: 0.6098038483859187 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 77, 'max_depth': 3, 'min_samples_split': 4, 'min_samples_leaf': 2, 'max_features': 'sqrt', 'bootstrap': True}
Best rf F1 score (positive class): 0.6533
rf test accuracy: 0.7250
rf test F1 (positive): 0.6733

--- Optimizing XGB ---


[I 2025-09-02 01:40:45,102] Trial 0 finished with value: 0.5813641196791389 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5813641196791389.
[I 2025-09-02 01:40:46,967] Trial 1 finished with value: 0.5949781156821711 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 1 with value: 0.5949781156821711.
[I 2025-09-02 01:40:48,494] Trial 2 finished with value: 0.5986396329012854 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 281, 'max_depth': 8, 'learning_rate': 0.011711509955524094, 'subsample': 0.8430179407605753, 'colsample_bytree': 0.6682096494749166, 'min_child_weight': 1, 'gamma': 4.7444276862666666, 'reg_alpha': 1.9312640661491187, 'reg_lambda': 1.6167946962329223}
Best xgb F1 score (positive class): 0.6261


[I 2025-09-02 01:42:16,239] A new study created in memory with name: no-name-fbeae945-66c1-45f9-aca9-7791ee210eed
[I 2025-09-02 01:42:16,268] Trial 0 finished with value: 0.5218946683123028 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5218946683123028.


xgb test accuracy: 0.7292
xgb test F1 (positive): 0.6701

--- Optimizing DT ---


[I 2025-09-02 01:42:16,492] Trial 1 finished with value: 0.4939397306039153 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.5218946683123028.
[I 2025-09-02 01:42:16,521] Trial 2 finished with value: 0.5526431387492378 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.5526431387492378.
[I 2025-09-02 01:42:16,544] Trial 3 finished with value: 0.5336097047961454 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.5526431387492378.
[I 2025-09-02 01:42:16,565] Trial 4 finished with value: 0.6703462775103386 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_

Best dt params: {'criterion': 'entropy', 'max_depth': 2, 'min_samples_split': 17, 'min_samples_leaf': 3, 'max_features': None, 'splitter': 'best'}
Best dt F1 score (positive class): 0.6728
dt test accuracy: 0.7292
dt test F1 (positive): 0.7137

OUTER FOLD 4/5
Train size: 924, Test size: 224
Class distribution in test set: {'non-void': np.int64(119), 'void': np.int64(105)}

--- Optimizing RF ---


[I 2025-09-02 01:42:20,987] Trial 0 finished with value: 0.5470056710464762 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.5470056710464762.
[I 2025-09-02 01:42:22,105] Trial 1 finished with value: 0.6159720677117195 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6159720677117195.
[I 2025-09-02 01:42:26,361] Trial 2 finished with value: 0.5716552228608528 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6159720677117195.
[I 2025-09-02 01:42:30,638] Trial 3 finished with value: 0.549092987263737 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_features

Best rf params: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}
Best rf F1 score (positive class): 0.6160


[I 2025-09-02 01:43:59,289] A new study created in memory with name: no-name-7d3c14f8-f9c7-4518-a207-feab3a2f6c2d


rf test accuracy: 0.7500
rf test F1 (positive): 0.6989

--- Optimizing XGB ---


[I 2025-09-02 01:44:01,461] Trial 0 finished with value: 0.5183396488313097 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5183396488313097.
[I 2025-09-02 01:44:03,250] Trial 1 finished with value: 0.5099968701095462 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.5183396488313097.
[I 2025-09-02 01:44:04,797] Trial 2 finished with value: 0.5112285842506797 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 92, 'max_depth': 3, 'learning_rate': 0.020626112753573914, 'subsample': 0.9556507914974237, 'colsample_bytree': 0.9700349154403322, 'min_child_weight': 3, 'gamma': 4.787916536971173, 'reg_alpha': 1.014800649584465, 'reg_lambda': 1.5169671153739943}
Best xgb F1 score (positive class): 0.5931


[I 2025-09-02 01:45:33,307] A new study created in memory with name: no-name-11e78c3b-c1b5-4bd7-99b0-33829ed3ff73
[I 2025-09-02 01:45:33,339] Trial 0 finished with value: 0.5311327649562944 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5311327649562944.


xgb test accuracy: 0.7321
xgb test F1 (positive): 0.6809

--- Optimizing DT ---


[I 2025-09-02 01:45:33,561] Trial 1 finished with value: 0.5470978218765831 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 1 with value: 0.5470978218765831.
[I 2025-09-02 01:45:33,594] Trial 2 finished with value: 0.5642500799043927 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.5642500799043927.
[I 2025-09-02 01:45:33,615] Trial 3 finished with value: 0.5807978363759296 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.5807978363759296.
[I 2025-09-02 01:45:33,635] Trial 4 finished with value: 0.5765159018159921 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_

Best dt params: {'criterion': 'gini', 'max_depth': 1, 'min_samples_split': 17, 'min_samples_leaf': 8, 'max_features': 'log2', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6434
dt test accuracy: 0.7188
dt test F1 (positive): 0.6557

OUTER FOLD 5/5
Train size: 873, Test size: 275
Class distribution in test set: {'non-void': np.int64(157), 'void': np.int64(118)}

--- Optimizing RF ---


[I 2025-09-02 01:45:36,273] Trial 0 finished with value: 0.623094178873405 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.623094178873405.
[I 2025-09-02 01:45:37,444] Trial 1 finished with value: 0.6529839986485478 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6529839986485478.
[I 2025-09-02 01:45:41,352] Trial 2 finished with value: 0.6511852239986027 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6529839986485478.
[I 2025-09-02 01:45:45,157] Trial 3 finished with value: 0.6373283889004413 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_features'

Best rf params: {'n_estimators': 455, 'max_depth': 3, 'min_samples_split': 13, 'min_samples_leaf': 4, 'max_features': 'sqrt', 'bootstrap': False}
Best rf F1 score (positive class): 0.6578


[I 2025-09-02 01:47:19,839] A new study created in memory with name: no-name-94b226fa-f8ff-4203-8204-8a40bd6d5b4d


rf test accuracy: 0.6655
rf test F1 (positive): 0.6230

--- Optimizing XGB ---


[I 2025-09-02 01:47:21,848] Trial 0 finished with value: 0.5828573077145001 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5828573077145001.
[I 2025-09-02 01:47:23,611] Trial 1 finished with value: 0.5871164065913929 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 1 with value: 0.5871164065913929.
[I 2025-09-02 01:47:25,282] Trial 2 finished with value: 0.5934112985374919 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 296, 'max_depth': 9, 'learning_rate': 0.09448858344160434, 'subsample': 0.8400436450707932, 'colsample_bytree': 0.6271422062258899, 'min_child_weight': 1, 'gamma': 4.733148171976474, 'reg_alpha': 1.4918437100130293, 'reg_lambda': 1.6641812089168282}
Best xgb F1 score (positive class): 0.6572


[I 2025-09-02 01:48:46,581] A new study created in memory with name: no-name-161dd273-7c58-451d-84c6-fd377530c527
[I 2025-09-02 01:48:46,611] Trial 0 finished with value: 0.5385572227111778 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5385572227111778.


xgb test accuracy: 0.6764
xgb test F1 (positive): 0.6307

--- Optimizing DT ---


[I 2025-09-02 01:48:46,806] Trial 1 finished with value: 0.5292021513601256 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.5385572227111778.
[I 2025-09-02 01:48:46,835] Trial 2 finished with value: 0.6075076386588089 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.6075076386588089.
[I 2025-09-02 01:48:46,857] Trial 3 finished with value: 0.6321261394432126 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.6321261394432126.
[I 2025-09-02 01:48:46,878] Trial 4 finished with value: 0.3903837454023327 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_

Best dt params: {'criterion': 'gini', 'max_depth': 1, 'min_samples_split': 10, 'min_samples_leaf': 9, 'max_features': None, 'splitter': 'best'}
Best dt F1 score (positive class): 0.6506
dt test accuracy: 0.6909
dt test F1 (positive): 0.6863

BINARY NESTED CROSS-VALIDATION RESULTS SUMMARY
Positive class: 'void'

RF Results:
----------------------------------------
accuracy          : 0.7019 Â± 0.0772
f1_positive       : 0.6211 Â± 0.1300
precision_positive: 0.6428 Â± 0.1348
recall_positive   : 0.6074 Â± 0.1455
f1_macro          : 0.6864 Â± 0.0903
Individual fold accuracies: ['0.7822', '0.5870', '0.7250', '0.7500', '0.6655']
Individual fold F1 (pos): ['0.7135', '0.3968', '0.6733', '0.6989', '0.6230']

XGB Results:
----------------------------------------
accuracy          : 0.6994 Â± 0.0450
f1_positive       : 0.6023 Â± 0.0882
precision_positive: 0.6607 Â± 0.1034
recall_positive   : 0.5650 Â± 0.1197
f1_macro          : 0.6784 Â± 0.0532
Individual fold accuracies: ['0.7289', '0.6304', '0.7

[I 2025-09-02 01:48:50,204] Trial 0 finished with value: 0.6000726216412491 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6000726216412491.
[I 2025-09-02 01:48:51,900] Trial 1 finished with value: 0.6384107296968718 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6384107296968718.
[I 2025-09-02 01:49:02,938] Trial 2 finished with value: 0.6120310723758999 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6384107296968718.
[I 2025-09-02 01:49:16,438] Trial 3 finished with value: 0.60147962354874 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_features'

Best rf params: {'n_estimators': 362, 'max_depth': 4, 'min_samples_split': 10, 'min_samples_leaf': 6, 'max_features': None, 'bootstrap': False}
Best rf F1 score (positive class): 0.6622


[I 2025-09-02 01:56:16,879] A new study created in memory with name: no-name-8ccc1f45-3d3c-47c3-95be-59734b7c1453


rf test accuracy: 0.7042
rf test F1 (positive): 0.6071

--- Optimizing XGB ---


[I 2025-09-02 01:56:20,083] Trial 0 finished with value: 0.5821670643243856 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5821670643243856.
[I 2025-09-02 01:56:22,355] Trial 1 finished with value: 0.5859705193410721 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 1 with value: 0.5859705193410721.
[I 2025-09-02 01:56:24,396] Trial 2 finished with value: 0.5756255381554397 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 117, 'max_depth': 3, 'learning_rate': 0.013385150015494653, 'subsample': 0.7085165410558034, 'colsample_bytree': 0.9584340763859297, 'min_child_weight': 8, 'gamma': 0.9972667530342793, 'reg_alpha': 1.9639697805099092, 'reg_lambda': 0.1127065373299995}
Best xgb F1 score (positive class): 0.6462


[I 2025-09-02 01:59:23,608] A new study created in memory with name: no-name-cbc00620-bf51-43bb-9f1b-f00bb488a7d5
[I 2025-09-02 01:59:23,663] Trial 0 finished with value: 0.5600547789840457 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5600547789840457.


xgb test accuracy: 0.7462
xgb test F1 (positive): 0.6607

--- Optimizing DT ---


[I 2025-09-02 01:59:24,244] Trial 1 finished with value: 0.483100778136292 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.5600547789840457.
[I 2025-09-02 01:59:24,297] Trial 2 finished with value: 0.5657494974041015 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.5657494974041015.
[I 2025-09-02 01:59:24,330] Trial 3 finished with value: 0.642906988198236 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.642906988198236.
[I 2025-09-02 01:59:24,359] Trial 4 finished with value: 0.6590662692673117 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_fea

Best dt params: {'criterion': 'entropy', 'max_depth': 2, 'min_samples_split': 17, 'min_samples_leaf': 5, 'max_features': None, 'splitter': 'best'}
Best dt F1 score (positive class): 0.6657
dt test accuracy: 0.7529
dt test F1 (positive): 0.6839

OUTER FOLD 2/5
Train size: 2246, Test size: 609
Class distribution in test set: {'non-void': np.int64(358), 'void': np.int64(251)}

--- Optimizing RF ---


[I 2025-09-02 01:59:32,739] Trial 0 finished with value: 0.6745394800224488 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6745394800224488.
[I 2025-09-02 01:59:34,472] Trial 1 finished with value: 0.6800386550549232 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6800386550549232.
[I 2025-09-02 01:59:45,871] Trial 2 finished with value: 0.6546135913041091 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6800386550549232.
[I 2025-09-02 01:59:58,825] Trial 3 finished with value: 0.6402358457938376 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 226, 'max_depth': 3, 'min_samples_split': 17, 'min_samples_leaf': 6, 'max_features': None, 'bootstrap': False}
Best rf F1 score (positive class): 0.6920


[I 2025-09-02 02:05:13,825] A new study created in memory with name: no-name-8772c3f9-67d3-4bb8-a585-88ccc8666c43


rf test accuracy: 0.6601
rf test F1 (positive): 0.6362

--- Optimizing XGB ---


[I 2025-09-02 02:05:17,031] Trial 0 finished with value: 0.6200960334809333 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.6200960334809333.
[I 2025-09-02 02:05:19,231] Trial 1 finished with value: 0.5946358086234499 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.6200960334809333.
[I 2025-09-02 02:05:21,571] Trial 2 finished with value: 0.6174528660194765 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 59, 'max_depth': 3, 'learning_rate': 0.026081210767269766, 'subsample': 0.6311631983195253, 'colsample_bytree': 0.8875328199700073, 'min_child_weight': 7, 'gamma': 0.7502249159582844, 'reg_alpha': 0.6066132027165467, 'reg_lambda': 1.2674105051583902}
Best xgb F1 score (positive class): 0.6802
xgb test accuracy: 0.7011
xgb test F1 (positive): 0.6445

--- Optimizing DT ---


[I 2025-09-02 02:07:12,734] A new study created in memory with name: no-name-17886764-4f56-448c-a020-ba83f6abe3ee
[I 2025-09-02 02:07:12,783] Trial 0 finished with value: 0.5358382885555072 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5358382885555072.
[I 2025-09-02 02:07:13,358] Trial 1 finished with value: 0.5505459150126449 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 1 with value: 0.5505459150126449.
[I 2025-09-02 02:07:13,408] Trial 2 finished with value: 0.6408132770583417 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.6408132770583417.
[I 2025-09-02 02:07:13,440] Trial 3 finished with value: 0.6232143705

Best dt params: {'criterion': 'entropy', 'max_depth': 2, 'min_samples_split': 17, 'min_samples_leaf': 3, 'max_features': None, 'splitter': 'best'}
Best dt F1 score (positive class): 0.6779
dt test accuracy: 0.6913
dt test F1 (positive): 0.5785

OUTER FOLD 3/5
Train size: 2285, Test size: 570
Class distribution in test set: {'non-void': np.int64(271), 'void': np.int64(299)}

--- Optimizing RF ---


[I 2025-09-02 02:07:22,129] Trial 0 finished with value: 0.5629849472377405 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.5629849472377405.
[I 2025-09-02 02:07:23,885] Trial 1 finished with value: 0.6010650973430688 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6010650973430688.
[I 2025-09-02 02:07:35,684] Trial 2 finished with value: 0.5441967881426383 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6010650973430688.
[I 2025-09-02 02:07:49,234] Trial 3 finished with value: 0.5534307815482006 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 289, 'max_depth': 3, 'min_samples_split': 6, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}
Best rf F1 score (positive class): 0.6273


[I 2025-09-02 02:10:31,037] A new study created in memory with name: no-name-8cd5dff0-c4e1-4a22-bdca-9247c0e2fbd7


rf test accuracy: 0.6877
rf test F1 (positive): 0.6337

--- Optimizing XGB ---


[I 2025-09-02 02:10:34,122] Trial 0 finished with value: 0.5415698317292367 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5415698317292367.
[I 2025-09-02 02:10:36,333] Trial 1 finished with value: 0.5507508197303156 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 1 with value: 0.5507508197303156.
[I 2025-09-02 02:10:38,410] Trial 2 finished with value: 0.5665681512182726 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 240, 'max_depth': 3, 'learning_rate': 0.014708957428729979, 'subsample': 0.8352045763221544, 'colsample_bytree': 0.6976812553800048, 'min_child_weight': 2, 'gamma': 2.345775160917182, 'reg_alpha': 0.4577880727857463, 'reg_lambda': 1.4802712522755255}
Best xgb F1 score (positive class): 0.6184


[I 2025-09-02 02:12:42,034] A new study created in memory with name: no-name-4fc90da4-e900-42a5-8c01-727bc230a618
[I 2025-09-02 02:12:42,086] Trial 0 finished with value: 0.4928576107805464 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.4928576107805464.


xgb test accuracy: 0.7140
xgb test F1 (positive): 0.6720

--- Optimizing DT ---


[I 2025-09-02 02:12:42,683] Trial 1 finished with value: 0.4721871131596697 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.4928576107805464.
[I 2025-09-02 02:12:42,736] Trial 2 finished with value: 0.49328240588270483 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.49328240588270483.
[I 2025-09-02 02:12:42,768] Trial 3 finished with value: 0.6286562506278919 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.6286562506278919.
[I 2025-09-02 02:12:42,797] Trial 4 finished with value: 0.41919492516965273 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'm

Best dt params: {'criterion': 'gini', 'max_depth': 1, 'min_samples_split': 17, 'min_samples_leaf': 8, 'max_features': 'log2', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6604
dt test accuracy: 0.6789
dt test F1 (positive): 0.6288

OUTER FOLD 4/5
Train size: 2299, Test size: 556
Class distribution in test set: {'non-void': np.int64(350), 'void': np.int64(206)}

--- Optimizing RF ---


[I 2025-09-02 02:12:47,001] Trial 0 finished with value: 0.5661632062295671 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.5661632062295671.
[I 2025-09-02 02:12:48,695] Trial 1 finished with value: 0.6120584280650289 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6120584280650289.
[I 2025-09-02 02:12:59,271] Trial 2 finished with value: 0.5586604168812884 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6120584280650289.
[I 2025-09-02 02:13:11,559] Trial 3 finished with value: 0.5489686645292825 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}
Best rf F1 score (positive class): 0.6121


[I 2025-09-02 02:16:03,802] A new study created in memory with name: no-name-2fdc1ddd-b04c-4437-ac69-660fc6715147


rf test accuracy: 0.8112
rf test F1 (positive): 0.7826

--- Optimizing XGB ---


[I 2025-09-02 02:16:07,293] Trial 0 finished with value: 0.5456391095760992 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5456391095760992.
[I 2025-09-02 02:16:09,504] Trial 1 finished with value: 0.5230522452726406 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.5456391095760992.
[I 2025-09-02 02:16:11,635] Trial 2 finished with value: 0.5482122454300709 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 427, 'max_depth': 6, 'learning_rate': 0.06891126480124775, 'subsample': 0.6169612157954633, 'colsample_bytree': 0.6999164353733937, 'min_child_weight': 9, 'gamma': 4.9752182664454105, 'reg_alpha': 1.8662091623522938, 'reg_lambda': 0.22271228250458774}
Best xgb F1 score (positive class): 0.5782


[I 2025-09-02 02:19:05,016] A new study created in memory with name: no-name-fa11bd01-b62b-4074-bf52-a186fcd06253
[I 2025-09-02 02:19:05,067] Trial 0 finished with value: 0.44651826841998493 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.44651826841998493.


xgb test accuracy: 0.8112
xgb test F1 (positive): 0.7835

--- Optimizing DT ---


[I 2025-09-02 02:19:05,661] Trial 1 finished with value: 0.5265541792936788 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 1 with value: 0.5265541792936788.
[I 2025-09-02 02:19:05,712] Trial 2 finished with value: 0.5480026817590965 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.5480026817590965.
[I 2025-09-02 02:19:05,743] Trial 3 finished with value: 0.5745149384708472 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.5745149384708472.
[I 2025-09-02 02:19:05,770] Trial 4 finished with value: 0.6246986364246289 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_

Best dt params: {'criterion': 'gini', 'max_depth': 3, 'min_samples_split': 14, 'min_samples_leaf': 4, 'max_features': 'log2', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6371
dt test accuracy: 0.7302
dt test F1 (positive): 0.7024

OUTER FOLD 5/5
Train size: 2330, Test size: 525
Class distribution in test set: {'non-void': np.int64(276), 'void': np.int64(249)}

--- Optimizing RF ---


[I 2025-09-02 02:19:10,200] Trial 0 finished with value: 0.6008611931931971 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6008611931931971.
[I 2025-09-02 02:19:11,989] Trial 1 finished with value: 0.6571990940839129 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6571990940839129.
[I 2025-09-02 02:19:23,803] Trial 2 finished with value: 0.6193741665439778 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6571990940839129.
[I 2025-09-02 02:19:37,764] Trial 3 finished with value: 0.6121591909198933 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 211, 'max_depth': 3, 'min_samples_split': 19, 'min_samples_leaf': 10, 'max_features': None, 'bootstrap': True}
Best rf F1 score (positive class): 0.6816


[I 2025-09-02 02:24:26,794] A new study created in memory with name: no-name-d1619f6e-d915-4f21-a1f9-cc3939232211


rf test accuracy: 0.6610
rf test F1 (positive): 0.6454

--- Optimizing XGB ---


[I 2025-09-02 02:24:29,857] Trial 0 finished with value: 0.5876538135679895 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5876538135679895.
[I 2025-09-02 02:24:32,036] Trial 1 finished with value: 0.5569883573676342 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.5876538135679895.
[I 2025-09-02 02:24:34,106] Trial 2 finished with value: 0.5954544351110287 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 216, 'max_depth': 3, 'learning_rate': 0.012659669619196259, 'subsample': 0.8278316372613039, 'colsample_bytree': 0.694572380303584, 'min_child_weight': 9, 'gamma': 0.12695282557417278, 'reg_alpha': 1.267099305139135, 'reg_lambda': 1.7916690508747795}
Best xgb F1 score (positive class): 0.6351


[I 2025-09-02 02:27:46,100] A new study created in memory with name: no-name-7da62eba-8f8a-496b-b5d1-60ecf7204ef5
[I 2025-09-02 02:27:46,152] Trial 0 finished with value: 0.5253980930852881 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5253980930852881.


xgb test accuracy: 0.6610
xgb test F1 (positive): 0.6322

--- Optimizing DT ---


[I 2025-09-02 02:27:46,745] Trial 1 finished with value: 0.5656252012599773 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 1 with value: 0.5656252012599773.
[I 2025-09-02 02:27:46,799] Trial 2 finished with value: 0.5705019209120533 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.5705019209120533.
[I 2025-09-02 02:27:46,832] Trial 3 finished with value: 0.6397499325457751 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.6397499325457751.
[I 2025-09-02 02:27:46,861] Trial 4 finished with value: 0.41338030666532805 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max

Best dt params: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 13, 'min_samples_leaf': 5, 'max_features': None, 'splitter': 'best'}
Best dt F1 score (positive class): 0.6824
dt test accuracy: 0.6514
dt test F1 (positive): 0.6405

BINARY NESTED CROSS-VALIDATION RESULTS SUMMARY
Positive class: 'void'

RF Results:
----------------------------------------
accuracy          : 0.7048 Â± 0.0623
f1_positive       : 0.6610 Â± 0.0694
precision_positive: 0.6550 Â± 0.1070
recall_positive   : 0.6935 Â± 0.1462
f1_macro          : 0.6985 Â± 0.0623
Individual fold accuracies: ['0.7042', '0.6601', '0.6877', '0.8112', '0.6610']
Individual fold F1 (pos): ['0.6071', '0.6362', '0.6337', '0.7826', '0.6454']

XGB Results:
----------------------------------------
accuracy          : 0.7267 Â± 0.0562
f1_positive       : 0.6786 Â± 0.0606
precision_positive: 0.6840 Â± 0.0926
recall_positive   : 0.6940 Â± 0.1403
f1_macro          : 0.7197 Â± 0.0557
Individual fold accuracies: ['0.7462', '0.7011', '0.7

[I 2025-09-02 02:27:54,392] Trial 0 finished with value: 0.6123015873015873 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6123015873015873.
[I 2025-09-02 02:27:55,308] Trial 1 finished with value: 0.6256817680254737 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6256817680254737.
[I 2025-09-02 02:27:56,875] Trial 2 finished with value: 0.5810399278141213 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6256817680254737.
[I 2025-09-02 02:27:58,378] Trial 3 finished with value: 0.6029482609114558 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 100, 'max_depth': 4, 'min_samples_split': 12, 'min_samples_leaf': 2, 'max_features': 'log2', 'bootstrap': True}
Best rf F1 score (positive class): 0.6465
rf test accuracy: 0.7797
rf test F1 (positive): 0.7111

--- Optimizing XGB ---


[I 2025-09-02 02:28:32,753] Trial 0 finished with value: 0.607496866006321 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.607496866006321.
[I 2025-09-02 02:28:34,349] Trial 1 finished with value: 0.5876006441223832 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.607496866006321.
[I 2025-09-02 02:28:35,400] Trial 2 finished with value: 0.6020906464168876 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.655

Best xgb params: {'n_estimators': 484, 'max_depth': 8, 'learning_rate': 0.01980745776609054, 'subsample': 0.9986738459939086, 'colsample_bytree': 0.8212713156959469, 'min_child_weight': 6, 'gamma': 4.5343687078629396, 'reg_alpha': 1.1510985611864628, 'reg_lambda': 1.3363971375574248}
Best xgb F1 score (positive class): 0.6484


[I 2025-09-02 02:29:56,721] A new study created in memory with name: no-name-58fa64dc-31fe-4d68-91b6-e5c38a464d90
[I 2025-09-02 02:29:56,742] Trial 0 finished with value: 0.5168093668466152 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5168093668466152.
[I 2025-09-02 02:29:56,820] Trial 1 finished with value: 0.5251709051134811 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 1 with value: 0.5251709051134811.
[I 2025-09-02 02:29:56,840] Trial 2 finished with value: 0.5236424394319131 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 1 with value: 0.5251709051134811.
[I 2025-09-02 02:29:56,857] Trial 3 finished with value: 0.5342140888

xgb test accuracy: 0.7797
xgb test F1 (positive): 0.6750

--- Optimizing DT ---


[I 2025-09-02 02:29:56,928] Trial 7 finished with value: 0.578072136872749 and parameters: {'criterion': 'gini', 'max_depth': 1, 'min_samples_split': 17, 'min_samples_leaf': 8, 'max_features': 'log2', 'splitter': 'best'}. Best is trial 4 with value: 0.6247524752475248.
[I 2025-09-02 02:29:56,946] Trial 8 finished with value: 0.43724472135687087 and parameters: {'criterion': 'gini', 'max_depth': 7, 'min_samples_split': 3, 'min_samples_leaf': 4, 'max_features': 'log2', 'splitter': 'best'}. Best is trial 4 with value: 0.6247524752475248.
[I 2025-09-02 02:29:56,964] Trial 9 finished with value: 0.40731204789373426 and parameters: {'criterion': 'entropy', 'max_depth': 16, 'min_samples_split': 12, 'min_samples_leaf': 8, 'max_features': 'log2', 'splitter': 'random'}. Best is trial 4 with value: 0.6247524752475248.
[I 2025-09-02 02:29:56,994] Trial 10 finished with value: 0.5947671002142011 and parameters: {'criterion': 'entropy', 'max_depth': 11, 'min_samples_split': 15, 'min_samples_leaf': 1

Best dt params: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 17, 'min_samples_leaf': 7, 'max_features': None, 'splitter': 'best'}
Best dt F1 score (positive class): 0.6827
dt test accuracy: 0.7288
dt test F1 (positive): 0.6279

OUTER FOLD 2/5
Train size: 361, Test size: 104
Class distribution in test set: {'non-void': np.int64(59), 'void': np.int64(45)}

--- Optimizing RF ---


[I 2025-09-02 02:29:59,354] Trial 0 finished with value: 0.6240457080136027 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6240457080136027.
[I 2025-09-02 02:30:00,242] Trial 1 finished with value: 0.6060086834776368 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 0 with value: 0.6240457080136027.
[I 2025-09-02 02:30:01,761] Trial 2 finished with value: 0.6202318754042891 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 0 with value: 0.6240457080136027.
[I 2025-09-02 02:30:03,255] Trial 3 finished with value: 0.6234753550543024 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 223, 'max_depth': 13, 'min_samples_split': 20, 'min_samples_leaf': 4, 'max_features': None, 'bootstrap': True}
Best rf F1 score (positive class): 0.6565


[I 2025-09-02 02:31:18,985] A new study created in memory with name: no-name-c5b32e54-7761-417c-8461-2ebb1a80fc75


rf test accuracy: 0.7596
rf test F1 (positive): 0.7059

--- Optimizing XGB ---


[I 2025-09-02 02:31:20,056] Trial 0 finished with value: 0.5945717915951793 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5945717915951793.
[I 2025-09-02 02:31:21,624] Trial 1 finished with value: 0.5853901996370235 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.5945717915951793.
[I 2025-09-02 02:31:22,553] Trial 2 finished with value: 0.5941402755412417 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 210, 'max_depth': 5, 'learning_rate': 0.06333268775321842, 'subsample': 0.6563696899899051, 'colsample_bytree': 0.9208787923016158, 'min_child_weight': 1, 'gamma': 4.9344346830025865, 'reg_alpha': 1.5444895385933148, 'reg_lambda': 0.3974313630683448}
Best xgb F1 score (positive class): 0.6612


[I 2025-09-02 02:32:26,624] A new study created in memory with name: no-name-f489dfed-9367-44dd-8660-fd4720b4ee39
[I 2025-09-02 02:32:26,646] Trial 0 finished with value: 0.4274172790301823 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.4274172790301823.
[I 2025-09-02 02:32:26,722] Trial 1 finished with value: 0.5702984283392875 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 1 with value: 0.5702984283392875.
[I 2025-09-02 02:32:26,741] Trial 2 finished with value: 0.49829829829829825 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 1 with value: 0.5702984283392875.
[I 2025-09-02 02:32:26,758] Trial 3 finished with value: 0.524425178

xgb test accuracy: 0.7115
xgb test F1 (positive): 0.6341

--- Optimizing DT ---


[I 2025-09-02 02:32:26,829] Trial 7 finished with value: 0.6128796910118857 and parameters: {'criterion': 'gini', 'max_depth': 1, 'min_samples_split': 17, 'min_samples_leaf': 8, 'max_features': 'log2', 'splitter': 'best'}. Best is trial 5 with value: 0.6258096441975091.
[I 2025-09-02 02:32:26,848] Trial 8 finished with value: 0.50953316231094 and parameters: {'criterion': 'gini', 'max_depth': 7, 'min_samples_split': 3, 'min_samples_leaf': 4, 'max_features': 'log2', 'splitter': 'best'}. Best is trial 5 with value: 0.6258096441975091.
[I 2025-09-02 02:32:26,866] Trial 9 finished with value: 0.5879248924615273 and parameters: {'criterion': 'entropy', 'max_depth': 16, 'min_samples_split': 12, 'min_samples_leaf': 8, 'max_features': 'log2', 'splitter': 'random'}. Best is trial 5 with value: 0.6258096441975091.
[I 2025-09-02 02:32:26,891] Trial 10 finished with value: 0.614064935763049 and parameters: {'criterion': 'gini', 'max_depth': 12, 'min_samples_split': 15, 'min_samples_leaf': 7, 'max_

Best dt params: {'criterion': 'gini', 'max_depth': 8, 'min_samples_split': 10, 'min_samples_leaf': 8, 'max_features': 'sqrt', 'splitter': 'random'}
Best dt F1 score (positive class): 0.6463
dt test accuracy: 0.6154
dt test F1 (positive): 0.4872

OUTER FOLD 3/5
Train size: 380, Test size: 85
Class distribution in test set: {'non-void': np.int64(49), 'void': np.int64(36)}

--- Optimizing RF ---


[I 2025-09-02 02:32:28,693] Trial 0 finished with value: 0.6431376470980431 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6431376470980431.
[I 2025-09-02 02:32:29,619] Trial 1 finished with value: 0.6556596540375258 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6556596540375258.
[I 2025-09-02 02:32:31,250] Trial 2 finished with value: 0.6465164252398296 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6556596540375258.
[I 2025-09-02 02:32:32,808] Trial 3 finished with value: 0.6598255009469962 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 376, 'max_depth': 3, 'min_samples_split': 5, 'min_samples_leaf': 7, 'max_features': 'sqrt', 'bootstrap': False}
Best rf F1 score (positive class): 0.6620


[I 2025-09-02 02:33:34,158] A new study created in memory with name: no-name-5cc07214-6afb-4c84-9de7-f8f500581a1e


rf test accuracy: 0.6824
rf test F1 (positive): 0.5714

--- Optimizing XGB ---


[I 2025-09-02 02:33:35,659] Trial 0 finished with value: 0.6062268726872687 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.6062268726872687.
[I 2025-09-02 02:33:37,395] Trial 1 finished with value: 0.5960083931098424 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.6062268726872687.
[I 2025-09-02 02:33:38,392] Trial 2 finished with value: 0.6124135469929862 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 392, 'max_depth': 12, 'learning_rate': 0.025821988338135073, 'subsample': 0.6723548825969252, 'colsample_bytree': 0.7306136349663493, 'min_child_weight': 1, 'gamma': 4.71689757492779, 'reg_alpha': 1.87024476301938, 'reg_lambda': 0.11211254675572382}
Best xgb F1 score (positive class): 0.6528


[I 2025-09-02 02:34:53,931] A new study created in memory with name: no-name-651f8725-1053-401e-982d-18f85adf8abc
[I 2025-09-02 02:34:53,953] Trial 0 finished with value: 0.6314200100271666 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.6314200100271666.
[I 2025-09-02 02:34:54,033] Trial 1 finished with value: 0.5005316210271752 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.6314200100271666.
[I 2025-09-02 02:34:54,053] Trial 2 finished with value: 0.5561857429055764 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 0 with value: 0.6314200100271666.
[I 2025-09-02 02:34:54,071] Trial 3 finished with value: 0.5563787833

xgb test accuracy: 0.6824
xgb test F1 (positive): 0.5846

--- Optimizing DT ---


[I 2025-09-02 02:34:54,143] Trial 7 finished with value: 0.6518513436946585 and parameters: {'criterion': 'gini', 'max_depth': 1, 'min_samples_split': 17, 'min_samples_leaf': 8, 'max_features': 'log2', 'splitter': 'best'}. Best is trial 7 with value: 0.6518513436946585.
[I 2025-09-02 02:34:54,164] Trial 8 finished with value: 0.506447027440212 and parameters: {'criterion': 'gini', 'max_depth': 7, 'min_samples_split': 3, 'min_samples_leaf': 4, 'max_features': 'log2', 'splitter': 'best'}. Best is trial 7 with value: 0.6518513436946585.
[I 2025-09-02 02:34:54,182] Trial 9 finished with value: 0.5594358539572314 and parameters: {'criterion': 'entropy', 'max_depth': 16, 'min_samples_split': 12, 'min_samples_leaf': 8, 'max_features': 'log2', 'splitter': 'random'}. Best is trial 7 with value: 0.6518513436946585.
[I 2025-09-02 02:34:54,210] Trial 10 finished with value: 0.5196324143692564 and parameters: {'criterion': 'gini', 'max_depth': 11, 'min_samples_split': 15, 'min_samples_leaf': 8, 'ma

Best dt params: {'criterion': 'gini', 'max_depth': 1, 'min_samples_split': 18, 'min_samples_leaf': 3, 'max_features': None, 'splitter': 'best'}
Best dt F1 score (positive class): 0.7350
dt test accuracy: 0.6588
dt test F1 (positive): 0.5672

OUTER FOLD 4/5
Train size: 399, Test size: 66
Class distribution in test set: {'non-void': np.int64(31), 'void': np.int64(35)}

--- Optimizing RF ---


[I 2025-09-02 02:34:56,828] Trial 0 finished with value: 0.6526733500417711 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6526733500417711.
[I 2025-09-02 02:34:57,821] Trial 1 finished with value: 0.6391713947502714 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 0 with value: 0.6526733500417711.
[I 2025-09-02 02:34:59,516] Trial 2 finished with value: 0.6483935515535922 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 0 with value: 0.6526733500417711.
[I 2025-09-02 02:35:01,126] Trial 3 finished with value: 0.6467969165337587 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 458, 'max_depth': 11, 'min_samples_split': 8, 'min_samples_leaf': 4, 'max_features': 'log2', 'bootstrap': True}
Best rf F1 score (positive class): 0.6733


[I 2025-09-02 02:36:03,346] A new study created in memory with name: no-name-c369624c-af4e-4fac-9306-f64eea239b8c


rf test accuracy: 0.5455
rf test F1 (positive): 0.5000

--- Optimizing XGB ---


[I 2025-09-02 02:36:04,458] Trial 0 finished with value: 0.6536280233527939 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.6536280233527939.
[I 2025-09-02 02:36:06,110] Trial 1 finished with value: 0.6607142857142857 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 1 with value: 0.6607142857142857.
[I 2025-09-02 02:36:07,134] Trial 2 finished with value: 0.6516032472746688 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 244, 'max_depth': 9, 'learning_rate': 0.16252032871377525, 'subsample': 0.7837800205477121, 'colsample_bytree': 0.7052870675495496, 'min_child_weight': 2, 'gamma': 1.005189194208213, 'reg_alpha': 1.4650857571370968, 'reg_lambda': 1.5028355633225892}
Best xgb F1 score (positive class): 0.6865


[I 2025-09-02 02:37:05,672] A new study created in memory with name: no-name-29d66368-8e31-4cb7-9a51-f5790bb1b8b6
[I 2025-09-02 02:37:05,694] Trial 0 finished with value: 0.566180339631667 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.566180339631667.
[I 2025-09-02 02:37:05,778] Trial 1 finished with value: 0.5905228758169935 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 1 with value: 0.5905228758169935.
[I 2025-09-02 02:37:05,800] Trial 2 finished with value: 0.5923168971949461 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.5923168971949461.
[I 2025-09-02 02:37:05,819] Trial 3 finished with value: 0.644269881865

xgb test accuracy: 0.5303
xgb test F1 (positive): 0.4918

--- Optimizing DT ---


[I 2025-09-02 02:37:05,877] Trial 6 finished with value: 0.5574795574795575 and parameters: {'criterion': 'gini', 'max_depth': 17, 'min_samples_split': 8, 'min_samples_leaf': 3, 'max_features': None, 'splitter': 'random'}. Best is trial 3 with value: 0.6442698818657898.
[I 2025-09-02 02:37:05,894] Trial 7 finished with value: 0.6687176743356519 and parameters: {'criterion': 'gini', 'max_depth': 1, 'min_samples_split': 17, 'min_samples_leaf': 8, 'max_features': 'log2', 'splitter': 'best'}. Best is trial 7 with value: 0.6687176743356519.
[I 2025-09-02 02:37:05,916] Trial 8 finished with value: 0.518853930083755 and parameters: {'criterion': 'gini', 'max_depth': 7, 'min_samples_split': 3, 'min_samples_leaf': 4, 'max_features': 'log2', 'splitter': 'best'}. Best is trial 7 with value: 0.6687176743356519.
[I 2025-09-02 02:37:05,933] Trial 9 finished with value: 0.6286659700452804 and parameters: {'criterion': 'entropy', 'max_depth': 16, 'min_samples_split': 12, 'min_samples_leaf': 8, 'max_fe

Best dt params: {'criterion': 'gini', 'max_depth': 3, 'min_samples_split': 17, 'min_samples_leaf': 9, 'max_features': 'log2', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6776
dt test accuracy: 0.6061
dt test F1 (positive): 0.5806

OUTER FOLD 5/5
Train size: 373, Test size: 92
Class distribution in test set: {'non-void': np.int64(59), 'void': np.int64(33)}

--- Optimizing RF ---


[I 2025-09-02 02:37:07,972] Trial 0 finished with value: 0.6359751008784382 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6359751008784382.
[I 2025-09-02 02:37:08,865] Trial 1 finished with value: 0.6373058044671644 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6373058044671644.
[I 2025-09-02 02:37:10,405] Trial 2 finished with value: 0.619485903814262 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6373058044671644.
[I 2025-09-02 02:37:11,905] Trial 3 finished with value: 0.6284808215040772 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_features

Best rf params: {'n_estimators': 435, 'max_depth': 3, 'min_samples_split': 18, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'bootstrap': False}
Best rf F1 score (positive class): 0.6471


[I 2025-09-02 02:38:07,991] A new study created in memory with name: no-name-d4c447d6-006e-4e7c-8716-35ca109625bd


rf test accuracy: 0.7935
rf test F1 (positive): 0.7765

--- Optimizing XGB ---


[I 2025-09-02 02:38:09,941] Trial 0 finished with value: 0.6046525200177417 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.6046525200177417.
[I 2025-09-02 02:38:11,541] Trial 1 finished with value: 0.6260360316259612 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 1 with value: 0.6260360316259612.
[I 2025-09-02 02:38:12,497] Trial 2 finished with value: 0.6039272196550346 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 476, 'max_depth': 9, 'learning_rate': 0.029323105618991638, 'subsample': 0.6071847502459278, 'colsample_bytree': 0.9924283304357214, 'min_child_weight': 7, 'gamma': 4.865188803848123, 'reg_alpha': 1.2481670543447305, 'reg_lambda': 0.07959921215402954}
Best xgb F1 score (positive class): 0.6399


[I 2025-09-02 02:39:30,728] A new study created in memory with name: no-name-921c3d02-1685-423d-baf2-f2846e48997e
[I 2025-09-02 02:39:30,749] Trial 0 finished with value: 0.596512377991392 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.596512377991392.
[I 2025-09-02 02:39:30,829] Trial 1 finished with value: 0.5393944244364413 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.596512377991392.
[I 2025-09-02 02:39:30,849] Trial 2 finished with value: 0.5592494168364485 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 0 with value: 0.596512377991392.
[I 2025-09-02 02:39:30,867] Trial 3 finished with value: 0.63237540773772

xgb test accuracy: 0.8261
xgb test F1 (positive): 0.7949

--- Optimizing DT ---


[I 2025-09-02 02:39:30,940] Trial 7 finished with value: 0.6585286749260706 and parameters: {'criterion': 'gini', 'max_depth': 1, 'min_samples_split': 17, 'min_samples_leaf': 8, 'max_features': 'log2', 'splitter': 'best'}. Best is trial 7 with value: 0.6585286749260706.
[I 2025-09-02 02:39:30,962] Trial 8 finished with value: 0.5477192021770875 and parameters: {'criterion': 'gini', 'max_depth': 7, 'min_samples_split': 3, 'min_samples_leaf': 4, 'max_features': 'log2', 'splitter': 'best'}. Best is trial 7 with value: 0.6585286749260706.
[I 2025-09-02 02:39:30,980] Trial 9 finished with value: 0.48430892340989024 and parameters: {'criterion': 'entropy', 'max_depth': 16, 'min_samples_split': 12, 'min_samples_leaf': 8, 'max_features': 'log2', 'splitter': 'random'}. Best is trial 7 with value: 0.6585286749260706.
[I 2025-09-02 02:39:31,009] Trial 10 finished with value: 0.6128154408679494 and parameters: {'criterion': 'gini', 'max_depth': 11, 'min_samples_split': 15, 'min_samples_leaf': 8, '

Best dt params: {'criterion': 'gini', 'max_depth': 3, 'min_samples_split': 14, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6776
dt test accuracy: 0.6630
dt test F1 (positive): 0.6804

BINARY NESTED CROSS-VALIDATION RESULTS SUMMARY
Positive class: 'void'

RF Results:
----------------------------------------
accuracy          : 0.7121 Â± 0.1026
f1_positive       : 0.6530 Â± 0.1134
precision_positive: 0.6636 Â± 0.0556
recall_positive   : 0.6714 Â± 0.2261
f1_macro          : 0.7023 Â± 0.1028
Individual fold accuracies: ['0.7797', '0.7596', '0.6824', '0.5455', '0.7935']
Individual fold F1 (pos): ['0.7111', '0.7059', '0.5714', '0.5000', '0.7765']

XGB Results:
----------------------------------------
accuracy          : 0.7060 Â± 0.1133
f1_positive       : 0.6361 Â± 0.1120
precision_positive: 0.6668 Â± 0.0545
recall_positive   : 0.6233 Â± 0.1933
f1_macro          : 0.6931 Â± 0.1102
Individual fold accuracies: ['0.7797', '0.7115', '0

[I 2025-09-02 02:39:33,153] Trial 0 finished with value: 0.5504587155963303 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.5504587155963303.
[I 2025-09-02 02:39:34,290] Trial 1 finished with value: 0.5533764533764534 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.5533764533764534.
[I 2025-09-02 02:39:37,963] Trial 2 finished with value: 0.5415733793092284 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.5533764533764534.
[I 2025-09-02 02:39:41,448] Trial 3 finished with value: 0.54193632217627 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_features'

Best rf params: {'n_estimators': 126, 'max_depth': 4, 'min_samples_split': 7, 'min_samples_leaf': 1, 'max_features': 'sqrt', 'bootstrap': True}
Best rf F1 score (positive class): 0.5709
rf test accuracy: 0.7459
rf test F1 (positive): 0.7480

--- Optimizing XGB ---


[I 2025-09-02 02:40:35,003] Trial 0 finished with value: 0.5400087974114056 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5400087974114056.
[I 2025-09-02 02:40:36,806] Trial 1 finished with value: 0.5516795711811963 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 1 with value: 0.5516795711811963.
[I 2025-09-02 02:40:38,291] Trial 2 finished with value: 0.5671225831973495 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.6557975442608167, 'colsample_bytree': 0.7168578594140873, 'min_child_weight': 4, 'gamma': 2.28034992108518, 'reg_alpha': 1.5703519227860272, 'reg_lambda': 0.39934756431671947}
Best xgb F1 score (positive class): 0.5671


[I 2025-09-02 02:42:02,802] A new study created in memory with name: no-name-5d41a789-0ed6-4063-998c-b12a065337b5
[I 2025-09-02 02:42:02,831] Trial 0 finished with value: 0.4404663026337204 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.4404663026337204.


xgb test accuracy: 0.5656
xgb test F1 (positive): 0.4752

--- Optimizing DT ---


[I 2025-09-02 02:42:03,007] Trial 1 finished with value: 0.500196050973253 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 1 with value: 0.500196050973253.
[I 2025-09-02 02:42:03,036] Trial 2 finished with value: 0.46937064912593285 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 1 with value: 0.500196050973253.
[I 2025-09-02 02:42:03,058] Trial 3 finished with value: 0.47036590734546063 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 1 with value: 0.500196050973253.
[I 2025-09-02 02:42:03,078] Trial 4 finished with value: 0.32890167252583363 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_f

Best dt params: {'criterion': 'gini', 'max_depth': 1, 'min_samples_split': 17, 'min_samples_leaf': 8, 'max_features': 'log2', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6716
dt test accuracy: 0.6721
dt test F1 (positive): 0.7500

OUTER FOLD 2/5
Train size: 732, Test size: 173
Class distribution in test set: {'non-void': np.int64(100), 'void': np.int64(73)}

--- Optimizing RF ---


[I 2025-09-02 02:42:06,616] Trial 0 finished with value: 0.6721013142902207 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6721013142902207.
[I 2025-09-02 02:42:07,581] Trial 1 finished with value: 0.6779202736143696 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6779202736143696.
[I 2025-09-02 02:42:10,669] Trial 2 finished with value: 0.6579806687565308 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6779202736143696.
[I 2025-09-02 02:42:13,695] Trial 3 finished with value: 0.6501944948443349 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 458, 'max_depth': 5, 'min_samples_split': 16, 'min_samples_leaf': 1, 'max_features': 'log2', 'bootstrap': True}
Best rf F1 score (positive class): 0.7004


[I 2025-09-02 02:43:35,985] A new study created in memory with name: no-name-fdebe3d2-6f9c-4c5e-9694-e4496806a3e4


rf test accuracy: 0.5780
rf test F1 (positive): 0.4341

--- Optimizing XGB ---


[I 2025-09-02 02:43:37,876] Trial 0 finished with value: 0.6409351204975845 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.6409351204975845.
[I 2025-09-02 02:43:39,529] Trial 1 finished with value: 0.6403690837721119 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.6409351204975845.
[I 2025-09-02 02:43:40,705] Trial 2 finished with value: 0.6351459091363485 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 448, 'max_depth': 9, 'learning_rate': 0.018655304848837168, 'subsample': 0.6921895407093429, 'colsample_bytree': 0.7311941285873849, 'min_child_weight': 10, 'gamma': 2.696132260582253, 'reg_alpha': 1.453929503576089, 'reg_lambda': 1.408398037906978}
Best xgb F1 score (positive class): 0.6816


[I 2025-09-02 02:45:12,963] A new study created in memory with name: no-name-8cbbc885-21b7-472f-9051-8953dd6d661c
[I 2025-09-02 02:45:12,990] Trial 0 finished with value: 0.551947665774606 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.551947665774606.
[I 2025-09-02 02:45:13,149] Trial 1 finished with value: 0.5943565511655163 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 1 with value: 0.5943565511655163.


xgb test accuracy: 0.6243
xgb test F1 (positive): 0.4882

--- Optimizing DT ---


[I 2025-09-02 02:45:13,176] Trial 2 finished with value: 0.5995970063327576 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.5995970063327576.
[I 2025-09-02 02:45:13,198] Trial 3 finished with value: 0.6123164702543652 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.6123164702543652.
[I 2025-09-02 02:45:13,219] Trial 4 finished with value: 0.4094198144611452 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.6123164702543652.
[I 2025-09-02 02:45:13,245] Trial 5 finished with value: 0.5421809490223738 and parameters: {'criterion': 'gini', 'max_depth': 19, 'min_samples_split': 19, 'min_samples_leaf': 6, 'max_

Best dt params: {'criterion': 'gini', 'max_depth': 5, 'min_samples_split': 10, 'min_samples_leaf': 7, 'max_features': None, 'splitter': 'best'}
Best dt F1 score (positive class): 0.7040
dt test accuracy: 0.6474
dt test F1 (positive): 0.5414

OUTER FOLD 3/5
Train size: 620, Test size: 285
Class distribution in test set: {'non-void': np.int64(184), 'void': np.int64(101)}

--- Optimizing RF ---


[I 2025-09-02 02:45:16,244] Trial 0 finished with value: 0.5764118957667345 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.5764118957667345.
[I 2025-09-02 02:45:17,228] Trial 1 finished with value: 0.618558201058201 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.618558201058201.
[I 2025-09-02 02:45:20,085] Trial 2 finished with value: 0.6034335393242354 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.618558201058201.
[I 2025-09-02 02:45:22,789] Trial 3 finished with value: 0.5935130159598511 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_features':

Best rf params: {'n_estimators': 232, 'max_depth': 3, 'min_samples_split': 7, 'min_samples_leaf': 1, 'max_features': None, 'bootstrap': False}
Best rf F1 score (positive class): 0.6774


[I 2025-09-02 02:46:18,343] A new study created in memory with name: no-name-96ccf5c9-5106-4e3f-b636-795d113ae99b


rf test accuracy: 0.7825
rf test F1 (positive): 0.7130

--- Optimizing XGB ---


[I 2025-09-02 02:46:20,101] Trial 0 finished with value: 0.5614930209622718 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5614930209622718.
[I 2025-09-02 02:46:21,822] Trial 1 finished with value: 0.5841247876710592 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 1 with value: 0.5841247876710592.
[I 2025-09-02 02:46:22,993] Trial 2 finished with value: 0.590265867949341 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.6

Best xgb params: {'n_estimators': 397, 'max_depth': 4, 'learning_rate': 0.1355236375958329, 'subsample': 0.963903899549204, 'colsample_bytree': 0.9028757172342523, 'min_child_weight': 2, 'gamma': 3.309347582059922, 'reg_alpha': 1.5924993373856797, 'reg_lambda': 1.4734345975348482}
Best xgb F1 score (positive class): 0.6171


[I 2025-09-02 02:47:31,921] A new study created in memory with name: no-name-de66c353-f033-475e-aae3-c3e412782d9e
[I 2025-09-02 02:47:31,946] Trial 0 finished with value: 0.5166096206418473 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5166096206418473.
[I 2025-09-02 02:47:32,087] Trial 1 finished with value: 0.5314764377694884 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 1 with value: 0.5314764377694884.
[I 2025-09-02 02:47:32,110] Trial 2 finished with value: 0.6335511406044322 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.6335511406044322.


xgb test accuracy: 0.7053
xgb test F1 (positive): 0.5385

--- Optimizing DT ---


[I 2025-09-02 02:47:32,130] Trial 3 finished with value: 0.5466003414365004 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.6335511406044322.
[I 2025-09-02 02:47:32,149] Trial 4 finished with value: 0.6477884232282484 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 4 with value: 0.6477884232282484.
[I 2025-09-02 02:47:32,167] Trial 5 finished with value: 0.5669345333761919 and parameters: {'criterion': 'gini', 'max_depth': 19, 'min_samples_split': 19, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'splitter': 'random'}. Best is trial 4 with value: 0.6477884232282484.
[I 2025-09-02 02:47:32,191] Trial 6 finished with value: 0.5182193182193182 and parameters: {'criterion': 'gini', 'max_depth': 17, 'min_samples_split': 8, 'min_samples_leaf': 3, 'm

Best dt params: {'criterion': 'gini', 'max_depth': 1, 'min_samples_split': 17, 'min_samples_leaf': 8, 'max_features': 'log2', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6665
dt test accuracy: 0.7158
dt test F1 (positive): 0.5714

OUTER FOLD 4/5
Train size: 749, Test size: 156
Class distribution in test set: {'non-void': np.int64(99), 'void': np.int64(57)}

--- Optimizing RF ---


[I 2025-09-02 02:47:34,368] Trial 0 finished with value: 0.5875248329666282 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.5875248329666282.
[I 2025-09-02 02:47:35,440] Trial 1 finished with value: 0.6077157593056716 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6077157593056716.
[I 2025-09-02 02:47:38,789] Trial 2 finished with value: 0.5472658295254414 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6077157593056716.
[I 2025-09-02 02:47:41,955] Trial 3 finished with value: 0.5609978844377322 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}
Best rf F1 score (positive class): 0.6077


[I 2025-09-02 02:48:58,362] A new study created in memory with name: no-name-fe69c109-42e0-4f80-ae0c-4a868709b560


rf test accuracy: 0.8397
rf test F1 (positive): 0.7863

--- Optimizing XGB ---


[I 2025-09-02 02:49:00,331] Trial 0 finished with value: 0.5533261544277409 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5533261544277409.
[I 2025-09-02 02:49:02,049] Trial 1 finished with value: 0.5568531161416538 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 1 with value: 0.5568531161416538.
[I 2025-09-02 02:49:03,294] Trial 2 finished with value: 0.5561768600106386 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 91, 'max_depth': 7, 'learning_rate': 0.15921728208236582, 'subsample': 0.8460815217831401, 'colsample_bytree': 0.8766303188631278, 'min_child_weight': 10, 'gamma': 4.224782501117531, 'reg_alpha': 0.279440539555202, 'reg_lambda': 0.00790794150014204}
Best xgb F1 score (positive class): 0.6189
xgb test accuracy: 0.7628
xgb test F1 (positive): 0.6891

--- Optimizing DT ---


[I 2025-09-02 02:50:14,911] Trial 1 finished with value: 0.5251796868912734 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.5291396955804654.
[I 2025-09-02 02:50:14,938] Trial 2 finished with value: 0.5481352816437602 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.5481352816437602.
[I 2025-09-02 02:50:14,960] Trial 3 finished with value: 0.5125896231159389 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.5481352816437602.
[I 2025-09-02 02:50:14,979] Trial 4 finished with value: 0.42010342598577893 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max

Best dt params: {'criterion': 'gini', 'max_depth': 3, 'min_samples_split': 16, 'min_samples_leaf': 9, 'max_features': 'log2', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6382
dt test accuracy: 0.7949
dt test F1 (positive): 0.6981

OUTER FOLD 5/5
Train size: 736, Test size: 169
Class distribution in test set: {'non-void': np.int64(95), 'void': np.int64(74)}

--- Optimizing RF ---


[I 2025-09-02 02:50:17,444] Trial 0 finished with value: 0.6192393789198848 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6192393789198848.
[I 2025-09-02 02:50:18,571] Trial 1 finished with value: 0.6400931741965669 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6400931741965669.
[I 2025-09-02 02:50:21,924] Trial 2 finished with value: 0.5939859951382086 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6400931741965669.
[I 2025-09-02 02:50:25,058] Trial 3 finished with value: 0.6181033796651171 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 494, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'bootstrap': False}
Best rf F1 score (positive class): 0.6447


[I 2025-09-02 02:51:39,887] A new study created in memory with name: no-name-becb5027-ff6c-4f0d-9a5d-e407b97fde5c


rf test accuracy: 0.6746
rf test F1 (positive): 0.6707

--- Optimizing XGB ---


[I 2025-09-02 02:51:41,870] Trial 0 finished with value: 0.579180760352146 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.579180760352146.
[I 2025-09-02 02:51:43,637] Trial 1 finished with value: 0.6018467178250879 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 1 with value: 0.6018467178250879.
[I 2025-09-02 02:51:45,130] Trial 2 finished with value: 0.5863229617825688 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.65

Best xgb params: {'n_estimators': 383, 'max_depth': 11, 'learning_rate': 0.010247934625236994, 'subsample': 0.6833315450782069, 'colsample_bytree': 0.959158475403689, 'min_child_weight': 8, 'gamma': 3.498641297803042, 'reg_alpha': 0.770373344695678, 'reg_lambda': 0.21707255991544044}
Best xgb F1 score (positive class): 0.6239


[I 2025-09-02 02:53:25,132] A new study created in memory with name: no-name-18f7a81b-b30c-4c0f-9ecf-16642616cbfe
[I 2025-09-02 02:53:25,159] Trial 0 finished with value: 0.5418116605616605 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5418116605616605.
[I 2025-09-02 02:53:25,323] Trial 1 finished with value: 0.5292908719632857 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.5418116605616605.


xgb test accuracy: 0.6864
xgb test F1 (positive): 0.6788

--- Optimizing DT ---


[I 2025-09-02 02:53:25,349] Trial 2 finished with value: 0.5435356896219964 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.5435356896219964.
[I 2025-09-02 02:53:25,370] Trial 3 finished with value: 0.6343937181401508 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.6343937181401508.
[I 2025-09-02 02:53:25,397] Trial 4 finished with value: 0.4083730492477338 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.6343937181401508.
[I 2025-09-02 02:53:25,421] Trial 5 finished with value: 0.4924242655902799 and parameters: {'criterion': 'gini', 'max_depth': 19, 'min_samples_split': 19, 'min_samples_leaf': 6, 'max_

Best dt params: {'criterion': 'entropy', 'max_depth': 2, 'min_samples_split': 13, 'min_samples_leaf': 3, 'max_features': None, 'splitter': 'best'}
Best dt F1 score (positive class): 0.6641
dt test accuracy: 0.6627
dt test F1 (positive): 0.6780

BINARY NESTED CROSS-VALIDATION RESULTS SUMMARY
Positive class: 'void'

RF Results:
----------------------------------------
accuracy          : 0.7241 ± 0.1013
f1_positive       : 0.6704 ± 0.1388
precision_positive: 0.6720 ± 0.1282
recall_positive   : 0.6793 ± 0.1708
f1_macro          : 0.7134 ± 0.1074
Individual fold accuracies: ['0.7459', '0.5780', '0.7825', '0.8397', '0.6746']
Individual fold F1 (pos): ['0.7480', '0.4341', '0.7130', '0.7863', '0.6707']

XGB Results:
----------------------------------------
accuracy          : 0.6689 ± 0.0760
f1_positive       : 0.5740 ± 0.1032
precision_positive: 0.6323 ± 0.0517
recall_positive   : 0.5488 ± 0.1790
f1_macro          : 0.6488 ± 0.0769
Individual fold accuracies: ['0.5656', '0.6243', '

[I 2025-09-02 02:53:29,306] Trial 0 finished with value: 0.6209576628651773 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6209576628651773.
[I 2025-09-02 02:53:30,901] Trial 1 finished with value: 0.6279827393170009 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6279827393170009.
[I 2025-09-02 02:53:39,942] Trial 2 finished with value: 0.6467709860694087 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 2 with value: 0.6467709860694087.
[I 2025-09-02 02:53:49,951] Trial 3 finished with value: 0.6406707491611738 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 250, 'max_depth': 3, 'min_samples_split': 13, 'min_samples_leaf': 5, 'max_features': None, 'bootstrap': True}
Best rf F1 score (positive class): 0.6832


[I 2025-09-02 02:58:46,349] A new study created in memory with name: no-name-a528cc94-cd8b-4544-a525-b570290f8615


rf test accuracy: 0.7575
rf test F1 (positive): 0.7619

--- Optimizing XGB ---


[I 2025-09-02 02:58:49,336] Trial 0 finished with value: 0.600423665733166 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.600423665733166.
[I 2025-09-02 02:58:51,623] Trial 1 finished with value: 0.5839063574060919 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.600423665733166.
[I 2025-09-02 02:58:53,574] Trial 2 finished with value: 0.6088812176793618 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.655

Best xgb params: {'n_estimators': 108, 'max_depth': 9, 'learning_rate': 0.028384751942895404, 'subsample': 0.6379535208204465, 'colsample_bytree': 0.994483952944437, 'min_child_weight': 3, 'gamma': 3.7417379735961407, 'reg_alpha': 1.2065158462718286, 'reg_lambda': 0.010779401703937867}
Best xgb F1 score (positive class): 0.6404


[I 2025-09-02 03:01:11,479] A new study created in memory with name: no-name-cfb42ef7-a6b3-47b8-baa8-d617fa1a490f
[I 2025-09-02 03:01:11,527] Trial 0 finished with value: 0.5408262983129936 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5408262983129936.


xgb test accuracy: 0.6940
xgb test F1 (positive): 0.6555

--- Optimizing DT ---


[I 2025-09-02 03:01:12,026] Trial 1 finished with value: 0.5677843546140294 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 1 with value: 0.5677843546140294.
[I 2025-09-02 03:01:12,071] Trial 2 finished with value: 0.5663044649407613 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 1 with value: 0.5677843546140294.
[I 2025-09-02 03:01:12,100] Trial 3 finished with value: 0.5478729306381971 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 1 with value: 0.5677843546140294.
[I 2025-09-02 03:01:12,127] Trial 4 finished with value: 0.4027451628115178 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_

Best dt params: {'criterion': 'gini', 'max_depth': 1, 'min_samples_split': 17, 'min_samples_leaf': 9, 'max_features': None, 'splitter': 'best'}
Best dt F1 score (positive class): 0.7104
dt test accuracy: 0.7201
dt test F1 (positive): 0.7350

OUTER FOLD 2/5
Train size: 1625, Test size: 618
Class distribution in test set: {'non-void': np.int64(368), 'void': np.int64(250)}

--- Optimizing RF ---


[I 2025-09-02 03:01:18,735] Trial 0 finished with value: 0.6285844040704364 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6285844040704364.
[I 2025-09-02 03:01:20,142] Trial 1 finished with value: 0.6817756000902465 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6817756000902465.
[I 2025-09-02 03:01:27,793] Trial 2 finished with value: 0.6550908759082312 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6817756000902465.
[I 2025-09-02 03:01:36,413] Trial 3 finished with value: 0.6560940337392643 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_feature

Best rf params: {'n_estimators': 104, 'max_depth': 3, 'min_samples_split': 11, 'min_samples_leaf': 9, 'max_features': 'log2', 'bootstrap': True}
Best rf F1 score (positive class): 0.7035
rf test accuracy: 0.6489
rf test F1 (positive): 0.4589

--- Optimizing XGB ---


[I 2025-09-02 03:03:04,716] Trial 0 finished with value: 0.642449535298792 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.642449535298792.
[I 2025-09-02 03:03:06,794] Trial 1 finished with value: 0.6614929171309579 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 1 with value: 0.6614929171309579.
[I 2025-09-02 03:03:08,686] Trial 2 finished with value: 0.661088477991212 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.655

Best xgb params: {'n_estimators': 80, 'max_depth': 3, 'learning_rate': 0.0536097259776323, 'subsample': 0.9214373883659217, 'colsample_bytree': 0.753040360130198, 'min_child_weight': 4, 'gamma': 0.373253746218435, 'reg_alpha': 0.1957578106671043, 'reg_lambda': 1.7051299982664783}
Best xgb F1 score (positive class): 0.6971


[I 2025-09-02 03:04:46,583] A new study created in memory with name: no-name-6b9bafe0-2151-414f-b558-bc7f1b7995d2
[I 2025-09-02 03:04:46,625] Trial 0 finished with value: 0.523576384506031 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.523576384506031.


xgb test accuracy: 0.6764
xgb test F1 (positive): 0.5169

--- Optimizing DT ---


[I 2025-09-02 03:04:47,008] Trial 1 finished with value: 0.5294524486048825 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 1 with value: 0.5294524486048825.
[I 2025-09-02 03:04:47,049] Trial 2 finished with value: 0.5908525270563643 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.5908525270563643.
[I 2025-09-02 03:04:47,076] Trial 3 finished with value: 0.6417559502621475 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.6417559502621475.
[I 2025-09-02 03:04:47,100] Trial 4 finished with value: 0.6951261804602487 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_

Best dt params: {'criterion': 'gini', 'max_depth': 3, 'min_samples_split': 17, 'min_samples_leaf': 7, 'max_features': 'log2', 'splitter': 'best'}
Best dt F1 score (positive class): 0.7076
dt test accuracy: 0.6521
dt test F1 (positive): 0.4557

OUTER FOLD 3/5
Train size: 1853, Test size: 390
Class distribution in test set: {'non-void': np.int64(206), 'void': np.int64(184)}

--- Optimizing RF ---


[I 2025-09-02 03:04:50,198] Trial 0 finished with value: 0.6047597628766864 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6047597628766864.
[I 2025-09-02 03:04:51,688] Trial 1 finished with value: 0.6322431167958144 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.6322431167958144.
[I 2025-09-02 03:05:00,092] Trial 2 finished with value: 0.6201712537871295 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.6322431167958144.
[I 2025-09-02 03:05:09,592] Trial 3 finished with value: 0.61051613708601 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_features'

Best rf params: {'n_estimators': 486, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'bootstrap': False}
Best rf F1 score (positive class): 0.6348


[I 2025-09-02 03:07:39,379] A new study created in memory with name: no-name-5dbb926b-0316-44f3-b2ba-32672e4be309


rf test accuracy: 0.7718
rf test F1 (positive): 0.7575

--- Optimizing XGB ---


[I 2025-09-02 03:07:42,265] Trial 0 finished with value: 0.5847494578425722 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.5847494578425722.
[I 2025-09-02 03:07:44,307] Trial 1 finished with value: 0.5358133945095419 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.5847494578425722.
[I 2025-09-02 03:07:46,348] Trial 2 finished with value: 0.5797485041088765 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 186, 'max_depth': 3, 'learning_rate': 0.010320776639609446, 'subsample': 0.6527207681482519, 'colsample_bytree': 0.777685724416138, 'min_child_weight': 7, 'gamma': 2.6564248376658894, 'reg_alpha': 0.30387580226238625, 'reg_lambda': 0.46675031340062567}
Best xgb F1 score (positive class): 0.6375


[I 2025-09-02 03:09:34,991] A new study created in memory with name: no-name-b0956236-f477-47de-a24d-f204a755a455
[I 2025-09-02 03:09:35,034] Trial 0 finished with value: 0.5499704629775418 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5499704629775418.


xgb test accuracy: 0.7513
xgb test F1 (positive): 0.7221

--- Optimizing DT ---


[I 2025-09-02 03:09:35,466] Trial 1 finished with value: 0.5277762362806758 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 0 with value: 0.5499704629775418.
[I 2025-09-02 03:09:35,519] Trial 2 finished with value: 0.5300313100472919 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 0 with value: 0.5499704629775418.
[I 2025-09-02 03:09:35,564] Trial 3 finished with value: 0.5987168808152414 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 3 with value: 0.5987168808152414.
[I 2025-09-02 03:09:35,596] Trial 4 finished with value: 0.6181301656863876 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_

Best dt params: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 17, 'min_samples_leaf': 7, 'max_features': 'log2', 'splitter': 'best'}
Best dt F1 score (positive class): 0.6432
dt test accuracy: 0.6308
dt test F1 (positive): 0.7012

OUTER FOLD 4/5
Train size: 1735, Test size: 508
Class distribution in test set: {'non-void': np.int64(287), 'void': np.int64(221)}

--- Optimizing RF ---


[I 2025-09-02 03:09:39,344] Trial 0 finished with value: 0.6603519747370318 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6603519747370318.
[I 2025-09-02 03:09:40,782] Trial 1 finished with value: 0.7016736478868698 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 1 with value: 0.7016736478868698.
[I 2025-09-02 03:09:48,824] Trial 2 finished with value: 0.665443448083621 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 1 with value: 0.7016736478868698.
[I 2025-09-02 03:09:57,820] Trial 3 finished with value: 0.6745247765378011 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_features

Best rf params: {'n_estimators': 233, 'max_depth': 3, 'min_samples_split': 16, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'bootstrap': True}
Best rf F1 score (positive class): 0.7094


[I 2025-09-02 03:11:59,942] A new study created in memory with name: no-name-61659c35-9bed-4dd9-80a9-79785787b64f


rf test accuracy: 0.6772
rf test F1 (positive): 0.6784

--- Optimizing XGB ---


[I 2025-09-02 03:12:02,834] Trial 0 finished with value: 0.6284656442084745 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.6284656442084745.
[I 2025-09-02 03:12:04,819] Trial 1 finished with value: 0.6215200222878206 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.6284656442084745.
[I 2025-09-02 03:12:06,711] Trial 2 finished with value: 0.6549538818642722 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.

Best xgb params: {'n_estimators': 435, 'max_depth': 3, 'learning_rate': 0.010169261160219944, 'subsample': 0.8876628060388142, 'colsample_bytree': 0.9646768081772031, 'min_child_weight': 5, 'gamma': 1.9791428725852591, 'reg_alpha': 0.9048427174994054, 'reg_lambda': 0.024774184368885926}
Best xgb F1 score (positive class): 0.7061


[I 2025-09-02 03:14:39,762] A new study created in memory with name: no-name-0810bcdd-5e7c-4996-82c6-2c565ba32548
[I 2025-09-02 03:14:39,805] Trial 0 finished with value: 0.5232195978464635 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5232195978464635.


xgb test accuracy: 0.6614
xgb test F1 (positive): 0.6627

--- Optimizing DT ---


[I 2025-09-02 03:14:40,232] Trial 1 finished with value: 0.5504211359915385 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 1 with value: 0.5504211359915385.
[I 2025-09-02 03:14:40,276] Trial 2 finished with value: 0.6748540946433218 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.6748540946433218.
[I 2025-09-02 03:14:40,304] Trial 3 finished with value: 0.6517644615721662 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.6748540946433218.
[I 2025-09-02 03:14:40,329] Trial 4 finished with value: 0.6369192140642963 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max_

Best dt params: {'criterion': 'gini', 'max_depth': 1, 'min_samples_split': 18, 'min_samples_leaf': 3, 'max_features': None, 'splitter': 'best'}
Best dt F1 score (positive class): 0.7134
dt test accuracy: 0.6949
dt test F1 (positive): 0.7036

OUTER FOLD 5/5
Train size: 1784, Test size: 459
Class distribution in test set: {'non-void': np.int64(285), 'void': np.int64(174)}

--- Optimizing RF ---


[I 2025-09-02 03:14:46,830] Trial 0 finished with value: 0.6532991361758484 and parameters: {'n_estimators': 218, 'max_depth': 20, 'min_samples_split': 15, 'min_samples_leaf': 6, 'max_features': 'sqrt', 'bootstrap': True}. Best is trial 0 with value: 0.6532991361758484.
[I 2025-09-02 03:14:48,350] Trial 1 finished with value: 0.6438577435407618 and parameters: {'n_estimators': 369, 'max_depth': 3, 'min_samples_split': 20, 'min_samples_leaf': 9, 'max_features': 'sqrt', 'bootstrap': False}. Best is trial 0 with value: 0.6532991361758484.
[I 2025-09-02 03:14:56,597] Trial 2 finished with value: 0.6606482953175196 and parameters: {'n_estimators': 244, 'max_depth': 8, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'bootstrap': True}. Best is trial 2 with value: 0.6606482953175196.
[I 2025-09-02 03:15:05,816] Trial 3 finished with value: 0.666067876244523 and parameters: {'n_estimators': 281, 'max_depth': 13, 'min_samples_split': 2, 'min_samples_leaf': 7, 'max_features

Best rf params: {'n_estimators': 361, 'max_depth': 3, 'min_samples_split': 15, 'min_samples_leaf': 9, 'max_features': None, 'bootstrap': False}
Best rf F1 score (positive class): 0.6719


[I 2025-09-02 03:21:48,457] A new study created in memory with name: no-name-abb08ed7-c0ba-49d4-bbc0-0ad7f80b19bf


rf test accuracy: 0.7712
rf test F1 (positive): 0.7395

--- Optimizing XGB ---


[I 2025-09-02 03:21:51,357] Trial 0 finished with value: 0.6478305033869775 and parameters: {'n_estimators': 218, 'max_depth': 12, 'learning_rate': 0.1205712628744377, 'subsample': 0.8394633936788146, 'colsample_bytree': 0.6624074561769746, 'min_child_weight': 2, 'gamma': 0.2904180608409973, 'reg_alpha': 1.7323522915498704, 'reg_lambda': 1.2022300234864176}. Best is trial 0 with value: 0.6478305033869775.
[I 2025-09-02 03:21:53,355] Trial 1 finished with value: 0.6219281582364747 and parameters: {'n_estimators': 369, 'max_depth': 3, 'learning_rate': 0.2708160864249968, 'subsample': 0.9329770563201687, 'colsample_bytree': 0.6849356442713105, 'min_child_weight': 2, 'gamma': 0.9170225492671691, 'reg_alpha': 0.6084844859190754, 'reg_lambda': 1.0495128632644757}. Best is trial 0 with value: 0.6478305033869775.
[I 2025-09-02 03:21:55,456] Trial 2 finished with value: 0.641064976983626 and parameters: {'n_estimators': 244, 'max_depth': 5, 'learning_rate': 0.08012737503998542, 'subsample': 0.6

Best xgb params: {'n_estimators': 382, 'max_depth': 8, 'learning_rate': 0.010484491810365239, 'subsample': 0.8520779079976167, 'colsample_bytree': 0.8248314235353149, 'min_child_weight': 3, 'gamma': 3.453269159253218, 'reg_alpha': 0.6540502747583534, 'reg_lambda': 1.3615312157450883}
Best xgb F1 score (positive class): 0.6696


[I 2025-09-02 03:24:48,446] A new study created in memory with name: no-name-1e4e1349-2ff1-40b0-bb6d-69ba6b3307b8
[I 2025-09-02 03:24:48,490] Trial 0 finished with value: 0.5119163872287597 and parameters: {'criterion': 'entropy', 'max_depth': 15, 'min_samples_split': 13, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'random'}. Best is trial 0 with value: 0.5119163872287597.


xgb test accuracy: 0.7625
xgb test F1 (positive): 0.6997

--- Optimizing DT ---


[I 2025-09-02 03:24:48,942] Trial 1 finished with value: 0.5799361773180488 and parameters: {'criterion': 'entropy', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features': None, 'splitter': 'best'}. Best is trial 1 with value: 0.5799361773180488.
[I 2025-09-02 03:24:48,985] Trial 2 finished with value: 0.6020814881260618 and parameters: {'criterion': 'gini', 'max_depth': 6, 'min_samples_split': 8, 'min_samples_leaf': 5, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.6020814881260618.
[I 2025-09-02 03:24:49,013] Trial 3 finished with value: 0.5577695215211261 and parameters: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 20, 'min_samples_leaf': 10, 'max_features': 'sqrt', 'splitter': 'best'}. Best is trial 2 with value: 0.6020814881260618.
[I 2025-09-02 03:24:49,037] Trial 4 finished with value: 0.43346324728110924 and parameters: {'criterion': 'entropy', 'max_depth': 1, 'min_samples_split': 19, 'min_samples_leaf': 3, 'max

Best dt params: {'criterion': 'gini', 'max_depth': 2, 'min_samples_split': 4, 'min_samples_leaf': 7, 'max_features': None, 'splitter': 'best'}
Best dt F1 score (positive class): 0.6797
dt test accuracy: 0.8235
dt test F1 (positive): 0.8000

BINARY NESTED CROSS-VALIDATION RESULTS SUMMARY
Positive class: 'void'

RF Results:
----------------------------------------
accuracy          : 0.7253 ± 0.0580
f1_positive       : 0.6792 ± 0.1276
precision_positive: 0.6743 ± 0.0776
recall_positive   : 0.7066 ± 0.1932
f1_macro          : 0.7146 ± 0.0750
Individual fold accuracies: ['0.7575', '0.6489', '0.7718', '0.6772', '0.7712']
Individual fold F1 (pos): ['0.7619', '0.4589', '0.7575', '0.6784', '0.7395']

XGB Results:
----------------------------------------
accuracy          : 0.7091 ± 0.0453
f1_positive       : 0.6514 ± 0.0799
precision_positive: 0.6860 ± 0.0753
recall_positive   : 0.6370 ± 0.1364
f1_macro          : 0.6977 ± 0.0514
Individual fold accuracies: ['0.6940', '0.6764', '0.75