# Hyperparameter Optimization

## Imports

In [3]:
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
import sys
import os
sys.path.append(os.path.abspath('../modules'))
from optimizer import optimize_pipeline

## Setup

In [4]:
np.random.seed(42)

In [5]:
train_data = pd.read_csv('../data/train_winsor_1_norm.csv')
X_train = train_data.drop(columns='class')
y_train = train_data['class']

In [6]:
best_trials = {}
model_names = ['KNN','DTR', 'SVM', 'RF', 'XGB', 'LGBM', 'MLP', 'LVQ']

In [7]:
X_train = np.ascontiguousarray(X_train.to_numpy())
y_train = np.ascontiguousarray(y_train.to_numpy())

## KNN

In [6]:
best_trials['KNN'] = optimize_pipeline(X_train, y_train, 'KNN')

[I 2024-11-30 21:21:00,822] A new study created in memory with name: optimization_KNN
[I 2024-11-30 21:21:01,157] Trial 0 finished with value: 0.8412312631050826 and parameters: {'n_neighbors': 7, 'weights': 'distance', 'algorithm': 'kd_tree', 'metric': 'euclidean'}. Best is trial 0 with value: 0.8412312631050826.
[I 2024-11-30 21:21:01,589] Trial 1 finished with value: 0.843725280062913 and parameters: {'n_neighbors': 8, 'weights': 'distance', 'algorithm': 'auto', 'metric': 'manhattan'}. Best is trial 1 with value: 0.843725280062913.
[I 2024-11-30 21:21:03,537] Trial 2 finished with value: 0.8293668926244887 and parameters: {'n_neighbors': 7, 'weights': 'distance', 'algorithm': 'ball_tree', 'metric': 'chebyshev'}. Best is trial 1 with value: 0.843725280062913.
[I 2024-11-30 21:21:04,047] Trial 3 finished with value: 0.8373773301454234 and parameters: {'n_neighbors': 6, 'weights': 'uniform', 'algorithm': 'auto', 'metric': 'euclidean'}. Best is trial 1 with value: 0.843725280062913.
[I 

Best trial:
Value: 0.845539139132965
Params:
  n_neighbors: 10
  weights: uniform
  algorithm: brute
  metric: manhattan


## DTR

In [7]:
best_trials['DTR'] = optimize_pipeline(X_train, y_train, 'DTR')

[I 2024-11-30 21:22:13,791] A new study created in memory with name: optimization_DTR
[I 2024-11-30 21:22:14,090] Trial 0 finished with value: 0.8287618921975876 and parameters: {'criterion': 'gini', 'splitter': 'best', 'max_depth': 13, 'min_samples_split': 4, 'min_samples_leaf': 2, 'max_features': 'sqrt'}. Best is trial 0 with value: 0.8287618921975876.
[I 2024-11-30 21:22:14,404] Trial 1 finished with value: 0.8233210859796213 and parameters: {'criterion': 'gini', 'splitter': 'best', 'max_depth': 15, 'min_samples_split': 5, 'min_samples_leaf': 2, 'max_features': 'log2'}. Best is trial 0 with value: 0.8287618921975876.
[I 2024-11-30 21:22:14,451] Trial 2 finished with value: 0.8153107626797518 and parameters: {'criterion': 'entropy', 'splitter': 'random', 'max_depth': 16, 'min_samples_split': 10, 'min_samples_leaf': 4, 'max_features': 'sqrt'}. Best is trial 0 with value: 0.8287618921975876.
[I 2024-11-30 21:22:14,716] Trial 3 finished with value: 0.813571775517914 and parameters: {'cr

Best trial:
Value: 0.8385108028855667
Params:
  criterion: gini
  splitter: best
  max_depth: 10
  min_samples_split: 2
  min_samples_leaf: 3
  max_features: sqrt


## LVQ

In [None]:
best_trials['LVQ'] = optimize_pipeline(X_train, y_train, 'LVQ', n_trials=20)

[I 2024-11-30 23:29:11,448] A new study created in memory with name: optimization_LVQ
[I 2024-11-30 23:31:54,412] Trial 0 finished with value: 0.7855375286159463 and parameters: {'n_codebooks': 10, 'lrate': 0.056052017320695036, 'epochs': 20}. Best is trial 0 with value: 0.7855375286159463.
[I 2024-11-30 23:43:04,831] Trial 1 finished with value: 0.7844791847814137 and parameters: {'n_codebooks': 14, 'lrate': 0.07907870487462496, 'epochs': 40}. Best is trial 0 with value: 0.7855375286159463.
[I 2024-11-30 23:48:54,780] Trial 2 finished with value: 0.654348981333708 and parameters: {'n_codebooks': 9, 'lrate': 0.4483866025242289, 'epochs': 33}. Best is trial 0 with value: 0.7855375286159463.
[I 2024-11-30 23:53:52,593] Trial 3 finished with value: 0.6956111697921834 and parameters: {'n_codebooks': 12, 'lrate': 0.3770618060221578, 'epochs': 21}. Best is trial 0 with value: 0.7855375286159463.
[I 2024-11-30 23:55:49,142] Trial 4 finished with value: 0.7231937009366984 and parameters: {'n_c

Best trial:
Value: 0.7932453945352644
Params:
  n_codebooks: 15
  lrate: 0.27565881193085223
  epochs: 32


: 

## SVM

In [8]:
best_trials['SVM'] = optimize_pipeline(X_train, y_train, 'SVM')

[I 2024-11-30 21:24:53,063] A new study created in memory with name: optimization_SVM
[I 2024-11-30 21:25:00,144] Trial 0 finished with value: 0.7190355972805106 and parameters: {'C': 0.12014256200518025, 'kernel': 'linear', 'gamma': 'scale'}. Best is trial 0 with value: 0.7190355972805106.
[I 2024-11-30 21:25:07,109] Trial 1 finished with value: 0.7145015349883395 and parameters: {'C': 0.10780512361824113, 'kernel': 'linear', 'gamma': 'auto'}. Best is trial 0 with value: 0.7190355972805106.
[I 2024-11-30 21:25:15,084] Trial 2 finished with value: 0.6989336892461724 and parameters: {'C': 0.7200398858973549, 'kernel': 'linear', 'gamma': 'scale'}. Best is trial 0 with value: 0.7190355972805106.
[I 2024-11-30 21:25:30,620] Trial 3 finished with value: 0.7069452118672259 and parameters: {'C': 1.3250460338788763, 'kernel': 'linear', 'gamma': 'scale'}. Best is trial 0 with value: 0.7190355972805106.
[I 2024-11-30 21:26:02,181] Trial 4 finished with value: 0.7772235486143414 and parameters: {

Best trial:
Value: 0.7822112969773394
Params:
  C: 0.2586833547879395
  kernel: rbf
  gamma: scale


## RF

In [10]:
best_trials['RF'] = optimize_pipeline(X_train, y_train, 'RF')

[I 2024-11-30 21:42:13,188] A new study created in memory with name: optimization_RF
[I 2024-11-30 21:42:36,930] Trial 0 finished with value: 0.8269482044591333 and parameters: {'n_estimators': 451, 'criterion': 'entropy', 'max_depth': 4, 'min_samples_split': 2, 'min_samples_leaf': 2, 'max_features': 'log2'}. Best is trial 0 with value: 0.8269482044591333.
[I 2024-11-30 21:43:26,543] Trial 1 finished with value: 0.86934249500497 and parameters: {'n_estimators': 443, 'criterion': 'gini', 'max_depth': 11, 'min_samples_split': 10, 'min_samples_leaf': 4, 'max_features': 'log2'}. Best is trial 1 with value: 0.86934249500497.
[I 2024-11-30 21:43:30,289] Trial 2 finished with value: 0.8485613428513747 and parameters: {'n_estimators': 51, 'criterion': 'entropy', 'max_depth': 6, 'min_samples_split': 4, 'min_samples_leaf': 2, 'max_features': 'sqrt'}. Best is trial 1 with value: 0.86934249500497.
[I 2024-11-30 21:43:43,150] Trial 3 finished with value: 0.8759925596398153 and parameters: {'n_estim

Best trial:
Value: 0.8768241175494669
Params:
  n_estimators: 209
  criterion: entropy
  max_depth: 20
  min_samples_split: 2
  min_samples_leaf: 3
  max_features: sqrt


## LGBM

In [11]:
best_trials['LGBM'] = optimize_pipeline(X_train, y_train, 'LGBM' )

[I 2024-11-30 22:15:32,893] A new study created in memory with name: optimization_LGBM


[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001123 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001021 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:15:40,510] Trial 0 finished with value: 0.8772014182829662 and parameters: {'n_estimators': 190, 'learning_rate': 0.11461628957308397, 'num_leaves': 63, 'max_depth': 15, 'subsample': 0.8650774308778929}. Best is trial 0 with value: 0.8772014182829662.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000229 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000252 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:15:41,137] Trial 1 finished with value: 0.879090977363955 and parameters: {'n_estimators': 172, 'learning_rate': 0.09476437597274415, 'num_leaves': 41, 'max_depth': -1, 'subsample': 0.8398278348839231}. Best is trial 1 with value: 0.879090977363955.


[LightGBM] [Info] Number of positive: 6928, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000253 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10587, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654387 -> initscore=0.638381
[LightGBM] [Info] Start training from score 0.638381
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000277 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:15:41,256] Trial 2 finished with value: 0.815990806346465 and parameters: {'n_estimators': 52, 'learning_rate': 0.010097875777634836, 'num_leaves': 37, 'max_depth': 4, 'subsample': 0.9680490016758833}. Best is trial 1 with value: 0.879090977363955.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3660
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000223 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10587, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654293 -> initscore=0.637964
[LightGBM] [Info] Start training from score 0.637964
[LightGBM] [Info] Number of positive: 6928, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000218 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10587, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654387 -> initscore=0.638381
[LightGBM] [Info] Start training from score 0.638381
[LightGBM] [Info] Nu

[I 2024-11-30 22:15:41,739] Trial 3 finished with value: 0.879166648819625 and parameters: {'n_estimators': 111, 'learning_rate': 0.06601007755810298, 'num_leaves': 49, 'max_depth': 8, 'subsample': 0.830189749976642}. Best is trial 3 with value: 0.879166648819625.


[LightGBM] [Info] Number of positive: 6928, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000309 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10587, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654387 -> initscore=0.638381
[LightGBM] [Info] Start training from score 0.638381
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000232 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:15:42,506] Trial 4 finished with value: 0.8665464204403165 and parameters: {'n_estimators': 156, 'learning_rate': 0.011171734396780313, 'num_leaves': 51, 'max_depth': 0, 'subsample': 0.827756111320732}. Best is trial 3 with value: 0.879166648819625.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000228 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000247 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:15:43,364] Trial 5 finished with value: 0.8723652983839718 and parameters: {'n_estimators': 147, 'learning_rate': 0.021601075577837046, 'num_leaves': 38, 'max_depth': 18, 'subsample': 0.8410394409123473}. Best is trial 3 with value: 0.879166648819625.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000225 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000227 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:15:43,910] Trial 6 finished with value: 0.8779571334053499 and parameters: {'n_estimators': 110, 'learning_rate': 0.08117507622775699, 'num_leaves': 68, 'max_depth': 9, 'subsample': 0.8044327259402652}. Best is trial 3 with value: 0.879166648819625.


[LightGBM] [Info] Number of positive: 6928, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000231 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10587, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654387 -> initscore=0.638381
[LightGBM] [Info] Start training from score 0.638381
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000218 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:15:44,038] Trial 7 finished with value: 0.7434448959032045 and parameters: {'n_estimators': 145, 'learning_rate': 0.013193974891683969, 'num_leaves': 38, 'max_depth': 1, 'subsample': 0.8261523235234827}. Best is trial 3 with value: 0.879166648819625.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000267 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 6927, number of negative: 3660
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000253 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10587, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654293 -> initscore=0.637964
[LightGBM] [Info] Start training from score 0.637964
[LightGBM] [Info] Nu

[I 2024-11-30 22:15:44,830] Trial 8 finished with value: 0.8806779648433272 and parameters: {'n_estimators': 135, 'learning_rate': 0.0570863133473121, 'num_leaves': 59, 'max_depth': 18, 'subsample': 0.9673337839404407}. Best is trial 8 with value: 0.8806779648433272.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000241 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000340 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:15:45,397] Trial 9 finished with value: 0.8598962986949387 and parameters: {'n_estimators': 95, 'learning_rate': 0.012614452202011338, 'num_leaves': 32, 'max_depth': 19, 'subsample': 0.9474616639724682}. Best is trial 8 with value: 0.8806779648433272.


[LightGBM] [Info] Number of positive: 6928, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000230 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10587, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654387 -> initscore=0.638381
[LightGBM] [Info] Start training from score 0.638381
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000248 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:15:46,472] Trial 10 finished with value: 0.8713074685442326 and parameters: {'n_estimators': 73, 'learning_rate': 0.03964053989397854, 'num_leaves': 59, 'max_depth': 14, 'subsample': 0.9959061585126769}. Best is trial 8 with value: 0.8806779648433272.


[LightGBM] [Info] Number of positive: 6928, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000255 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10587, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654387 -> initscore=0.638381
[LightGBM] [Info] Start training from score 0.638381
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000240 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:15:46,996] Trial 11 finished with value: 0.8776549901327277 and parameters: {'n_estimators': 122, 'learning_rate': 0.04501372590169097, 'num_leaves': 51, 'max_depth': 8, 'subsample': 0.9078064837601895}. Best is trial 8 with value: 0.8806779648433272.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3660
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000233 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10587, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654293 -> initscore=0.637964
[LightGBM] [Info] Start training from score 0.637964
[LightGBM] [Info] Number of positive: 6928, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000222 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10587, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654387 -> initscore=0.638381
[LightGBM] [Info] Start training from score 0.638381
[LightGBM] [Info] Nu

[I 2024-11-30 22:15:47,448] Trial 12 finished with value: 0.8767480748753348 and parameters: {'n_estimators': 96, 'learning_rate': 0.17757315744684596, 'num_leaves': 57, 'max_depth': 12, 'subsample': 0.9042542977004592}. Best is trial 8 with value: 0.8806779648433272.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3660
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000245 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10587, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654293 -> initscore=0.637964
[LightGBM] [Info] Start training from score 0.637964
[LightGBM] [Info] Number of positive: 6928, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000208 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10587, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654387 -> initscore=0.638381
[LightGBM] [Info] Start training from score 0.638381
[LightGBM] [Info] Nu

[I 2024-11-30 22:15:47,982] Trial 13 finished with value: 0.8791664774880275 and parameters: {'n_estimators': 131, 'learning_rate': 0.05099700542595049, 'num_leaves': 45, 'max_depth': 6, 'subsample': 0.9351272796508798}. Best is trial 8 with value: 0.8806779648433272.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000228 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000210 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:15:48,909] Trial 14 finished with value: 0.8724407128422456 and parameters: {'n_estimators': 107, 'learning_rate': 0.0305203685291721, 'num_leaves': 55, 'max_depth': 12, 'subsample': 0.8748604133599854}. Best is trial 8 with value: 0.8806779648433272.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000340 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000254 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:15:49,648] Trial 15 finished with value: 0.8784107338103777 and parameters: {'n_estimators': 77, 'learning_rate': 0.06586532666362872, 'num_leaves': 46, 'max_depth': 16, 'subsample': 0.987183933790492}. Best is trial 8 with value: 0.8806779648433272.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3660
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000251 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10587, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654293 -> initscore=0.637964
[LightGBM] [Info] Start training from score 0.637964
[LightGBM] [Info] Number of positive: 6928, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000227 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10587, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654387 -> initscore=0.638381
[LightGBM] [Info] Start training from score 0.638381
[LightGBM] [Info] Nu

[I 2024-11-30 22:15:49,891] Trial 16 finished with value: 0.8795443778821188 and parameters: {'n_estimators': 130, 'learning_rate': 0.14216879844139196, 'num_leaves': 63, 'max_depth': 4, 'subsample': 0.9291446867329616}. Best is trial 8 with value: 0.8806779648433272.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000232 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000281 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:15:50,129] Trial 17 finished with value: 0.8800734498559528 and parameters: {'n_estimators': 165, 'learning_rate': 0.18762817481944616, 'num_leaves': 67, 'max_depth': 3, 'subsample': 0.932414209752847}. Best is trial 8 with value: 0.8806779648433272.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000234 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000315 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:15:50,513] Trial 18 finished with value: 0.8643550607499012 and parameters: {'n_estimators': 200, 'learning_rate': 0.019915135284848295, 'num_leaves': 70, 'max_depth': 4, 'subsample': 0.963687852806937}. Best is trial 8 with value: 0.8806779648433272.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3660
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000325 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10587, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654293 -> initscore=0.637964
[LightGBM] [Info] Start training from score 0.637964
[LightGBM] [Info] Number of positive: 6928, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000237 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10587, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654387 -> initscore=0.638381
[LightGBM] [Info] Start training from score 0.638381
[LightGBM] [Info] Nu

[I 2024-11-30 22:15:51,413] Trial 19 finished with value: 0.8779573047369474 and parameters: {'n_estimators': 175, 'learning_rate': 0.17596542708030297, 'num_leaves': 65, 'max_depth': 20, 'subsample': 0.9216182917830545}. Best is trial 8 with value: 0.8806779648433272.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000245 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000345 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:15:52,199] Trial 20 finished with value: 0.8782592766779717 and parameters: {'n_estimators': 167, 'learning_rate': 0.12598635350110143, 'num_leaves': 60, 'max_depth': 12, 'subsample': 0.966268242934369}. Best is trial 8 with value: 0.8806779648433272.
[I 2024-11-30 22:15:52,379] Trial 21 finished with value: 0.8760683453165509 and parameters: {'n_estimators': 134, 'learning_rate': 0.14022884395890572, 'num_leaves': 64, 'max_depth': 3, 'subsample': 0.9387645227474724}. Best is trial 8 with value: 0.8806779648433272.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000248 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000209 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:15:52,554] Trial 22 finished with value: 0.8726677272092568 and parameters: {'n_estimators': 151, 'learning_rate': 0.18283497990238473, 'num_leaves': 67, 'max_depth': 2, 'subsample': 0.8819516152786502}. Best is trial 8 with value: 0.8806779648433272.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000252 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000289 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:15:53,033] Trial 23 finished with value: 0.8796954637960628 and parameters: {'n_estimators': 161, 'learning_rate': 0.09458096121804523, 'num_leaves': 61, 'max_depth': 6, 'subsample': 0.9218349714013988}. Best is trial 8 with value: 0.8806779648433272.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3660
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000263 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10587, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654293 -> initscore=0.637964
[LightGBM] [Info] Start training from score 0.637964
[LightGBM] [Info] Number of positive: 6928, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000223 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10587, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654387 -> initscore=0.638381
[LightGBM] [Info] Start training from score 0.638381
[LightGBM] [Info] Nu

[I 2024-11-30 22:15:53,524] Trial 24 finished with value: 0.8799223068314763 and parameters: {'n_estimators': 161, 'learning_rate': 0.09320699580520173, 'num_leaves': 54, 'max_depth': 6, 'subsample': 0.955719738280756}. Best is trial 8 with value: 0.8806779648433272.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000263 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000248 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:15:54,353] Trial 25 finished with value: 0.8802244786593647 and parameters: {'n_estimators': 191, 'learning_rate': 0.06267267110330704, 'num_leaves': 54, 'max_depth': 10, 'subsample': 0.9527155435318613}. Best is trial 8 with value: 0.8806779648433272.


[LightGBM] [Info] Number of positive: 6928, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000239 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10587, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654387 -> initscore=0.638381
[LightGBM] [Info] Start training from score 0.638381
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000240 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:15:55,212] Trial 26 finished with value: 0.880299950228171 and parameters: {'n_estimators': 181, 'learning_rate': 0.031204806135314348, 'num_leaves': 56, 'max_depth': 10, 'subsample': 0.9802516518435477}. Best is trial 8 with value: 0.8806779648433272.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000221 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000241 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:15:56,054] Trial 27 finished with value: 0.878335319352104 and parameters: {'n_estimators': 182, 'learning_rate': 0.032689079705160176, 'num_leaves': 54, 'max_depth': 11, 'subsample': 0.978708478975611}. Best is trial 8 with value: 0.8806779648433272.


[LightGBM] [Info] Number of positive: 6928, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000259 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10587, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654387 -> initscore=0.638381
[LightGBM] [Info] Start training from score 0.638381
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000240 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:15:56,924] Trial 28 finished with value: 0.8802999216729045 and parameters: {'n_estimators': 187, 'learning_rate': 0.05897908505894192, 'num_leaves': 57, 'max_depth': 16, 'subsample': 0.982223257100736}. Best is trial 8 with value: 0.8806779648433272.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000247 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000232 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:15:57,870] Trial 29 finished with value: 0.8772015039487651 and parameters: {'n_estimators': 186, 'learning_rate': 0.023690681378569618, 'num_leaves': 57, 'max_depth': 16, 'subsample': 0.9985305562717712}. Best is trial 8 with value: 0.8806779648433272.


[LightGBM] [Info] Number of positive: 6928, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000293 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10587, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654387 -> initscore=0.638381
[LightGBM] [Info] Start training from score 0.638381
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000256 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:15:58,678] Trial 30 finished with value: 0.8781085048719568 and parameters: {'n_estimators': 198, 'learning_rate': 0.029405257826460928, 'num_leaves': 48, 'max_depth': 14, 'subsample': 0.9800737623231724}. Best is trial 8 with value: 0.8806779648433272.


[LightGBM] [Info] Number of positive: 6928, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000256 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10587, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654387 -> initscore=0.638381
[LightGBM] [Info] Start training from score 0.638381
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000236 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:15:59,611] Trial 31 finished with value: 0.8800733927454203 and parameters: {'n_estimators': 191, 'learning_rate': 0.06186722138123315, 'num_leaves': 57, 'max_depth': 17, 'subsample': 0.9512189014792817}. Best is trial 8 with value: 0.8806779648433272.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000234 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000260 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:16:00,521] Trial 32 finished with value: 0.8792424059410944 and parameters: {'n_estimators': 178, 'learning_rate': 0.039032135046039765, 'num_leaves': 53, 'max_depth': 14, 'subsample': 0.976008470878595}. Best is trial 8 with value: 0.8806779648433272.


[LightGBM] [Info] Number of positive: 6928, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000216 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10587, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654387 -> initscore=0.638381
[LightGBM] [Info] Start training from score 0.638381
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000256 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:16:01,553] Trial 33 finished with value: 0.880073249969089 and parameters: {'n_estimators': 191, 'learning_rate': 0.05134494511982561, 'num_leaves': 62, 'max_depth': 20, 'subsample': 0.9582848453457649}. Best is trial 8 with value: 0.8806779648433272.


[LightGBM] [Info] Number of positive: 6928, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000235 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10587, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654387 -> initscore=0.638381
[LightGBM] [Info] Start training from score 0.638381
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000273 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:16:02,394] Trial 34 finished with value: 0.8803753646864445 and parameters: {'n_estimators': 174, 'learning_rate': 0.07222182007807802, 'num_leaves': 58, 'max_depth': 11, 'subsample': 0.9851906884303728}. Best is trial 8 with value: 0.8806779648433272.


[LightGBM] [Info] Number of positive: 6928, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000237 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10587, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654387 -> initscore=0.638381
[LightGBM] [Info] Start training from score 0.638381
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000262 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:16:03,369] Trial 35 finished with value: 0.8793932348576419 and parameters: {'n_estimators': 173, 'learning_rate': 0.05330625339432408, 'num_leaves': 59, 'max_depth': 18, 'subsample': 0.9887094668409597}. Best is trial 8 with value: 0.8806779648433272.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000297 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000237 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:16:04,296] Trial 36 finished with value: 0.8773526184179754 and parameters: {'n_estimators': 140, 'learning_rate': 0.08002502608925748, 'num_leaves': 57, 'max_depth': 15, 'subsample': 0.9718788066206465}. Best is trial 8 with value: 0.8806779648433272.


[LightGBM] [Info] Number of positive: 6928, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000290 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10587, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654387 -> initscore=0.638381
[LightGBM] [Info] Start training from score 0.638381
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000565 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:16:05,790] Trial 37 finished with value: 0.8819625520526811 and parameters: {'n_estimators': 180, 'learning_rate': 0.07583413324306121, 'num_leaves': 52, 'max_depth': 13, 'subsample': 0.9871762027079203}. Best is trial 37 with value: 0.8819625520526811.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000399 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000240 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:16:07,195] Trial 38 finished with value: 0.8807534649673998 and parameters: {'n_estimators': 120, 'learning_rate': 0.10991458405878535, 'num_leaves': 51, 'max_depth': 9, 'subsample': 0.9917641113825257}. Best is trial 37 with value: 0.8819625520526811.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000275 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000237 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:16:08,486] Trial 39 finished with value: 0.8793174491809065 and parameters: {'n_estimators': 121, 'learning_rate': 0.07593257500953825, 'num_leaves': 42, 'max_depth': 8, 'subsample': 0.9943639690446181}. Best is trial 37 with value: 0.8819625520526811.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000243 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000349 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:16:09,193] Trial 40 finished with value: 0.8797712209175321 and parameters: {'n_estimators': 116, 'learning_rate': 0.11106081308813905, 'num_leaves': 51, 'max_depth': 9, 'subsample': 0.9992852577716177}. Best is trial 37 with value: 0.8819625520526811.


[LightGBM] [Info] Number of positive: 6928, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000232 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10587, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654387 -> initscore=0.638381
[LightGBM] [Info] Start training from score 0.638381
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000261 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:16:09,658] Trial 41 finished with value: 0.8776547616905974 and parameters: {'n_estimators': 103, 'learning_rate': 0.108202305157204, 'num_leaves': 49, 'max_depth': 10, 'subsample': 0.9682220678181936}. Best is trial 37 with value: 0.8819625520526811.


[LightGBM] [Info] Number of positive: 6928, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000251 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10587, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654387 -> initscore=0.638381
[LightGBM] [Info] Start training from score 0.638381
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000264 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:16:10,393] Trial 42 finished with value: 0.8796197637851263 and parameters: {'n_estimators': 153, 'learning_rate': 0.07487880752674644, 'num_leaves': 52, 'max_depth': 13, 'subsample': 0.9848754649099276}. Best is trial 37 with value: 0.8819625520526811.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000295 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000254 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:16:10,960] Trial 43 finished with value: 0.8778060760466719 and parameters: {'n_estimators': 139, 'learning_rate': 0.0427277973390866, 'num_leaves': 46, 'max_depth': 7, 'subsample': 0.9434971087377448}. Best is trial 37 with value: 0.8819625520526811.


[LightGBM] [Info] Number of positive: 6928, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000259 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10587, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654387 -> initscore=0.638381
[LightGBM] [Info] Start training from score 0.638381
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000322 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:16:11,398] Trial 44 finished with value: 0.8725162129663182 and parameters: {'n_estimators': 83, 'learning_rate': 0.03484650896274102, 'num_leaves': 49, 'max_depth': 11, 'subsample': 0.9729485062825621}. Best is trial 37 with value: 0.8819625520526811.


[LightGBM] [Info] Number of positive: 6928, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000264 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10587, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654387 -> initscore=0.638381
[LightGBM] [Info] Start training from score 0.638381
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000259 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:16:12,254] Trial 45 finished with value: 0.8774284612052436 and parameters: {'n_estimators': 170, 'learning_rate': 0.026697705366761342, 'num_leaves': 55, 'max_depth': 11, 'subsample': 0.8526132240911273}. Best is trial 37 with value: 0.8819625520526811.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000244 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000268 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:16:13,077] Trial 46 finished with value: 0.8787132483014612 and parameters: {'n_estimators': 157, 'learning_rate': 0.09031399710227835, 'num_leaves': 59, 'max_depth': 13, 'subsample': 0.9883705006196398}. Best is trial 37 with value: 0.8819625520526811.


[LightGBM] [Info] Number of positive: 6928, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000272 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10587, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654387 -> initscore=0.638381
[LightGBM] [Info] Start training from score 0.638381
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000248 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:16:13,770] Trial 47 finished with value: 0.8803002072255675 and parameters: {'n_estimators': 181, 'learning_rate': 0.04846433399792349, 'num_leaves': 43, 'max_depth': 9, 'subsample': 0.9613641671129931}. Best is trial 37 with value: 0.8819625520526811.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000323 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000227 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-11-30 22:16:14,228] Trial 48 finished with value: 0.8799220783893459 and parameters: {'n_estimators': 145, 'learning_rate': 0.07196157214851302, 'num_leaves': 35, 'max_depth': 7, 'subsample': 0.9608003689090032}. Best is trial 37 with value: 0.8819625520526811.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3660
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000274 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10587, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654293 -> initscore=0.637964
[LightGBM] [Info] Start training from score 0.637964
[LightGBM] [Info] Number of positive: 6928, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000249 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10587, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654387 -> initscore=0.638381
[LightGBM] [Info] Start training from score 0.638381
[LightGBM] [Info] Nu

[I 2024-11-30 22:16:14,527] Trial 49 finished with value: 0.8707027251147279 and parameters: {'n_estimators': 58, 'learning_rate': 0.04792039987253527, 'num_leaves': 43, 'max_depth': 9, 'subsample': 0.8914519033081411}. Best is trial 37 with value: 0.8819625520526811.


[LightGBM] [Info] Number of positive: 6928, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000290 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10587, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654387 -> initscore=0.638381
[LightGBM] [Info] Start training from score 0.638381
Best trial:
Value: 0.8819625520526811
Params:
  n_estimators: 180
  learning_rate: 0.07583413324306121
  num_leaves: 52
  max_depth: 13
  subsample: 0.9871762027079203


## XGB

Otimização interrompida devido a tempo de execução superior a 1 hora

In [12]:
best_trials['XGB'] = optimize_pipeline(X_train, y_train, 'XGB')

[I 2024-11-30 22:16:14,533] A new study created in memory with name: optimization_XGB
[I 2024-11-30 22:16:41,448] Trial 0 finished with value: 0.8732720708650332 and parameters: {'learning_rate': 0.05631640289815015, 'loss': 'exponential', 'n_estimators': 256, 'max_depth': 3, 'subsample': 0.7306921064756602, 'criterion': 'friedman_mse'}. Best is trial 0 with value: 0.8732720708650332.
[I 2024-11-30 22:17:24,698] Trial 1 finished with value: 0.8582340109783576 and parameters: {'learning_rate': 0.011951044961068002, 'loss': 'exponential', 'n_estimators': 354, 'max_depth': 3, 'subsample': 0.8635815322317826, 'criterion': 'squared_error'}. Best is trial 0 with value: 0.8732720708650332.
[I 2024-11-30 22:19:01,185] Trial 2 finished with value: 0.8821134380797611 and parameters: {'learning_rate': 0.060357757311170275, 'loss': 'exponential', 'n_estimators': 450, 'max_depth': 6, 'subsample': 0.6903793600904184, 'criterion': 'squared_error'}. Best is trial 2 with value: 0.8821134380797611.
[I 2

KeyboardInterrupt: 

## MLP

In [None]:
best_trials['MLP'] = optimize_pipeline(X_train, y_train, 'MLP',n_trials=20)

[I 2024-11-30 23:31:48,486] A new study created in memory with name: optimization_MLP
[I 2024-11-30 23:33:51,832] Trial 0 finished with value: 0.8724410269501748 and parameters: {'hidden_layer_sizes': '(100,)', 'activation': 'relu', 'solver': 'adam', 'alpha': 0.008350794253187403}. Best is trial 0 with value: 0.8724410269501748.
STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
  self.n_iter_ = _check_optimize_result("lbfgs", opt_res, self.max_iter)
STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
  self.n_iter_ = _check_optimize_result("lbfgs", opt_res, self.max_iter)
STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/st

Best trial:
Value: 0.8770508463638151
Params:
  hidden_layer_sizes: (100, 50)
  activation: relu
  solver: adam
  alpha: 0.005067506187907968


: 

## Best individual models

In [8]:
import random
import optuna
from sklearn.model_selection import cross_val_score, StratifiedKFold
from sklearn.neural_network import MLPClassifier
from sklearn.pipeline import Pipeline
from sklearn.decomposition import PCA
from sklearn.ensemble import RandomForestClassifier, StackingClassifier
from sklearn.linear_model import LogisticRegression
from lightgbm import LGBMClassifier
from sklearn.ensemble import GradientBoostingClassifier, RandomForestClassifier, StackingClassifier, VotingClassifier
from sklearn.neighbors import KNeighborsClassifier
from sklearn.neural_network import MLPClassifier
from sklearn.svm import SVC
from sklearn.tree import DecisionTreeClassifier
from lvq_classifier import LVQ
from itertools import combinations

In [None]:
best_models = {
    'KNN': KNeighborsClassifier(n_neighbors=10,
                                           weights='uniform',
                                           algorithm='brute',
                                           metric='manhattan'),

    'LVQ': LVQ(n_codebooks=15,lrate=0.2756588,epochs=32),
    'DTR': DecisionTreeClassifier(criterion='gini',
                                             splitter='best',
                                             max_depth=10, 
                                             min_samples_split=2,
                                             min_samples_leaf=3,
                                             max_features='sqrt'),

    'SVM': SVC(probability=True, 
                          max_iter=1000, 
                          C=0.25868,
                          kernel='rbf',
                          gamma='scale'),

    'RF': RandomForestClassifier(n_estimators=366,
                                             criterion='entropy',
                                             max_depth=20, 
                                             min_samples_split=2,
                                             min_samples_leaf=3, 
                                             max_features='sqrt'),

    'XGB': GradientBoostingClassifier(learning_rate=0.05147,
                                                 loss='log_loss',
                                                 n_estimators=374,
                                                 max_depth=6, 
                                                 subsample=0.571017, 
                                                 criterion='friedman_mse'),

    'LGBM': LGBMClassifier(n_estimators=180,
                                     learning_rate=0.0758,
                                     num_leaves=52,
                                     max_depth=13,
                                     subsample=0.987176),

    'MLP': MLPClassifier(hidden_layer_sizes=(100,50),
                                    activation='relu',
                                    solver='adam',
                                    alpha=0.005,
                                    max_iter=200)
} 

## ANNs Ensemble

### Stacking

#### 2 ANNs

In [None]:
n_members = 2

ann_models = [best_models['MLP'] for _ in range(n_members)]

estimators = [(f'ann_{i+1}', model) for i, model in enumerate(ann_models)]

# Create a stacking ensemble with ANN models
ann_stack_2 = StackingClassifier(
    estimators=estimators,
    final_estimator=LogisticRegression()
)

In [None]:
cv = StratifiedKFold(n_splits=5, shuffle=True, random_state=42)
scores = cross_val_score(ann_stack_2, X_train, y_train, cv=cv, scoring='accuracy')



In [None]:
scores

array([0.87004156, 0.87230827, 0.87041934, 0.8760393 , 0.88397581])

In [None]:
print(f'Mean accuracy: {round(scores.mean() * 100, 2)}% ± {round(scores.std() * 100, 2)}')

Mean accuracy: 87.46% ± 0.52


#### 3 ANNs

In [None]:
n_members = 3

ann_models = [best_models['MLP'] for _ in range(n_members)]

estimators = [(f'ann_{i+1}', model) for i, model in enumerate(ann_models)]

# Create a stacking ensemble with ANN models
ann_stack_3 = StackingClassifier(
    estimators=estimators,
    final_estimator=LogisticRegression()
)

cv = StratifiedKFold(n_splits=5, shuffle=True, random_state=42)
scores = cross_val_score(ann_stack_3, X_train, y_train, cv=cv, scoring='accuracy')



In [None]:
scores

array([0.87004156, 0.87608614, 0.8689082 , 0.87830688, 0.88548753])

In [None]:
print(f'Mean accuracy: {round(scores.mean() * 100, 2)}% ± {round(scores.std() * 100, 2)}')

Mean accuracy: 87.58% ± 0.6


### Voting

#### 2 ANNs

In [None]:
n_members = 2

ann_models = [best_models['MLP'] for _ in range(n_members)]

estimators = [(f'ann_{i+1}', model) for i, model in enumerate(ann_models)]

# Create a stacking ensemble with ANN models
ann_stack_2 = VotingClassifier(
    estimators=estimators,
    voting='soft'
)

cv = StratifiedKFold(n_splits=5, shuffle=True, random_state=42)
scores = cross_val_score(ann_stack_2, X_train, y_train, cv=cv, scoring='accuracy')



In [None]:
scores

array([0.87041934, 0.87306385, 0.87306385, 0.88019652, 0.88435374])

In [None]:
print(f'Mean accuracy: {round(scores.mean() * 100, 2)}% ± {round(scores.std() * 100, 2)}')

Mean accuracy: 87.62% ± 0.52


#### 3 ANNS

In [None]:
n_members = 3

ann_models = [best_models['MLP'] for _ in range(n_members)]

estimators = [(f'ann_{i+1}', model) for i, model in enumerate(ann_models)]

# Create a stacking ensemble with ANN models
ann_stack_3 = VotingClassifier(
    estimators=estimators,
    voting='soft'
)

cv = StratifiedKFold(n_splits=5, shuffle=True, random_state=42)
scores = cross_val_score(ann_stack_3, X_train, y_train, cv=cv, scoring='accuracy')



In [None]:
scores

array([0.87004156, 0.87041934, 0.87117491, 0.88057445, 0.88586546])

In [None]:
print(f'Mean accuracy: {round(scores.mean() * 100, 2)}% ± {round(scores.std() * 100, 2)}')

Mean accuracy: 87.56% ± 0.64


## Heterogeneous Voting Ensemble

In [17]:
models_to_test = best_models.copy()
models_to_delete = ['MLP','LVQ','DTR','SVM']
for model_name in models_to_delete:
    models_to_test.pop(model_name)
print(models_to_test.keys())

dict_keys(['KNN', 'RF', 'XGB', 'LGBM'])


In [18]:
model_names = list(models_to_test.keys())

    # Generate all possible subsets of models
all_combinations = [
    list(combo) for r in range(2, 5)
    for combo in combinations(model_names, r)
]

all_combinations

[['KNN', 'RF'],
 ['KNN', 'XGB'],
 ['KNN', 'LGBM'],
 ['RF', 'XGB'],
 ['RF', 'LGBM'],
 ['XGB', 'LGBM'],
 ['KNN', 'RF', 'XGB'],
 ['KNN', 'RF', 'LGBM'],
 ['KNN', 'XGB', 'LGBM'],
 ['RF', 'XGB', 'LGBM'],
 ['KNN', 'RF', 'XGB', 'LGBM']]

In [19]:
import warnings

def optimize_ensemble_model(X, y, models_to_test, n_trials=30, cv_folds=5, scoring='accuracy'):
    """
    Optimize a voting ensemble with 2 to 4 classifier pipelines.

    Parameters:
    - X (pd.DataFrame): Feature matrix.
    - y (pd.Series): Target vector.
    - pipelines_to_test (dict): dictionary with the model names as keys and the classifier pipelines as items.
    - n_trials (int): Number of optimization trials.
    - cv_folds (int): Number of cross-validation folds.
    - scoring (str): Scoring metric for cross-validation.

    Returns:
    - study.best_trial: The best trial from the optimization study.
    """
    warnings.filterwarnings('ignore')
    model_names = list(models_to_test.keys())

    # Generate all possible subsets of models
    all_combinations = [
        list(combo) for r in range(2, 5)
        for combo in combinations(model_names, r)
    ]

    print(f'All these combinations will be tested: {all_combinations}')

    def objective(trial):
        # Select a combination of models
        selected_models = trial.suggest_categorical('model_combination', all_combinations)
        ensemble_type = trial.suggest_categorical('ensemble_type', ['voting','stack'])

        # Build the VotingClassifier with the selected models
        estimators = [
            (f'pipeline_{i+1}', models_to_test[model])
            for i, model in enumerate(selected_models)
        ]

        if ensemble_type == 'voting':
            ensemble = VotingClassifier(estimators=estimators, voting='soft')
        else:
            ensemble = StackingClassifier(estimators=estimators,final_estimator=LogisticRegression())

        # Perform cross-validation
        cv = StratifiedKFold(n_splits=cv_folds, shuffle=True, random_state=42)
        scores = cross_val_score(ensemble, X, y, cv=cv, scoring=scoring, error_score='raise')
        return scores.mean()

    # Create and run the Optuna study
    study = optuna.create_study(study_name=f'optimization_voting_model', direction="maximize")
    study.optimize(objective, n_trials=n_trials)

    # Print the best trial
    print("Best trial:")
    print(f"Value: {study.best_trial.value}")
    print("Params:")
    for key, value in study.best_trial.params.items():
        print(f"  {key}: {value}")

    return study.best_trial

In [20]:
optimize_ensemble_model(X_train, y_train, models_to_test, n_trials=50)

[I 2024-12-01 09:38:53,031] A new study created in memory with name: optimization_voting_model


All these combinations will be tested: [['KNN', 'RF'], ['KNN', 'XGB'], ['KNN', 'LGBM'], ['RF', 'XGB'], ['RF', 'LGBM'], ['XGB', 'LGBM'], ['KNN', 'RF', 'XGB'], ['KNN', 'RF', 'LGBM'], ['KNN', 'XGB', 'LGBM'], ['RF', 'XGB', 'LGBM'], ['KNN', 'RF', 'XGB', 'LGBM']]


  File "c:\Users\giull\AppData\Local\Programs\Python\Python312\Lib\site-packages\joblib\externals\loky\backend\context.py", line 227, in _count_physical_cores
    cpu_info = subprocess.run(
               ^^^^^^^^^^^^^^^
  File "c:\Users\giull\AppData\Local\Programs\Python\Python312\Lib\subprocess.py", line 548, in run
    with Popen(*popenargs, **kwargs) as process:
         ^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "c:\Users\giull\AppData\Local\Programs\Python\Python312\Lib\subprocess.py", line 1026, in __init__
    self._execute_child(args, executable, preexec_fn, close_fds,
  File "c:\Users\giull\AppData\Local\Programs\Python\Python312\Lib\subprocess.py", line 1538, in _execute_child
    hp, ht, pid, tid = _winapi.CreateProcess(executable, args,
                       ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^


[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000830 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000236 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM

[I 2024-12-01 09:39:46,913] Trial 0 finished with value: 0.8765217458347146 and parameters: {'model_combination': ['KNN', 'RF', 'LGBM'], 'ensemble_type': 'voting'}. Best is trial 0 with value: 0.8765217458347146.
[I 2024-12-01 09:47:04,229] Trial 1 finished with value: 0.8749350439080052 and parameters: {'model_combination': ['KNN', 'RF'], 'ensemble_type': 'stack'}. Best is trial 0 with value: 0.8765217458347146.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001716 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 5541, number of negative: 2927
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000264 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 8468, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654346 -> initscore=0.638197
[LightGBM] [Info] Start training from score 0.638197
[LightGBM] [Info] Num

[I 2024-12-01 09:54:46,880] Trial 2 finished with value: 0.8824159811261112 and parameters: {'model_combination': ['XGB', 'LGBM'], 'ensemble_type': 'stack'}. Best is trial 2 with value: 0.8824159811261112.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002588 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 5541, number of negative: 2927
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002984 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 8468, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654346 -> initscore=0.638197
[LightGBM] [Info] Start training from score 0.638197
[LightGBM] [Info] Num

[I 2024-12-01 10:13:24,021] Trial 3 finished with value: 0.8815093514213812 and parameters: {'model_combination': ['KNN', 'XGB', 'LGBM'], 'ensemble_type': 'stack'}. Best is trial 2 with value: 0.8824159811261112.
[I 2024-12-01 10:20:00,245] Trial 4 finished with value: 0.8771264892642192 and parameters: {'model_combination': ['KNN', 'RF', 'XGB'], 'ensemble_type': 'voting'}. Best is trial 2 with value: 0.8824159811261112.
[I 2024-12-01 10:21:50,775] Trial 5 finished with value: 0.8655644333878453 and parameters: {'model_combination': ['KNN', 'RF'], 'ensemble_type': 'voting'}. Best is trial 2 with value: 0.8824159811261112.
[I 2024-12-01 10:36:56,576] Trial 6 finished with value: 0.875161715611821 and parameters: {'model_combination': ['KNN', 'RF'], 'ensemble_type': 'stack'}. Best is trial 2 with value: 0.8824159811261112.
[I 2024-12-01 10:44:24,866] Trial 7 finished with value: 0.8764464170422398 and parameters: {'model_combination': ['KNN', 'RF', 'XGB'], 'ensemble_type': 'voting'}. Bes

[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002473 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 5541, number of negative: 2927
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000500 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 8468, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654346 -> initscore=0.638197
[LightGBM] [Info] Start training from score 0.638197
[LightGBM] [Info] Num

[I 2024-12-01 10:45:18,702] Trial 8 finished with value: 0.8790907774770907 and parameters: {'model_combination': ['KNN', 'LGBM'], 'ensemble_type': 'stack'}. Best is trial 2 with value: 0.8824159811261112.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001979 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.003287 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Nu

[I 2024-12-01 10:52:10,019] Trial 9 finished with value: 0.8807536077437315 and parameters: {'model_combination': ['KNN', 'RF', 'XGB', 'LGBM'], 'ensemble_type': 'voting'}. Best is trial 2 with value: 0.8824159811261112.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001830 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 5541, number of negative: 2927
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000412 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 8468, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654346 -> initscore=0.638197
[LightGBM] [Info] Start training from score 0.638197
[LightGBM] [Info] Num

[I 2024-12-01 11:08:48,614] Trial 10 finished with value: 0.882416152457709 and parameters: {'model_combination': ['XGB', 'LGBM'], 'ensemble_type': 'stack'}. Best is trial 10 with value: 0.882416152457709.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000732 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 5541, number of negative: 2927
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000454 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 8468, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654346 -> initscore=0.638197
[LightGBM] [Info] Start training from score 0.638197
[LightGBM] [Info] Num

[I 2024-12-01 11:19:34,533] Trial 11 finished with value: 0.8821893665328281 and parameters: {'model_combination': ['XGB', 'LGBM'], 'ensemble_type': 'stack'}. Best is trial 10 with value: 0.882416152457709.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000987 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 5541, number of negative: 2927
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000518 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 8468, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654346 -> initscore=0.638197
[LightGBM] [Info] Start training from score 0.638197
[LightGBM] [Info] Num

[I 2024-12-01 11:51:18,670] Trial 12 finished with value: 0.8811313082509585 and parameters: {'model_combination': ['XGB', 'LGBM'], 'ensemble_type': 'stack'}. Best is trial 10 with value: 0.882416152457709.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000592 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 5541, number of negative: 2927
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000245 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 8468, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654346 -> initscore=0.638197
[LightGBM] [Info] Start training from score 0.638197
[LightGBM] [Info] Num

[I 2024-12-01 11:58:23,776] Trial 13 finished with value: 0.8833984821733758 and parameters: {'model_combination': ['XGB', 'LGBM'], 'ensemble_type': 'stack'}. Best is trial 13 with value: 0.8833984821733758.




[I 2024-12-01 12:14:12,449] Trial 14 finished with value: 0.8815092657555823 and parameters: {'model_combination': ['RF', 'XGB'], 'ensemble_type': 'stack'}. Best is trial 13 with value: 0.8833984821733758.
[I 2024-12-01 12:21:48,823] Trial 15 finished with value: 0.8799982067292769 and parameters: {'model_combination': ['KNN', 'XGB'], 'ensemble_type': 'stack'}. Best is trial 13 with value: 0.8833984821733758.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002330 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 5541, number of negative: 2927
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.004260 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 8468, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654346 -> initscore=0.638197
[LightGBM] [Info] Start training from score 0.638197
[LightGBM] [Info] Num

[I 2024-12-01 12:35:17,811] Trial 16 finished with value: 0.8831715820274295 and parameters: {'model_combination': ['XGB', 'LGBM'], 'ensemble_type': 'stack'}. Best is trial 13 with value: 0.8833984821733758.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000605 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 5541, number of negative: 2927
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000284 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 8468, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654346 -> initscore=0.638197
[LightGBM] [Info] Start training from score 0.638197
[LightGBM] [Info] Num

[I 2024-12-01 12:40:37,499] Trial 17 finished with value: 0.8820381949530851 and parameters: {'model_combination': ['XGB', 'LGBM'], 'ensemble_type': 'stack'}. Best is trial 13 with value: 0.8833984821733758.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000280 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 5541, number of negative: 2927
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002611 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 8468, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654346 -> initscore=0.638197
[LightGBM] [Info] Start training from score 0.638197
[LightGBM] [Info] Num

[I 2024-12-01 13:03:09,856] Trial 18 finished with value: 0.8818116089150683 and parameters: {'model_combination': ['RF', 'XGB', 'LGBM'], 'ensemble_type': 'stack'}. Best is trial 13 with value: 0.8833984821733758.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.004585 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 5541, number of negative: 2927
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001081 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 8468, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654346 -> initscore=0.638197
[LightGBM] [Info] Start training from score 0.638197
[LightGBM] [Info] Num

[I 2024-12-01 13:15:37,864] Trial 19 finished with value: 0.8803759072365042 and parameters: {'model_combination': ['RF', 'LGBM'], 'ensemble_type': 'stack'}. Best is trial 13 with value: 0.8833984821733758.


[LightGBM] [Info] Number of positive: 6927, number of negative: 3659
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000597 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 10586, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654355 -> initscore=0.638237
[LightGBM] [Info] Start training from score 0.638237
[LightGBM] [Info] Number of positive: 5541, number of negative: 2927
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002300 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2550
[LightGBM] [Info] Number of data points in the train set: 8468, number of used features: 10
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.654346 -> initscore=0.638197
[LightGBM] [Info] Start training from score 0.638197
[LightGBM] [Info] Num

[I 2024-12-01 13:25:16,372] Trial 20 finished with value: 0.8797711352517332 and parameters: {'model_combination': ['RF', 'LGBM'], 'ensemble_type': 'stack'}. Best is trial 13 with value: 0.8833984821733758.




[W 2024-12-01 13:25:20,115] Trial 21 failed with parameters: {'model_combination': ['XGB', 'LGBM'], 'ensemble_type': 'stack'} because of the following error: KeyboardInterrupt().
Traceback (most recent call last):
  File "c:\Users\giull\AppData\Local\Programs\Python\Python312\Lib\site-packages\optuna\study\_optimize.py", line 197, in _run_trial
    value_or_values = func(trial)
                      ^^^^^^^^^^^
  File "C:\Users\giull\AppData\Local\Temp\ipykernel_27916\3586193229.py", line 47, in objective
    scores = cross_val_score(ensemble, X, y, cv=cv, scoring=scoring, error_score='raise')
             ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "c:\Users\giull\AppData\Local\Programs\Python\Python312\Lib\site-packages\sklearn\model_selection\_validation.py", line 562, in cross_val_score
    cv_results = cross_validate(
                 ^^^^^^^^^^^^^^^
  File "c:\Users\giull\AppData\Local\Programs\Python\Python312\Lib\site-packages\sklearn\uti

KeyboardInterrupt: 