# Hyperparameter Optimization

## Imports

In [1]:
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
from sklearn.model_selection import train_test_split
import sys
import os
sys.path.append(os.path.abspath('../modules'))
from optimizer import optimize_pipeline
from preproc import PhishingDatasetPreproc

## Setup

In [2]:
np.random.seed(42)

In [3]:
prep = PhishingDatasetPreproc()
dataset, X, y = prep.basic_operations()

X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.25)

In [4]:
best_trials = {}
model_names = ['KNN','DTR', 'SVM', 'RF', 'XGB', 'LGBM', 'MLP', 'LVQ']
selectors = ['tree', 'pca', 'univariate', 'l1']

## KNN

In [5]:
best_trials['KNN'] = optimize_pipeline(X_train, y_train, 'KNN', selectors)

[I 2024-11-21 21:45:33,519] A new study created in memory with name: optimization_KNN
[I 2024-11-21 21:45:34,879] Trial 0 finished with value: 0.9422265218557839 and parameters: {'fs_method': 'pca', 'selector__n_components': 15, 'n_neighbors': 3, 'weights': 'uniform', 'algorithm': 'kd_tree', 'metric': 'manhattan'}. Best is trial 0 with value: 0.9422265218557839.
[I 2024-11-21 21:45:37,262] Trial 1 finished with value: 0.9387281131322297 and parameters: {'fs_method': 'l1', 'selector__C': 0.037795630022668024, 'n_neighbors': 9, 'weights': 'uniform', 'algorithm': 'brute', 'metric': 'manhattan'}. Best is trial 0 with value: 0.9422265218557839.
[WinError 2] O sistema não pode encontrar o arquivo especificado
  File "c:\Users\giull\AppData\Local\Programs\Python\Python312\Lib\site-packages\joblib\externals\loky\backend\context.py", line 227, in _count_physical_cores
    cpu_info = subprocess.run(
               ^^^^^^^^^^^^^^^
  File "c:\Users\giull\AppData\Local\Programs\Python\Python312\Lib

Best trial:
Value: 0.9611623843625189
Params:
  fs_method: l1
  selector__C: 0.3354128676560216
  n_neighbors: 5
  weights: distance
  algorithm: auto
  metric: manhattan


## DTR

In [6]:
best_trials['DTR'] = optimize_pipeline(X_train, y_train, 'DTR', selectors)

[I 2024-11-21 21:51:21,259] A new study created in memory with name: optimization_DTR
[I 2024-11-21 21:51:22,251] Trial 0 finished with value: 0.9263069952905199 and parameters: {'fs_method': 'l1', 'selector__C': 0.6214274066222929, 'criterion': 'gini', 'splitter': 'random', 'max_depth': 16, 'min_samples_split': 7, 'min_samples_leaf': 2, 'max_features': 'sqrt'}. Best is trial 0 with value: 0.9263069952905199.
[I 2024-11-21 21:51:29,214] Trial 1 finished with value: 0.8744423624911019 and parameters: {'fs_method': 'univariate', 'selector__k': 7, 'criterion': 'entropy', 'splitter': 'random', 'max_depth': 3, 'min_samples_split': 4, 'min_samples_leaf': 2, 'max_features': 'log2'}. Best is trial 0 with value: 0.9263069952905199.
[I 2024-11-21 21:51:29,940] Trial 2 finished with value: 0.9211180598424648 and parameters: {'fs_method': 'l1', 'selector__C': 0.321605194225023, 'criterion': 'gini', 'splitter': 'random', 'max_depth': 17, 'min_samples_split': 6, 'min_samples_leaf': 2, 'max_features'

Best trial:
Value: 0.9353515677544934
Params:
  fs_method: tree
  selector__n_estimators: 112
  criterion: entropy
  splitter: random
  max_depth: 11
  min_samples_split: 4
  min_samples_leaf: 2
  max_features: log2


## LVQ

In [5]:
best_trials['LVQ'] = optimize_pipeline(X_train, y_train, 'LVQ', selectors)

[I 2024-11-21 23:45:00,208] A new study created in memory with name: optimization_LVQ
[I 2024-11-21 23:46:03,492] Trial 0 finished with value: 0.5164748191499959 and parameters: {'fs_method': 'tree', 'selector__n_estimators': 12, 'n_codebooks': 9, 'lrate': 0.07851678281285167, 'epochs': 23}. Best is trial 0 with value: 0.5164748191499959.
[I 2024-11-21 23:47:23,056] Trial 1 finished with value: 0.8832464802506488 and parameters: {'fs_method': 'pca', 'selector__n_components': 26, 'n_codebooks': 8, 'lrate': 0.110930321378087, 'epochs': 26}. Best is trial 1 with value: 0.8832464802506488.
[I 2024-11-21 23:48:57,739] Trial 2 finished with value: 0.8804724894951033 and parameters: {'fs_method': 'pca', 'selector__n_components': 21, 'n_codebooks': 8, 'lrate': 0.2632175752701811, 'epochs': 29}. Best is trial 1 with value: 0.8832464802506488.
[I 2024-11-21 23:49:20,196] Trial 3 finished with value: 0.7445266561526811 and parameters: {'fs_method': 'pca', 'selector__n_components': 19, 'n_codebook

Best trial:
Value: 0.8900018977525811
Params:
  fs_method: pca
  selector__n_components: 25
  n_codebooks: 15
  lrate: 0.23668848148998023
  epochs: 20


## SVM

In [None]:
best_trials['SVM'] = optimize_pipeline(X_train, y_train, 'SVM', selectors)

[I 2024-11-21 22:51:02,066] A new study created in memory with name: optimization_SVM
[I 2024-11-21 22:51:11,692] Trial 0 finished with value: 0.9340243770318132 and parameters: {'fs_method': 'univariate', 'selector__k': 10, 'C': 0.5984723098143647, 'kernel': 'rbf', 'gamma': 'auto'}. Best is trial 0 with value: 0.9340243770318132.
[I 2024-11-21 22:51:17,898] Trial 1 finished with value: 0.8167826767909222 and parameters: {'fs_method': 'univariate', 'selector__k': 11, 'C': 1.8199137153986849, 'kernel': 'linear', 'gamma': 'scale'}. Best is trial 0 with value: 0.9340243770318132.
[I 2024-11-21 22:51:21,639] Trial 2 finished with value: 0.9189469145524176 and parameters: {'fs_method': 'pca', 'selector__n_components': 12, 'C': 0.2202113852543002, 'kernel': 'linear', 'gamma': 'auto'}. Best is trial 0 with value: 0.9340243770318132.
[I 2024-11-21 22:51:29,432] Trial 3 finished with value: 0.9246160323010578 and parameters: {'fs_method': 'univariate', 'selector__k': 28, 'C': 0.1005523443182414

Best trial:
Value: 0.9530816666194047
Params:
  fs_method: univariate
  selector__k: 24
  C: 1.5620891425954675
  kernel: rbf
  gamma: scale


## RF

In [5]:
best_trials['RF'] = optimize_pipeline(X_train, y_train, 'RF', selectors)

[I 2024-11-21 21:56:56,274] A new study created in memory with name: optimization_RF
[I 2024-11-21 21:57:05,459] Trial 0 finished with value: 0.953321830480524 and parameters: {'fs_method': 'univariate', 'selector__k': 18, 'n_estimators': 121, 'criterion': 'entropy', 'max_depth': 16, 'min_samples_split': 10, 'min_samples_leaf': 2, 'max_features': 'sqrt'}. Best is trial 0 with value: 0.953321830480524.
[I 2024-11-21 21:57:08,823] Trial 1 finished with value: 0.9216018776843928 and parameters: {'fs_method': 'l1', 'selector__C': 0.017071916495414452, 'n_estimators': 189, 'criterion': 'entropy', 'max_depth': 3, 'min_samples_split': 8, 'min_samples_leaf': 3, 'max_features': 'log2'}. Best is trial 0 with value: 0.953321830480524.
[I 2024-11-21 21:57:20,982] Trial 2 finished with value: 0.9582676209235584 and parameters: {'fs_method': 'l1', 'selector__C': 0.08265660752588502, 'n_estimators': 382, 'criterion': 'entropy', 'max_depth': 13, 'min_samples_split': 5, 'min_samples_leaf': 2, 'max_feat

Best trial:
Value: 0.9635746387544344
Params:
  fs_method: univariate
  selector__k: 30
  n_estimators: 366
  criterion: entropy
  max_depth: 20
  min_samples_split: 5
  min_samples_leaf: 2
  max_features: sqrt


## LGBM

In [None]:
best_trials['LGBM'] = optimize_pipeline(X_train, y_train, 'LGBM', selectors)

[I 2024-11-21 22:08:14,124] A new study created in memory with name: optimization_LGBM
[WinError 2] O sistema não pode encontrar o arquivo especificado
  File "c:\Users\giull\AppData\Local\Programs\Python\Python312\Lib\site-packages\joblib\externals\loky\backend\context.py", line 227, in _count_physical_cores
    cpu_info = subprocess.run(
               ^^^^^^^^^^^^^^^
  File "c:\Users\giull\AppData\Local\Programs\Python\Python312\Lib\subprocess.py", line 548, in run
    with Popen(*popenargs, **kwargs) as process:
         ^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "c:\Users\giull\AppData\Local\Programs\Python\Python312\Lib\subprocess.py", line 1026, in __init__
    self._execute_child(args, executable, preexec_fn, close_fds,
  File "c:\Users\giull\AppData\Local\Programs\Python\Python312\Lib\subprocess.py", line 1538, in _execute_child
    hp, ht, pid, tid = _winapi.CreateProcess(executable, args,
                       ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000959 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 1275
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 5
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000252 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1275
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 5
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551937 -> initscore=0.208501
[LightGBM] [I

[I 2024-11-21 22:08:15,673] Trial 0 finished with value: 0.9311297590145065 and parameters: {'fs_method': 'pca', 'selector__n_components': 5, 'n_estimators': 99, 'learning_rate': 0.1278381128845586, 'num_leaves': 33, 'max_depth': 17, 'subsample': 0.8200431297622668}. Best is trial 0 with value: 0.9311297590145065.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001469 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 5355
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 21
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001299 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 5355
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 21
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551937 -> initscore=0.208501
[LightGBM] [Info] Start training from score 0.208501
[LightGBM] [Info] Numb

[I 2024-11-21 22:08:18,289] Trial 1 finished with value: 0.9459646581754964 and parameters: {'fs_method': 'pca', 'selector__n_components': 21, 'n_estimators': 76, 'learning_rate': 0.029024095921595633, 'num_leaves': 70, 'max_depth': 10, 'subsample': 0.9674335210537867}. Best is trial 1 with value: 0.9459646581754964.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001156 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 5610
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 22
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001094 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 5610
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 22
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551937 -> initscore=0.208501
[LightGBM] [Info] Start training from score 0.208501
[LightGBM] [Info] Numb

[I 2024-11-21 22:08:19,288] Trial 2 finished with value: 0.9259429321804304 and parameters: {'fs_method': 'pca', 'selector__n_components': 22, 'n_estimators': 151, 'learning_rate': 0.03153655601655566, 'num_leaves': 40, 'max_depth': 3, 'subsample': 0.8562197297960389}. Best is trial 1 with value: 0.9459646581754964.


[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001120 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 5610
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 22
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551937 -> initscore=0.208501
[LightGBM] [Info] Start training from score 0.208501
[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000489 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 27
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 9
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [In

[I 2024-11-21 22:08:27,457] Trial 3 finished with value: 0.9418640583838856 and parameters: {'fs_method': 'univariate', 'selector__k': 9, 'n_estimators': 106, 'learning_rate': 0.04291104160169984, 'num_leaves': 53, 'max_depth': 11, 'subsample': 0.8879199521363214}. Best is trial 1 with value: 0.9459646581754964.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001804 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 86
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 29
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000893 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 86
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 29
[LightGBM] [Info] [binary:Boos

[I 2024-11-21 22:08:30,316] Trial 4 finished with value: 0.9501866850479637 and parameters: {'fs_method': 'l1', 'selector__C': 0.8632653254494367, 'n_estimators': 81, 'learning_rate': 0.021567656090150062, 'num_leaves': 63, 'max_depth': 11, 'subsample': 0.9568837307286882}. Best is trial 4 with value: 0.9501866850479637.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000588 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 42
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 14
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000504 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 42
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 14
[LightGBM] [Info] [binary:Boos

[I 2024-11-21 22:08:31,749] Trial 5 finished with value: 0.9532020030378584 and parameters: {'fs_method': 'l1', 'selector__C': 0.015637744512592765, 'n_estimators': 70, 'learning_rate': 0.08286886325171906, 'num_leaves': 46, 'max_depth': 18, 'subsample': 0.8119352604940672}. Best is trial 5 with value: 0.9532020030378584.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001399 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 6630
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 26
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001233 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 6630
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 26
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551937 -> initscore=0.208501
[LightGBM] [Info] Start training from score 0.208501
[LightGBM] [Info] Numb

[I 2024-11-21 22:08:35,226] Trial 6 finished with value: 0.9581465573968361 and parameters: {'fs_method': 'pca', 'selector__n_components': 26, 'n_estimators': 134, 'learning_rate': 0.03521056697363883, 'num_leaves': 63, 'max_depth': -1, 'subsample': 0.8505107507602928}. Best is trial 6 with value: 0.9581465573968361.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001244 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 68
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 23
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001241 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 68
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 23
[LightGBM] [Info] [binary:Boos

[I 2024-11-21 22:08:42,474] Trial 7 finished with value: 0.9503065124906295 and parameters: {'fs_method': 'univariate', 'selector__k': 23, 'n_estimators': 67, 'learning_rate': 0.04006610178165756, 'num_leaves': 62, 'max_depth': 9, 'subsample': 0.8885623936753102}. Best is trial 6 with value: 0.9581465573968361.


[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001429 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 69
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 23
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551937 -> initscore=0.208501
[LightGBM] [Info] Start training from score 0.208501
[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000276 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1785
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 7
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [In

[I 2024-11-21 22:08:42,949] Trial 8 finished with value: 0.923892704995452 and parameters: {'fs_method': 'pca', 'selector__n_components': 7, 'n_estimators': 114, 'learning_rate': 0.11202857254111544, 'num_leaves': 39, 'max_depth': 3, 'subsample': 0.8156592471538073}. Best is trial 6 with value: 0.9581465573968361.


[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000249 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1785
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 7
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551937 -> initscore=0.208501
[LightGBM] [Info] Start training from score 0.208501
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000286 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1785
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 7
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551937 -> initscore=0.208501
[LightGBM] [Info] Start training from score 0.208501
[LightGBM] [Info] Number

[I 2024-11-21 22:08:44,364] Trial 9 finished with value: 0.949582967052543 and parameters: {'fs_method': 'pca', 'selector__n_components': 21, 'n_estimators': 88, 'learning_rate': 0.03326979137378036, 'num_leaves': 63, 'max_depth': 16, 'subsample': 0.9948137889435262}. Best is trial 6 with value: 0.9581465573968361.


[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001035 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 5355
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 21
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551937 -> initscore=0.208501
[LightGBM] [Info] Start training from score 0.208501
[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000197 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 18
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 6
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [In

[I 2024-11-21 22:08:47,189] Trial 10 finished with value: 0.9347486495781681 and parameters: {'fs_method': 'tree', 'selector__n_estimators': 26, 'n_estimators': 199, 'learning_rate': 0.011838591827822929, 'num_leaves': 54, 'max_depth': -1, 'subsample': 0.922113783839205}. Best is trial 6 with value: 0.9581465573968361.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000392 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 27
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 9
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000489 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 30
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 10
[LightGBM] [Info] [binary:Boost

[I 2024-11-21 22:08:48,662] Trial 11 finished with value: 0.9464473853550215 and parameters: {'fs_method': 'l1', 'selector__C': 0.010465681173973144, 'n_estimators': 147, 'learning_rate': 0.07761140085993808, 'num_leaves': 45, 'max_depth': 19, 'subsample': 0.8472895699363021}. Best is trial 6 with value: 0.9581465573968361.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000433 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 27
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 9
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000508 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 33
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 11
[LightGBM] [Info] [binary:Boost

[I 2024-11-21 22:08:50,495] Trial 12 finished with value: 0.9468092671403051 and parameters: {'fs_method': 'l1', 'selector__C': 0.0108162168545878, 'n_estimators': 139, 'learning_rate': 0.07185537210939469, 'num_leaves': 47, 'max_depth': 14, 'subsample': 0.8054214702023358}. Best is trial 6 with value: 0.9581465573968361.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000189 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 18
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 6
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000294 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 18
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 6
[LightGBM] [Info] [binary:BoostF

[I 2024-11-21 22:09:05,354] Trial 13 finished with value: 0.9363167312702363 and parameters: {'fs_method': 'tree', 'selector__n_estimators': 490, 'n_estimators': 178, 'learning_rate': 0.1855081907448191, 'num_leaves': 56, 'max_depth': 5, 'subsample': 0.8502893983104871}. Best is trial 6 with value: 0.9581465573968361.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000987 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 74
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 25
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000935 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 71
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 24
[LightGBM] [Info] [binary:Boos

[I 2024-11-21 22:09:07,129] Trial 14 finished with value: 0.9591120117558866 and parameters: {'fs_method': 'l1', 'selector__C': 0.07875546610059078, 'n_estimators': 56, 'learning_rate': 0.07133707541480845, 'num_leaves': 69, 'max_depth': -1, 'subsample': 0.8428903254004113}. Best is trial 14 with value: 0.9591120117558866.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000931 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 80
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 27
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001133 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 77
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 26
[LightGBM] [Info] [binary:Boos

[I 2024-11-21 22:09:09,133] Trial 15 finished with value: 0.9435523310727538 and parameters: {'fs_method': 'l1', 'selector__C': 0.13483464590666028, 'n_estimators': 50, 'learning_rate': 0.0177686027986244, 'num_leaves': 70, 'max_depth': -1, 'subsample': 0.8682574075517842}. Best is trial 14 with value: 0.9591120117558866.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000158 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 18
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 6
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000221 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 18
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 6
[LightGBM] [Info] [binary:BoostF

[I 2024-11-21 22:09:14,099] Trial 16 finished with value: 0.9264266773115317 and parameters: {'fs_method': 'tree', 'selector__n_estimators': 187, 'n_estimators': 129, 'learning_rate': 0.0637079082909142, 'num_leaves': 59, 'max_depth': 2, 'subsample': 0.9183594721018589}. Best is trial 14 with value: 0.9591120117558866.


[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000216 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 18
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 6
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551937 -> initscore=0.208501
[LightGBM] [Info] Start training from score 0.208501
[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001173 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 30
[LightGBM] [Info] [binary:Boost

[I 2024-11-21 22:09:21,681] Trial 17 finished with value: 0.9652632749974369 and parameters: {'fs_method': 'univariate', 'selector__k': 30, 'n_estimators': 167, 'learning_rate': 0.05443960166968526, 'num_leaves': 67, 'max_depth': 6, 'subsample': 0.8355113663938957}. Best is trial 17 with value: 0.9652632749974369.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001259 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001053 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 30
[LightGBM] [Info] [binary:Boos

[I 2024-11-21 22:09:29,209] Trial 18 finished with value: 0.9640569296689986 and parameters: {'fs_method': 'univariate', 'selector__k': 30, 'n_estimators': 165, 'learning_rate': 0.056778837902622815, 'num_leaves': 67, 'max_depth': 6, 'subsample': 0.8334495167089551}. Best is trial 17 with value: 0.9652632749974369.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001442 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001556 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 30
[LightGBM] [Info] [binary:Boos

[I 2024-11-21 22:09:37,986] Trial 19 finished with value: 0.9658667021495504 and parameters: {'fs_method': 'univariate', 'selector__k': 30, 'n_estimators': 165, 'learning_rate': 0.054166269925100693, 'num_leaves': 66, 'max_depth': 7, 'subsample': 0.8285990854223357}. Best is trial 19 with value: 0.9658667021495504.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001126 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001699 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 30
[LightGBM] [Info] [binary:Boos

[I 2024-11-21 22:09:46,608] Trial 20 finished with value: 0.9663487749316335 and parameters: {'fs_method': 'univariate', 'selector__k': 30, 'n_estimators': 188, 'learning_rate': 0.052485869588273115, 'num_leaves': 58, 'max_depth': 7, 'subsample': 0.8731825005649948}. Best is trial 20 with value: 0.9663487749316335.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001363 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000876 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 30
[LightGBM] [Info] [binary:Boos

[I 2024-11-21 22:09:55,430] Trial 21 finished with value: 0.967555192970899 and parameters: {'fs_method': 'univariate', 'selector__k': 30, 'n_estimators': 192, 'learning_rate': 0.053279746151217174, 'num_leaves': 59, 'max_depth': 7, 'subsample': 0.8740361214635944}. Best is trial 21 with value: 0.967555192970899.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001959 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001603 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 30
[LightGBM] [Info] [binary:Boos

[I 2024-11-21 22:10:05,489] Trial 22 finished with value: 0.9696054201558775 and parameters: {'fs_method': 'univariate', 'selector__k': 30, 'n_estimators': 193, 'learning_rate': 0.09789602423785873, 'num_leaves': 58, 'max_depth': 8, 'subsample': 0.8743542470902586}. Best is trial 22 with value: 0.9696054201558775.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001372 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 68
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 23
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001476 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 69
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 23
[LightGBM] [Info] [binary:Boos

[I 2024-11-21 22:10:15,135] Trial 23 finished with value: 0.9668317202436395 and parameters: {'fs_method': 'univariate', 'selector__k': 23, 'n_estimators': 198, 'learning_rate': 0.10715538462719064, 'num_leaves': 58, 'max_depth': 8, 'subsample': 0.9079759843132417}. Best is trial 22 with value: 0.9696054201558775.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001273 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 62
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 21
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001012 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 62
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 21
[LightGBM] [Info] [binary:Boos

[I 2024-11-21 22:10:23,649] Trial 24 finished with value: 0.9626099842144795 and parameters: {'fs_method': 'univariate', 'selector__k': 21, 'n_estimators': 199, 'learning_rate': 0.11256518934202721, 'num_leaves': 49, 'max_depth': 13, 'subsample': 0.9122013248787937}. Best is trial 22 with value: 0.9696054201558775.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001226 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 72
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 24
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001671 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 71
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 24
[LightGBM] [Info] [binary:Boos

[I 2024-11-21 22:10:34,164] Trial 25 finished with value: 0.9670727566346811 and parameters: {'fs_method': 'univariate', 'selector__k': 24, 'n_estimators': 183, 'learning_rate': 0.1591564757063465, 'num_leaves': 52, 'max_depth': 9, 'subsample': 0.9003786896382282}. Best is trial 22 with value: 0.9696054201558775.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000888 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 74
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 25
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001522 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 74
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 25
[LightGBM] [Info] [binary:Boos

[I 2024-11-21 22:10:44,001] Trial 26 finished with value: 0.9638155297238225 and parameters: {'fs_method': 'univariate', 'selector__k': 25, 'n_estimators': 181, 'learning_rate': 0.1436397941169162, 'num_leaves': 51, 'max_depth': 13, 'subsample': 0.9335524765657792}. Best is trial 22 with value: 0.9696054201558775.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001139 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 47
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 16
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001310 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 48
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 16
[LightGBM] [Info] [binary:Boos

[I 2024-11-21 22:10:51,112] Trial 27 finished with value: 0.9554937755896666 and parameters: {'fs_method': 'univariate', 'selector__k': 16, 'n_estimators': 185, 'learning_rate': 0.19953964419680648, 'num_leaves': 54, 'max_depth': 4, 'subsample': 0.889323859074506}. Best is trial 22 with value: 0.9696054201558775.


[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000799 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 47
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 16
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551937 -> initscore=0.208501
[LightGBM] [Info] Start training from score 0.208501
[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000901 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 77
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 26
[LightGBM] [Info] [binary:Boos

[I 2024-11-21 22:11:00,313] Trial 28 finished with value: 0.9685200656433345 and parameters: {'fs_method': 'univariate', 'selector__k': 26, 'n_estimators': 175, 'learning_rate': 0.15444494711951126, 'num_leaves': 60, 'max_depth': 9, 'subsample': 0.8704473132318452}. Best is trial 22 with value: 0.9696054201558775.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.002076 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 80
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 27
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001527 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 80
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 27
[LightGBM] [Info] [binary:Boos

[I 2024-11-21 22:11:09,104] Trial 29 finished with value: 0.9685199929325077 and parameters: {'fs_method': 'univariate', 'selector__k': 27, 'n_estimators': 156, 'learning_rate': 0.0926133087600812, 'num_leaves': 61, 'max_depth': 12, 'subsample': 0.8737446845308107}. Best is trial 22 with value: 0.9696054201558775.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000863 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 50
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 17
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000983 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 51
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 17
[LightGBM] [Info] [binary:Boos

[I 2024-11-21 22:11:16,669] Trial 30 finished with value: 0.9569414481524543 and parameters: {'fs_method': 'univariate', 'selector__k': 17, 'n_estimators': 155, 'learning_rate': 0.0937426685985294, 'num_leaves': 32, 'max_depth': 16, 'subsample': 0.86296251659862}. Best is trial 22 with value: 0.9696054201558775.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001872 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 80
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 27
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001600 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 80
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 27
[LightGBM] [Info] [binary:Boos

[I 2024-11-21 22:11:25,829] Trial 31 finished with value: 0.9683998746465345 and parameters: {'fs_method': 'univariate', 'selector__k': 27, 'n_estimators': 172, 'learning_rate': 0.13625278362692672, 'num_leaves': 60, 'max_depth': 11, 'subsample': 0.8753316460534267}. Best is trial 22 with value: 0.9696054201558775.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001195 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 77
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 26
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001495 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 78
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 26
[LightGBM] [Info] [binary:Boos

[I 2024-11-21 22:11:35,542] Trial 32 finished with value: 0.9680371930421556 and parameters: {'fs_method': 'univariate', 'selector__k': 26, 'n_estimators': 172, 'learning_rate': 0.1346068209776003, 'num_leaves': 61, 'max_depth': 11, 'subsample': 0.8846585791173676}. Best is trial 22 with value: 0.9696054201558775.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001544 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 80
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 27
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001375 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 80
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 27
[LightGBM] [Info] [binary:Boos

[I 2024-11-21 22:11:44,143] Trial 33 finished with value: 0.9686407656159226 and parameters: {'fs_method': 'univariate', 'selector__k': 27, 'n_estimators': 158, 'learning_rate': 0.15610131086178022, 'num_leaves': 56, 'max_depth': 13, 'subsample': 0.8627774655892007}. Best is trial 22 with value: 0.9696054201558775.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001849 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 77
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 26
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000890 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 77
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 26
[LightGBM] [Info] [binary:Boos

[I 2024-11-21 22:11:52,748] Trial 34 finished with value: 0.9692438292139013 and parameters: {'fs_method': 'univariate', 'selector__k': 26, 'n_estimators': 156, 'learning_rate': 0.16435920165465964, 'num_leaves': 56, 'max_depth': 13, 'subsample': 0.8623172436430803}. Best is trial 22 with value: 0.9696054201558775.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000731 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 60
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 20
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001184 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 60
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 20
[LightGBM] [Info] [binary:Boos

[I 2024-11-21 22:12:00,908] Trial 35 finished with value: 0.9577854027198212 and parameters: {'fs_method': 'univariate', 'selector__k': 20, 'n_estimators': 144, 'learning_rate': 0.16828518246975277, 'num_leaves': 56, 'max_depth': 15, 'subsample': 0.8615174825930493}. Best is trial 22 with value: 0.9696054201558775.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000158 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 18
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 6
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000135 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 18
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 6
[LightGBM] [Info] [binary:BoostF

[I 2024-11-21 22:12:04,109] Trial 36 finished with value: 0.9363167312702363 and parameters: {'fs_method': 'tree', 'selector__n_estimators': 13, 'n_estimators': 158, 'learning_rate': 0.15678118991767995, 'num_leaves': 56, 'max_depth': 10, 'subsample': 0.9000554578171666}. Best is trial 22 with value: 0.9696054201558775.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001974 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 80
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 27
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000988 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 81
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 27
[LightGBM] [Info] [binary:Boos

[I 2024-11-21 22:12:13,214] Trial 37 finished with value: 0.9683992929599196 and parameters: {'fs_method': 'univariate', 'selector__k': 27, 'n_estimators': 123, 'learning_rate': 0.1233118835002912, 'num_leaves': 65, 'max_depth': 13, 'subsample': 0.8584986358820272}. Best is trial 22 with value: 0.9696054201558775.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000874 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3315
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 13
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000743 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3315
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 13
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551937 -> initscore=0.208501
[LightGBM] [Info] Start training from score 0.208501
[LightGBM] [Info] Numb

[I 2024-11-21 22:12:32,173] Trial 38 finished with value: 0.9591121571775402 and parameters: {'fs_method': 'pca', 'selector__n_components': 13, 'n_estimators': 176, 'learning_rate': 0.18167227438089198, 'num_leaves': 49, 'max_depth': 10, 'subsample': 0.9452884440695493}. Best is trial 22 with value: 0.9696054201558775.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000991 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 42
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 14
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001120 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 42
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 14
[LightGBM] [Info] [binary:Boos

[I 2024-11-21 22:12:40,415] Trial 39 finished with value: 0.9516345757432318 and parameters: {'fs_method': 'univariate', 'selector__k': 14, 'n_estimators': 118, 'learning_rate': 0.09591055509607878, 'num_leaves': 43, 'max_depth': 17, 'subsample': 0.8840071188131501}. Best is trial 22 with value: 0.9696054201558775.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001362 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 80
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 27
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001521 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 80
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 27
[LightGBM] [Info] [binary:Boos

[I 2024-11-21 22:12:48,199] Trial 40 finished with value: 0.9662285112240069 and parameters: {'fs_method': 'univariate', 'selector__k': 27, 'n_estimators': 97, 'learning_rate': 0.1227323306116656, 'num_leaves': 36, 'max_depth': 12, 'subsample': 0.8243673777671556}. Best is trial 22 with value: 0.9696054201558775.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001091 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 80
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 27
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001885 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 80
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 27
[LightGBM] [Info] [binary:Boos

[I 2024-11-21 22:13:06,691] Trial 41 finished with value: 0.9676758929434868 and parameters: {'fs_method': 'univariate', 'selector__k': 27, 'n_estimators': 161, 'learning_rate': 0.09089153091907123, 'num_leaves': 57, 'max_depth': 12, 'subsample': 0.856086239489726}. Best is trial 22 with value: 0.9696054201558775.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001400 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 83
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 28
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000962 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 83
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 28
[LightGBM] [Info] [binary:Boos

[I 2024-11-21 22:13:15,479] Trial 42 finished with value: 0.9673135021824155 and parameters: {'fs_method': 'univariate', 'selector__k': 28, 'n_estimators': 155, 'learning_rate': 0.1535698576473712, 'num_leaves': 54, 'max_depth': 14, 'subsample': 0.8413094529536447}. Best is trial 22 with value: 0.9696054201558775.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000859 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 62
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 21
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001136 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 62
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 21
[LightGBM] [Info] [binary:Boos

[I 2024-11-21 22:13:35,234] Trial 43 finished with value: 0.9630924932615242 and parameters: {'fs_method': 'univariate', 'selector__k': 21, 'n_estimators': 139, 'learning_rate': 0.10054591309489093, 'num_leaves': 61, 'max_depth': 9, 'subsample': 0.8805026633317007}. Best is trial 22 with value: 0.9696054201558775.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000739 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3315
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 13
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000874 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 3315
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 13
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551937 -> initscore=0.208501
[LightGBM] [Info] Start training from score 0.208501
[LightGBM] [Info] Numb

[I 2024-11-21 22:13:39,279] Trial 44 finished with value: 0.9580264391108629 and parameters: {'fs_method': 'pca', 'selector__n_components': 13, 'n_estimators': 148, 'learning_rate': 0.12308478965410462, 'num_leaves': 64, 'max_depth': 12, 'subsample': 0.8938492131966824}. Best is trial 22 with value: 0.9696054201558775.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001968 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 75
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 25
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000953 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 74
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 25
[LightGBM] [Info] [binary:Boos

[I 2024-11-21 22:13:50,529] Trial 45 finished with value: 0.967072902056335 and parameters: {'fs_method': 'univariate', 'selector__k': 25, 'n_estimators': 191, 'learning_rate': 0.08218204050498273, 'num_leaves': 62, 'max_depth': 20, 'subsample': 0.8667405836782768}. Best is trial 22 with value: 0.9696054201558775.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000924 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 71
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 24
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001734 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 72
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 24
[LightGBM] [Info] [binary:Boos

[I 2024-11-21 22:14:01,824] Trial 46 finished with value: 0.9669527837703618 and parameters: {'fs_method': 'univariate', 'selector__k': 24, 'n_estimators': 172, 'learning_rate': 0.1727972661196483, 'num_leaves': 55, 'max_depth': 15, 'subsample': 0.8535405904299547}. Best is trial 22 with value: 0.9696054201558775.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000167 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 18
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 6
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000258 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 18
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 6
[LightGBM] [Info] [binary:BoostF

[I 2024-11-21 22:14:06,874] Trial 47 finished with value: 0.9363167312702363 and parameters: {'fs_method': 'tree', 'selector__n_estimators': 64, 'n_estimators': 151, 'learning_rate': 0.19591982085099463, 'num_leaves': 52, 'max_depth': 8, 'subsample': 0.8965541651230662}. Best is trial 22 with value: 0.9696054201558775.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001529 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 7140
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 28
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001346 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 7140
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 28
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551937 -> initscore=0.208501
[LightGBM] [Info] Start training from score 0.208501
[LightGBM] [Info] Numb

[I 2024-11-21 22:14:10,373] Trial 48 finished with value: 0.9513918670031722 and parameters: {'fs_method': 'pca', 'selector__n_components': 28, 'n_estimators': 131, 'learning_rate': 0.021394948684401213, 'num_leaves': 60, 'max_depth': 11, 'subsample': 0.9946776661680679}. Best is trial 22 with value: 0.9696054201558775.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001578 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 86
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 29
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001129 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 86
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 29
[LightGBM] [Info] [binary:Boos

[I 2024-11-21 22:14:15,114] Trial 49 finished with value: 0.9682788111198122 and parameters: {'fs_method': 'l1', 'selector__C': 0.8591690781638281, 'n_estimators': 143, 'learning_rate': 0.14193812084764795, 'num_leaves': 63, 'max_depth': 14, 'subsample': 0.8782956282076986}. Best is trial 22 with value: 0.9696054201558775.


Best trial:
Value: 0.9696054201558775
Params:
  fs_method: univariate
  selector__k: 30
  n_estimators: 193
  learning_rate: 0.09789602423785873
  num_leaves: 58
  max_depth: 8
  subsample: 0.8743542470902586


## XGB

In [5]:
best_trials['XGB'] = optimize_pipeline(X_train, y_train, 'XGB', selectors)

[I 2024-11-21 22:10:51,681] A new study created in memory with name: optimization_XGB
[I 2024-11-21 22:11:03,551] Trial 0 finished with value: 0.9575437119313378 and parameters: {'fs_method': 'l1', 'selector__C': 0.12067639885647719, 'learning_rate': 0.019343816041326695, 'loss': 'exponential', 'n_estimators': 396, 'max_depth': 5, 'subsample': 0.3417049121661013, 'criterion': 'friedman_mse'}. Best is trial 0 with value: 0.9575437119313378.
[I 2024-11-21 22:11:31,802] Trial 1 finished with value: 0.9576649935905406 and parameters: {'fs_method': 'univariate', 'selector__k': 15, 'learning_rate': 0.029135112273171934, 'loss': 'log_loss', 'n_estimators': 497, 'max_depth': 6, 'subsample': 0.7282581301497698, 'criterion': 'squared_error'}. Best is trial 1 with value: 0.9576649935905406.
[I 2024-11-21 22:11:40,292] Trial 2 finished with value: 0.9341452951368818 and parameters: {'fs_method': 'tree', 'selector__n_estimators': 52, 'learning_rate': 0.013752764983583488, 'loss': 'log_loss', 'n_est

Best trial:
Value: 0.9697260474176386
Params:
  fs_method: l1
  selector__C: 0.9914381669879291
  learning_rate: 0.08992474985284606
  loss: log_loss
  n_estimators: 202
  max_depth: 6
  subsample: 0.7216503855619084
  criterion: squared_error


## MLP

In [5]:
best_trials['MLP'] = optimize_pipeline(X_train, y_train, 'MLP', selectors)

[I 2024-11-24 15:17:13,616] A new study created in memory with name: optimization_MLP
[I 2024-11-24 15:17:38,785] Trial 0 finished with value: 0.9312490774813842 and parameters: {'fs_method': 'l1', 'selector__C': 0.10077469594973242, 'hidden_layer_sizes': '(100,)', 'activation': 'tanh', 'solver': 'sgd', 'alpha': 0.0045950602966433034}. Best is trial 0 with value: 0.9312490774813842.
[I 2024-11-24 15:18:11,453] Trial 1 finished with value: 0.9317323136366975 and parameters: {'fs_method': 'pca', 'selector__n_components': 16, 'hidden_layer_sizes': '(50,)', 'activation': 'logistic', 'solver': 'adam', 'alpha': 0.0015234905768834524}. Best is trial 1 with value: 0.9317323136366975.
STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
  self.n_iter_ = _check_optimize_result("lbfgs", opt_res, self.max_iter)
STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase th

Best trial:
Value: 0.9667115292468393
Params:
  fs_method: pca
  selector__n_components: 28
  hidden_layer_sizes: (100, 50)
  activation: relu
  solver: adam
  alpha: 0.002934783816887241


## Best pipelines for individual models

In [5]:
import random
import optuna
from sklearn.discriminant_analysis import StandardScaler
from sklearn.model_selection import cross_val_score, StratifiedKFold
from sklearn.neural_network import MLPClassifier
from sklearn.pipeline import Pipeline
from sklearn.feature_selection import SelectFromModel, SelectKBest, mutual_info_classif
from sklearn.decomposition import PCA
from sklearn.ensemble import RandomForestClassifier, StackingClassifier
from sklearn.linear_model import LogisticRegression
from lightgbm import LGBMClassifier
from sklearn.ensemble import GradientBoostingClassifier, RandomForestClassifier, StackingClassifier, VotingClassifier
from sklearn.neighbors import KNeighborsClassifier
from sklearn.neural_network import MLPClassifier
from sklearn.svm import SVC
from sklearn.tree import DecisionTreeClassifier
from lvq_classifier import LVQ
from itertools import combinations

In [6]:
best_pipelines = {
    'KNN': Pipeline([
            ("selector", SelectFromModel(LogisticRegression(solver='liblinear', 
                                                            penalty='l1', 
                                                            C=0.335))),
            ("model", KNeighborsClassifier(n_neighbors=5,
                                           weights='distance',
                                           algorithm='auto',
                                           metric='manhattan'))
            ]),

    'LVQ': Pipeline([
            ("selector", PCA(n_components=25)),
            ("model", LVQ(n_codebooks=15,lrate=0.24,epochs=20))
            ]),

    'DTR': Pipeline([
            ("selector", SelectFromModel(RandomForestClassifier(n_estimators=112))),
            ("model", DecisionTreeClassifier(criterion='entropy',
                                             splitter='random',
                                             max_depth=11, 
                                             min_samples_split=4,
                                             min_samples_leaf=2,
                                             max_features='log2'))
            ]),

    'SVM': Pipeline([
            ("scaler", StandardScaler()),
            ("selector", SelectKBest(mutual_info_classif, k=24)),
            ("model", SVC(probability=True, 
                          max_iter=1000, 
                          C=1.562,
                          kernel='rbf',
                          gamma='scale'))
            ]),

    'RF': Pipeline([
            ("selector", SelectKBest(mutual_info_classif, k=30)),
            ("model", RandomForestClassifier(n_estimators=366,
                                             criterion='entropy',
                                             max_depth=20, 
                                             min_samples_split=5,
                                             min_samples_leaf=2, 
                                             max_features='sqrt'))
            ]),

    'XGB': Pipeline([
            ("selector", SelectFromModel(LogisticRegression(solver='liblinear', 
                                                            penalty='l1', 
                                                            C=0.99))),
            ("model", GradientBoostingClassifier(learning_rate=0.09,
                                                 loss='log_loss',
                                                 n_estimators=202,
                                                 max_depth=6, 
                                                 subsample=0.72, 
                                                 criterion='squared_error'))
            ]),

    'LGBM': Pipeline([
            ("selector", SelectKBest(mutual_info_classif, k=30)),
            ("model", LGBMClassifier(n_estimators=193,
                                     learning_rate=0.098,
                                     num_leaves=58,
                                     max_depth=8,
                                     subsample=0.87))
            ]),

    'MLP': Pipeline([
            ("scaler", StandardScaler()),
            ("selector", PCA(n_components=28) ),
            ("model", MLPClassifier(hidden_layer_sizes=(100,50),
                                    activation='relu',
                                    solver='adam',
                                    alpha=0.002935,
                                    max_iter=200))
            ])
} 

## ANNs Ensemble

### Stacking

#### 2 ANNs

In [16]:
n_members = 2

ann_models = [best_pipelines['MLP'] for _ in range(n_members)]

estimators = [(f'ann_{i+1}', model) for i, model in enumerate(ann_models)]

# Create a stacking ensemble with ANN models
ann_stack_2 = StackingClassifier(
    estimators=estimators,
    final_estimator=LogisticRegression()
)

In [17]:
cv = StratifiedKFold(n_splits=5, shuffle=True, random_state=42)
scores = cross_val_score(ann_stack_2, X_train, y_train, cv=cv, scoring='accuracy')

In [18]:
scores

array([0.96624473, 0.96139928, 0.96200241, 0.973462  , 0.9668275 ])

In [30]:
print(f'Mean accuracy: {round(scores.mean() * 100, 2)}% ± {round(scores.std() * 100, 2)}')

Mean accuracy: 96.6% ± 0.43


#### 3 ANNs

In [19]:
n_members = 3

ann_models = [best_pipelines['MLP'] for _ in range(n_members)]

estimators = [(f'ann_{i+1}', model) for i, model in enumerate(ann_models)]

# Create a stacking ensemble with ANN models
ann_stack_3 = StackingClassifier(
    estimators=estimators,
    final_estimator=LogisticRegression()
)

cv = StratifiedKFold(n_splits=5, shuffle=True, random_state=42)
scores = cross_val_score(ann_stack_3, X_train, y_train, cv=cv, scoring='accuracy')



In [20]:
scores

array([0.95840868, 0.96200241, 0.96139928, 0.97044632, 0.96622437])

In [None]:
print(f'Mean accuracy: {round(scores.mean() * 100, 2)}% ± {round(scores.std() * 100, 2)}')

Mean accuracy: 96.37% ± 0.42


### Voting

#### 2 ANNs

In [31]:
n_members = 2

ann_models = [best_pipelines['MLP'] for _ in range(n_members)]

estimators = [(f'ann_{i+1}', model) for i, model in enumerate(ann_models)]

# Create a stacking ensemble with ANN models
ann_stack_2 = VotingClassifier(
    estimators=estimators,
    voting='soft'
)

cv = StratifiedKFold(n_splits=5, shuffle=True, random_state=42)
scores = cross_val_score(ann_stack_2, X_train, y_train, cv=cv, scoring='accuracy')

In [32]:
scores

array([0.96323086, 0.96139928, 0.96200241, 0.973462  , 0.96803378])

In [37]:
print(f'Mean accuracy: {round(scores.mean() * 100, 2)}% ± {round(scores.std() * 100, 2)}')

Mean accuracy: 96.56% ± 0.46


#### 3 ANNS

In [33]:
n_members = 3

ann_models = [best_pipelines['MLP'] for _ in range(n_members)]

estimators = [(f'ann_{i+1}', model) for i, model in enumerate(ann_models)]

# Create a stacking ensemble with ANN models
ann_stack_3 = VotingClassifier(
    estimators=estimators,
    voting='soft'
)

cv = StratifiedKFold(n_splits=5, shuffle=True, random_state=42)
scores = cross_val_score(ann_stack_3, X_train, y_train, cv=cv, scoring='accuracy')

In [34]:
scores

array([0.96323086, 0.95898673, 0.96260555, 0.97587455, 0.97104946])

In [35]:
print(f'Mean accuracy: {round(scores.mean() * 100, 2)}% ± {round(scores.std() * 100, 2)}')

Mean accuracy: 96.63% ± 0.62


#### 4 ANNs

In [38]:
n_members = 4

ann_models = [best_pipelines['MLP'] for _ in range(n_members)]

estimators = [(f'ann_{i+1}', model) for i, model in enumerate(ann_models)]

# Create a stacking ensemble with ANN models
ann_stack_3 = VotingClassifier(
    estimators=estimators,
    voting='soft'
)

cv = StratifiedKFold(n_splits=5, shuffle=True, random_state=42)
scores = cross_val_score(ann_stack_3, X_train, y_train, cv=cv, scoring='accuracy')

In [39]:
scores

array([0.96081977, 0.96139928, 0.96501809, 0.973462  , 0.97225573])

In [40]:
print(f'Mean accuracy: {round(scores.mean() * 100, 2)}% ± {round(scores.std() * 100, 2)}')

Mean accuracy: 96.66% ± 0.53


## Heterogeneous Voting Ensemble

In [None]:
pipelines_to_test = best_pipelines.copy()
models_to_delete = ['MLP','LVQ','DTR','SVM']
for model_name in models_to_delete:
    pipelines_to_test.pop(model_name)
print(pipelines_to_test.keys())

dict_keys(['KNN', 'RF', 'XGB', 'LGBM'])


In [None]:
model_names = list(pipelines_to_test.keys())

    # Generate all possible subsets of models
all_combinations = [
    list(combo) for r in range(2, 5)
    for combo in combinations(model_names, r)
]

all_combinations

[['KNN', 'RF'],
 ['KNN', 'XGB'],
 ['KNN', 'LGBM'],
 ['RF', 'XGB'],
 ['RF', 'LGBM'],
 ['XGB', 'LGBM'],
 ['KNN', 'RF', 'XGB'],
 ['KNN', 'RF', 'LGBM'],
 ['KNN', 'XGB', 'LGBM'],
 ['RF', 'XGB', 'LGBM'],
 ['KNN', 'RF', 'XGB', 'LGBM']]

In [None]:
import warnings

def optimize_voting_model(X, y, pipelines_to_test, n_trials=30, cv_folds=5, scoring='accuracy'):
    """
    Optimize a voting ensemble with 2 to 4 classifier pipelines.

    Parameters:
    - X (pd.DataFrame): Feature matrix.
    - y (pd.Series): Target vector.
    - pipelines_to_test (dict): dictionary with the model names as keys and the classifier pipelines as items.
    - n_trials (int): Number of optimization trials.
    - cv_folds (int): Number of cross-validation folds.
    - scoring (str): Scoring metric for cross-validation.

    Returns:
    - study.best_trial: The best trial from the optimization study.
    """
    warnings.filterwarnings('ignore')
    model_names = list(pipelines_to_test.keys())

    # Generate all possible subsets of models
    all_combinations = [
        list(combo) for r in range(2, 5)
        for combo in combinations(model_names, r)
    ]

    print(f'All these combinations will be tested: {all_combinations}')

    def objective(trial):
        # Select a combination of models
        selected_models = trial.suggest_categorical('model_combination', all_combinations)
        ensemble_type = trial.suggest_categorical('ensemble_type', ['voting','stack'])

        # Build the VotingClassifier with the selected models
        estimators = [
            (f'pipeline_{i+1}', best_pipelines[model])
            for i, model in enumerate(selected_models)
        ]

        if ensemble_type == 'voting':
            ensemble = VotingClassifier(estimators=estimators, voting='soft')
        else:
            ensemble = StackingClassifier(estimators=estimators,final_estimator=LogisticRegression())

        # Perform cross-validation
        cv = StratifiedKFold(n_splits=cv_folds, shuffle=True, random_state=42)
        scores = cross_val_score(ensemble, X, y, cv=cv, scoring=scoring, error_score='raise')
        return scores.mean()

    # Create and run the Optuna study
    study = optuna.create_study(study_name=f'optimization_voting_model', direction="maximize")
    study.optimize(objective, n_trials=n_trials)

    # Print the best trial
    print("Best trial:")
    print(f"Value: {study.best_trial.value}")
    print("Params:")
    for key, value in study.best_trial.params.items():
        print(f"  {key}: {value}")

    return study.best_trial

In [None]:
optimize_voting_model(X_train, y_train, pipelines_to_test, n_trials=50)

[I 2024-11-24 17:46:40,574] A new study created in memory with name: optimization_voting_model


All these combinations will be tested: [['KNN', 'RF'], ['KNN', 'XGB'], ['KNN', 'LGBM'], ['RF', 'XGB'], ['RF', 'LGBM'], ['XGB', 'LGBM'], ['KNN', 'RF', 'XGB'], ['KNN', 'RF', 'LGBM'], ['KNN', 'XGB', 'LGBM'], ['RF', 'XGB', 'LGBM'], ['KNN', 'RF', 'XGB', 'LGBM']]


  File "c:\Users\giull\AppData\Local\Programs\Python\Python312\Lib\site-packages\joblib\externals\loky\backend\context.py", line 227, in _count_physical_cores
    cpu_info = subprocess.run(
               ^^^^^^^^^^^^^^^
  File "c:\Users\giull\AppData\Local\Programs\Python\Python312\Lib\subprocess.py", line 548, in run
    with Popen(*popenargs, **kwargs) as process:
         ^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "c:\Users\giull\AppData\Local\Programs\Python\Python312\Lib\subprocess.py", line 1026, in __init__
    self._execute_child(args, executable, preexec_fn, close_fds,
  File "c:\Users\giull\AppData\Local\Programs\Python\Python312\Lib\subprocess.py", line 1538, in _execute_child
    hp, ht, pid, tid = _winapi.CreateProcess(executable, args,
                       ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000651 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 2928, number of negative: 2377
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000457 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 5305, number of used features: 30
[LightGBM] [Info] [binary:Boos

[I 2024-11-24 17:48:09,643] Trial 0 finished with value: 0.9677963747835945 and parameters: {'model_combination': ['KNN', 'RF', 'XGB', 'LGBM'], 'ensemble_type': 'stack'}. Best is trial 0 with value: 0.9677963747835945.
[I 2024-11-24 17:49:48,727] Trial 1 finished with value: 0.9690024292687254 and parameters: {'model_combination': ['KNN', 'RF', 'XGB'], 'ensemble_type': 'stack'}. Best is trial 1 with value: 0.9690024292687254.
[I 2024-11-24 17:50:03,485] Trial 2 finished with value: 0.968881874717791 and parameters: {'model_combination': ['RF', 'XGB'], 'ensemble_type': 'voting'}. Best is trial 1 with value: 0.9690024292687254.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000635 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000638 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 30
[LightGBM] [Info] [binary:Boos

[I 2024-11-24 17:50:17,633] Trial 3 finished with value: 0.9704496655665519 and parameters: {'model_combination': ['KNN', 'XGB', 'LGBM'], 'ensemble_type': 'voting'}. Best is trial 3 with value: 0.9704496655665519.
[I 2024-11-24 17:51:35,395] Trial 4 finished with value: 0.9683995110924002 and parameters: {'model_combination': ['RF', 'XGB'], 'ensemble_type': 'stack'}. Best is trial 3 with value: 0.9704496655665519.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000675 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000558 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 30
[LightGBM] [Info] [binary:Boos

[I 2024-11-24 17:51:55,869] Trial 5 finished with value: 0.9700882927570564 and parameters: {'model_combination': ['RF', 'XGB', 'LGBM'], 'ensemble_type': 'voting'}. Best is trial 3 with value: 0.9704496655665519.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000658 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000741 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 30
[LightGBM] [Info] [binary:Boos

[I 2024-11-24 17:52:18,072] Trial 6 finished with value: 0.9688817292961375 and parameters: {'model_combination': ['KNN', 'RF', 'XGB', 'LGBM'], 'ensemble_type': 'voting'}. Best is trial 3 with value: 0.9704496655665519.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000678 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000593 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 30
[LightGBM] [Info] [binary:Boos

[I 2024-11-24 17:52:25,002] Trial 7 finished with value: 0.9688815111636568 and parameters: {'model_combination': ['KNN', 'LGBM'], 'ensemble_type': 'voting'}. Best is trial 3 with value: 0.9704496655665519.
[I 2024-11-24 17:53:09,596] Trial 8 finished with value: 0.9673135021824155 and parameters: {'model_combination': ['KNN', 'RF'], 'ensemble_type': 'stack'}. Best is trial 3 with value: 0.9704496655665519.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000665 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000678 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 30
[LightGBM] [Info] [binary:Boos

[I 2024-11-24 17:53:22,726] Trial 9 finished with value: 0.9688820928502716 and parameters: {'model_combination': ['RF', 'LGBM'], 'ensemble_type': 'voting'}. Best is trial 3 with value: 0.9704496655665519.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000666 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000640 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 30
[LightGBM] [Info] [binary:Boos

[I 2024-11-24 17:53:37,024] Trial 10 finished with value: 0.9694847928941164 and parameters: {'model_combination': ['KNN', 'XGB', 'LGBM'], 'ensemble_type': 'voting'}. Best is trial 3 with value: 0.9704496655665519.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000645 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000577 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 30
[LightGBM] [Info] [binary:Boos

[I 2024-11-24 17:53:57,196] Trial 11 finished with value: 0.9694851564482507 and parameters: {'model_combination': ['RF', 'XGB', 'LGBM'], 'ensemble_type': 'voting'}. Best is trial 3 with value: 0.9704496655665519.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000658 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000525 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 30
[LightGBM] [Info] [binary:Boos

[I 2024-11-24 17:54:10,239] Trial 12 finished with value: 0.9700881473354027 and parameters: {'model_combination': ['XGB', 'LGBM'], 'ensemble_type': 'voting'}. Best is trial 3 with value: 0.9704496655665519.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000625 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000799 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 30
[LightGBM] [Info] [binary:Boos

[I 2024-11-24 17:54:31,859] Trial 13 finished with value: 0.9694852291590775 and parameters: {'model_combination': ['RF', 'XGB', 'LGBM'], 'ensemble_type': 'voting'}. Best is trial 3 with value: 0.9704496655665519.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000780 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000740 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 30
[LightGBM] [Info] [binary:Boos

[I 2024-11-24 17:54:46,579] Trial 14 finished with value: 0.9699671565195072 and parameters: {'model_combination': ['KNN', 'XGB', 'LGBM'], 'ensemble_type': 'voting'}. Best is trial 3 with value: 0.9704496655665519.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000748 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000578 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 30
[LightGBM] [Info] [binary:Boos

[I 2024-11-24 17:55:01,251] Trial 15 finished with value: 0.969846529257746 and parameters: {'model_combination': ['KNN', 'RF', 'LGBM'], 'ensemble_type': 'voting'}. Best is trial 3 with value: 0.9704496655665519.
[I 2024-11-24 17:55:10,239] Trial 16 finished with value: 0.969725829285158 and parameters: {'model_combination': ['KNN', 'XGB'], 'ensemble_type': 'voting'}. Best is trial 3 with value: 0.9704496655665519.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000696 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000595 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 30
[LightGBM] [Info] [binary:Boos

[I 2024-11-24 17:55:25,387] Trial 17 finished with value: 0.9694846474724625 and parameters: {'model_combination': ['KNN', 'XGB', 'LGBM'], 'ensemble_type': 'voting'}. Best is trial 3 with value: 0.9704496655665519.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000684 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 2928, number of negative: 2377
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000561 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 5305, number of used features: 30
[LightGBM] [Info] [binary:Boos

[I 2024-11-24 17:57:15,475] Trial 18 finished with value: 0.9686407656159226 and parameters: {'model_combination': ['RF', 'XGB', 'LGBM'], 'ensemble_type': 'stack'}. Best is trial 3 with value: 0.9704496655665519.
[I 2024-11-24 17:57:32,022] Trial 19 finished with value: 0.9700877837812684 and parameters: {'model_combination': ['KNN', 'RF', 'XGB'], 'ensemble_type': 'voting'}. Best is trial 3 with value: 0.9704496655665519.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000642 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000770 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 30
[LightGBM] [Info] [binary:Boos

[I 2024-11-24 17:57:46,536] Trial 20 finished with value: 0.9699671565195072 and parameters: {'model_combination': ['KNN', 'RF', 'LGBM'], 'ensemble_type': 'voting'}. Best is trial 3 with value: 0.9704496655665519.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000784 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000663 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 30
[LightGBM] [Info] [binary:Boos

[I 2024-11-24 17:57:59,476] Trial 21 finished with value: 0.9691231292413134 and parameters: {'model_combination': ['XGB', 'LGBM'], 'ensemble_type': 'voting'}. Best is trial 3 with value: 0.9704496655665519.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000724 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000748 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551937 -> initscore=0.208501
[LightGBM] [Inf

[I 2024-11-24 17:58:12,521] Trial 22 finished with value: 0.9696059291316654 and parameters: {'model_combination': ['XGB', 'LGBM'], 'ensemble_type': 'voting'}. Best is trial 3 with value: 0.9704496655665519.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000497 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000636 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 30
[LightGBM] [Info] [binary:Boos

[I 2024-11-24 17:58:25,337] Trial 23 finished with value: 0.9700882200462295 and parameters: {'model_combination': ['XGB', 'LGBM'], 'ensemble_type': 'voting'}. Best is trial 3 with value: 0.9704496655665519.
[I 2024-11-24 17:58:34,403] Trial 24 finished with value: 0.9697259019959847 and parameters: {'model_combination': ['KNN', 'XGB'], 'ensemble_type': 'voting'}. Best is trial 3 with value: 0.9704496655665519.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000658 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000799 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 30
[LightGBM] [Info] [binary:Boos

[I 2024-11-24 17:58:48,094] Trial 25 finished with value: 0.9690026474012059 and parameters: {'model_combination': ['RF', 'LGBM'], 'ensemble_type': 'voting'}. Best is trial 3 with value: 0.9704496655665519.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000736 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 2928, number of negative: 2377
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000560 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 5305, number of used features: 30
[LightGBM] [Info] [binary:Boos

[I 2024-11-24 17:59:25,520] Trial 26 finished with value: 0.9693643110540089 and parameters: {'model_combination': ['KNN', 'LGBM'], 'ensemble_type': 'stack'}. Best is trial 3 with value: 0.9704496655665519.
[I 2024-11-24 17:59:34,903] Trial 27 finished with value: 0.9655043113884787 and parameters: {'model_combination': ['KNN', 'RF'], 'ensemble_type': 'voting'}. Best is trial 3 with value: 0.9704496655665519.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000704 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000713 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 30
[LightGBM] [Info] [binary:Boos

[I 2024-11-24 17:59:49,345] Trial 28 finished with value: 0.9694846474724625 and parameters: {'model_combination': ['KNN', 'XGB', 'LGBM'], 'ensemble_type': 'voting'}. Best is trial 3 with value: 0.9704496655665519.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000664 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 2928, number of negative: 2377
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000510 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 5305, number of used features: 30
[LightGBM] [Info] [binary:Boos

[I 2024-11-24 18:02:40,752] Trial 29 finished with value: 0.9679170020453556 and parameters: {'model_combination': ['KNN', 'RF', 'XGB', 'LGBM'], 'ensemble_type': 'stack'}. Best is trial 3 with value: 0.9704496655665519.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000658 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000687 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 30
[LightGBM] [Info] [binary:Boos

[I 2024-11-24 18:03:02,856] Trial 30 finished with value: 0.969726338260946 and parameters: {'model_combination': ['RF', 'XGB', 'LGBM'], 'ensemble_type': 'voting'}. Best is trial 3 with value: 0.9704496655665519.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000661 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.005619 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 30
[LightGBM] [Info] [binary:Boos

[I 2024-11-24 18:03:35,350] Trial 31 finished with value: 0.9703294745697517 and parameters: {'model_combination': ['XGB', 'LGBM'], 'ensemble_type': 'voting'}. Best is trial 3 with value: 0.9704496655665519.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.002506 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002460 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551937 -> initscore=0.208501
[LightGBM] [Inf

[I 2024-11-24 18:03:58,667] Trial 32 finished with value: 0.970570801804101 and parameters: {'model_combination': ['XGB', 'LGBM'], 'ensemble_type': 'voting'}. Best is trial 32 with value: 0.970570801804101.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000622 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000559 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 30
[LightGBM] [Info] [binary:Boos

[I 2024-11-24 18:04:12,268] Trial 33 finished with value: 0.9698469655227072 and parameters: {'model_combination': ['XGB', 'LGBM'], 'ensemble_type': 'voting'}. Best is trial 32 with value: 0.970570801804101.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000663 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 2928, number of negative: 2377
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000671 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 5305, number of used features: 30
[LightGBM] [Info] [binary:Boos

[I 2024-11-24 18:05:52,457] Trial 34 finished with value: 0.9694850837374238 and parameters: {'model_combination': ['XGB', 'LGBM'], 'ensemble_type': 'stack'}. Best is trial 32 with value: 0.970570801804101.
[I 2024-11-24 18:06:12,483] Trial 35 finished with value: 0.9675551202600723 and parameters: {'model_combination': ['RF', 'XGB'], 'ensemble_type': 'voting'}. Best is trial 32 with value: 0.970570801804101.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000676 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000539 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 30
[LightGBM] [Info] [binary:Boos

[I 2024-11-24 18:06:28,538] Trial 36 finished with value: 0.969847038233534 and parameters: {'model_combination': ['XGB', 'LGBM'], 'ensemble_type': 'voting'}. Best is trial 32 with value: 0.970570801804101.
[I 2024-11-24 18:07:02,272] Trial 37 finished with value: 0.9704496655665519 and parameters: {'model_combination': ['KNN', 'RF', 'XGB'], 'ensemble_type': 'voting'}. Best is trial 32 with value: 0.970570801804101.
[I 2024-11-24 18:09:47,957] Trial 38 finished with value: 0.9681578203039166 and parameters: {'model_combination': ['KNN', 'RF', 'XGB'], 'ensemble_type': 'stack'}. Best is trial 32 with value: 0.970570801804101.
[I 2024-11-24 18:10:27,858] Trial 39 finished with value: 0.9706909200900741 and parameters: {'model_combination': ['KNN', 'RF', 'XGB'], 'ensemble_type': 'voting'}. Best is trial 39 with value: 0.9706909200900741.
[I 2024-11-24 18:11:48,526] Trial 40 finished with value: 0.969002138425418 and parameters: {'model_combination': ['KNN', 'RF', 'XGB'], 'ensemble_type': '

[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001070 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001315 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 30
[LightGBM] [Info] [binary:Boos

[I 2024-11-24 18:17:04,126] Trial 47 finished with value: 0.9708114746410084 and parameters: {'model_combination': ['KNN', 'XGB', 'LGBM'], 'ensemble_type': 'voting'}. Best is trial 43 with value: 0.971173356426292.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001406 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001071 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 30
[LightGBM] [Info] [binary:Boos

[I 2024-11-24 18:17:32,226] Trial 48 finished with value: 0.9688815111636568 and parameters: {'model_combination': ['KNN', 'LGBM'], 'ensemble_type': 'voting'}. Best is trial 43 with value: 0.971173356426292.


[LightGBM] [Info] Number of positive: 3660, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001442 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6632, number of used features: 30
[LightGBM] [Info] [binary:BoostFromScore]: pavg=0.551870 -> initscore=0.208228
[LightGBM] [Info] Start training from score 0.208228
[LightGBM] [Info] Number of positive: 3661, number of negative: 2972
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.001273 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 89
[LightGBM] [Info] Number of data points in the train set: 6633, number of used features: 30
[LightGBM] [Info] [binary:Boos

[I 2024-11-24 18:18:24,488] Trial 49 finished with value: 0.9699673019411609 and parameters: {'model_combination': ['KNN', 'RF', 'XGB', 'LGBM'], 'ensemble_type': 'voting'}. Best is trial 43 with value: 0.971173356426292.


Best trial:
Value: 0.971173356426292
Params:
  model_combination: ['KNN', 'RF', 'XGB']
  ensemble_type: voting


FrozenTrial(number=43, state=1, values=[0.971173356426292], datetime_start=datetime.datetime(2024, 11, 24, 18, 13, 50, 717205), datetime_complete=datetime.datetime(2024, 11, 24, 18, 14, 44, 350934), params={'model_combination': ['KNN', 'RF', 'XGB'], 'ensemble_type': 'voting'}, user_attrs={}, system_attrs={}, intermediate_values={}, distributions={'model_combination': CategoricalDistribution(choices=(['KNN', 'RF'], ['KNN', 'XGB'], ['KNN', 'LGBM'], ['RF', 'XGB'], ['RF', 'LGBM'], ['XGB', 'LGBM'], ['KNN', 'RF', 'XGB'], ['KNN', 'RF', 'LGBM'], ['KNN', 'XGB', 'LGBM'], ['RF', 'XGB', 'LGBM'], ['KNN', 'RF', 'XGB', 'LGBM'])), 'ensemble_type': CategoricalDistribution(choices=('voting', 'stack'))}, trial_id=43, value=None)