In [1]:
import numpy as np
import polars as pl
import pandas as pd
from sklearn.base import clone
from copy import deepcopy
import optuna
from scipy.optimize import minimize
import os
import matplotlib.pyplot as plt
import seaborn as sns

import re
from colorama import Fore, Style
from sklearn.metrics import accuracy_score
from tqdm import tqdm
from IPython.display import clear_output
from concurrent.futures import ThreadPoolExecutor

import warnings
warnings.filterwarnings('ignore')
pd.options.display.max_columns = None

import lightgbm as lgb
from catboost import CatBoostRegressor, CatBoostClassifier
from xgboost import XGBRegressor
from sklearn.ensemble import VotingRegressor
from sklearn.model_selection import *
from sklearn.metrics import *

# Preparing the data



Because some standard machine learning models cannot natively handle time series data, we have to transform time series data into a vector by extracting summary statistic to simplifies data representation and less computational complexity

In [2]:
def process_file(filename, dirname):
    df = pd.read_parquet(os.path.join(dirname, filename, 'part-0.parquet')) 
    # Read all parquet files that ends with part-0.parquet in series-train.parquet directory
    df.drop('step', axis=1, inplace=True)
    return df.describe().values.reshape(-1), filename.split('=')[1]

def load_time_series(dirname) -> pd.DataFrame:
    ids = os.listdir(dirname)
    
    with ThreadPoolExecutor() as executor:
        results = list(tqdm(executor.map(lambda fname: process_file(fname, dirname), ids), total=len(ids)))
    # results is a tuple of statistic value with its id, like ([10.5, 20.3, 15.7], '001'),([12.1, 18.6, 14],'002')  
    stats, indexes = zip(*results)
    # now stats hold [10.5, 20.3, 15.7],... and indexes hold 001, 002,..
    df = pd.DataFrame(stats, columns=[f"Stat_{i}" for i in range(len(stats[0]))])
    df['id'] = indexes
    
    return df

train = pd.read_csv('/kaggle/input/child-mind-institute-problematic-internet-use/train.csv')
test = pd.read_csv('/kaggle/input/child-mind-institute-problematic-internet-use/test.csv')
sample = pd.read_csv('/kaggle/input/child-mind-institute-problematic-internet-use/sample_submission.csv')

train_ts = load_time_series("/kaggle/input/child-mind-institute-problematic-internet-use/series_train.parquet")
test_ts = load_time_series("/kaggle/input/child-mind-institute-problematic-internet-use/series_test.parquet")

100%|██████████| 996/996 [01:09<00:00, 14.34it/s]
100%|██████████| 2/2 [00:00<00:00, 12.53it/s]


In [3]:
time_series_cols = train_ts.columns.tolist()
time_series_cols.remove("id")

In [4]:
train = pd.merge(train, train_ts, how="left", on='id')
test = pd.merge(test, test_ts, how="left", on='id')
#We merge because train and train_ts, both of them have rows that correspond to a single child (with id)

In [5]:
# After merging we drop it cause we no longer need it
train = train.drop('id', axis=1)
test = test.drop('id', axis=1)

Dropping all the PCIAT-related columns because they are not in the test set

In [6]:
featuresCols = [
                'Basic_Demos-Enroll_Season', 'Basic_Demos-Age', 'Basic_Demos-Sex',
                'CGAS-Season', 'CGAS-CGAS_Score', 'Physical-Season', 'Physical-BMI',
                'Physical-Height', 'Physical-Weight', 'Physical-Waist_Circumference',
                'Physical-Diastolic_BP', 'Physical-HeartRate', 'Physical-Systolic_BP',
                'Fitness_Endurance-Season',
                'Fitness_Endurance-Max_Stage','Fitness_Endurance-Time_Mins', 'Fitness_Endurance-Time_Sec',
                'FGC-Season', 'FGC-FGC_CU', 'FGC-FGC_CU_Zone', 'FGC-FGC_GSND',
                'FGC-FGC_GSND_Zone', 'FGC-FGC_GSD', 'FGC-FGC_GSD_Zone', 'FGC-FGC_PU',
                'FGC-FGC_PU_Zone', 'FGC-FGC_SRL', 'FGC-FGC_SRL_Zone', 'FGC-FGC_SRR',
                'FGC-FGC_SRR_Zone', 'FGC-FGC_TL', 'FGC-FGC_TL_Zone', 'BIA-Season',
                'BIA-BIA_Activity_Level_num', 'BIA-BIA_BMC', 'BIA-BIA_BMI',
                'BIA-BIA_BMR', 'BIA-BIA_DEE', 'BIA-BIA_ECW', 'BIA-BIA_FFM',
                'BIA-BIA_FFMI', 'BIA-BIA_FMI', 'BIA-BIA_Fat', 'BIA-BIA_Frame_num',
                'BIA-BIA_ICW', 'BIA-BIA_LDM', 'BIA-BIA_LST', 'BIA-BIA_SMM',
                'BIA-BIA_TBW', 
                'PAQ_A-Season', 'PAQ_A-PAQ_A_Total', 
                'PAQ_C-Season',
                'PAQ_C-PAQ_C_Total', 'SDS-Season', 'SDS-SDS_Total_Raw',
                'SDS-SDS_Total_T', 'PreInt_EduHx-Season',
                'PreInt_EduHx-computerinternet_hoursday', 'sii']

In [7]:
featuresCols += time_series_cols

In [8]:
train = train[featuresCols]

# Handling missing values

We are dropping features that have more than 80% missing values

In [9]:
threshold = 0.8
target = train['sii']
train = train[[col for col in train.columns if col != 'sii']].dropna(axis=1, thresh=(1 - threshold) * len(train))
test = test[train.columns] 
train['sii'] = target

# Removing Outliers

Replacing outliers in CGAS-CGAS_Score with NaN value

In [10]:
train[train['CGAS-CGAS_Score'] > 100]

Unnamed: 0,Basic_Demos-Enroll_Season,Basic_Demos-Age,Basic_Demos-Sex,CGAS-Season,CGAS-CGAS_Score,Physical-Season,Physical-BMI,Physical-Height,Physical-Weight,Physical-Waist_Circumference,Physical-Diastolic_BP,Physical-HeartRate,Physical-Systolic_BP,Fitness_Endurance-Season,FGC-Season,FGC-FGC_CU,FGC-FGC_CU_Zone,FGC-FGC_GSND,FGC-FGC_GSND_Zone,FGC-FGC_GSD,FGC-FGC_GSD_Zone,FGC-FGC_PU,FGC-FGC_PU_Zone,FGC-FGC_SRL,FGC-FGC_SRL_Zone,FGC-FGC_SRR,FGC-FGC_SRR_Zone,FGC-FGC_TL,FGC-FGC_TL_Zone,BIA-Season,BIA-BIA_Activity_Level_num,BIA-BIA_BMC,BIA-BIA_BMI,BIA-BIA_BMR,BIA-BIA_DEE,BIA-BIA_ECW,BIA-BIA_FFM,BIA-BIA_FFMI,BIA-BIA_FMI,BIA-BIA_Fat,BIA-BIA_Frame_num,BIA-BIA_ICW,BIA-BIA_LDM,BIA-BIA_LST,BIA-BIA_SMM,BIA-BIA_TBW,PAQ_C-Season,PAQ_C-PAQ_C_Total,SDS-Season,SDS-SDS_Total_Raw,SDS-SDS_Total_T,PreInt_EduHx-Season,PreInt_EduHx-computerinternet_hoursday,Stat_0,Stat_1,Stat_2,Stat_3,Stat_4,Stat_5,Stat_6,Stat_7,Stat_8,Stat_9,Stat_10,Stat_11,Stat_12,Stat_13,Stat_14,Stat_15,Stat_16,Stat_17,Stat_18,Stat_19,Stat_20,Stat_21,Stat_22,Stat_23,Stat_24,Stat_25,Stat_26,Stat_27,Stat_28,Stat_29,Stat_30,Stat_31,Stat_32,Stat_33,Stat_34,Stat_35,Stat_36,Stat_37,Stat_38,Stat_39,Stat_40,Stat_41,Stat_42,Stat_43,Stat_44,Stat_45,Stat_46,Stat_47,Stat_48,Stat_49,Stat_50,Stat_51,Stat_52,Stat_53,Stat_54,Stat_55,Stat_56,Stat_57,Stat_58,Stat_59,Stat_60,Stat_61,Stat_62,Stat_63,Stat_64,Stat_65,Stat_66,Stat_67,Stat_68,Stat_69,Stat_70,Stat_71,Stat_72,Stat_73,Stat_74,Stat_75,Stat_76,Stat_77,Stat_78,Stat_79,Stat_80,Stat_81,Stat_82,Stat_83,Stat_84,Stat_85,Stat_86,Stat_87,Stat_88,Stat_89,Stat_90,Stat_91,Stat_92,Stat_93,Stat_94,Stat_95,sii
2065,Fall,11,1,Winter,999.0,Fall,,,,,,,,Fall,Fall,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,Fall,2.241,,,,Fall,3.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,


In [11]:
train.loc[train['CGAS-CGAS_Score'] == 999, 'CGAS-CGAS_Score'] = np.nan

Replacing zero stats in these physical features as NaN value

In [12]:
physical_cols = [
    'Physical-BMI', 'Physical-Height',
    'Physical-Weight', 'Physical-Waist_Circumference'
]
print((train[physical_cols] == 0).sum())

Physical-BMI                     7
Physical-Height                  0
Physical-Weight                 61
Physical-Waist_Circumference     0
dtype: int64


In [13]:
train[physical_cols] = train[physical_cols].replace(0, np.nan)
print((train[physical_cols] == 0).sum())

Physical-BMI                    0
Physical-Height                 0
Physical-Weight                 0
Physical-Waist_Circumference    0
dtype: int64


In [14]:
bp_cols = [
      'Physical-Diastolic_BP', 'Physical-Systolic_BP'
]
train[bp_cols] = train[bp_cols].replace(0, np.nan)
train.loc[train['Physical-Systolic_BP'] <= train['Physical-Diastolic_BP'], bp_cols] = np.nan

Replacing extreme outliers in BIA-related columns with NaN values.


In [15]:
bia_columns = [col for col in train.columns if 'BIA' in col]

cat_col = ['BIA-Season', 'BIA-BIA_Activity_Level_num', 'BIA-BIA_Frame_num']
bia_columns = [col for col in bia_columns if col not in cat_col]
bia_columns

exclude_rows = []  # To store all indices to exclude

for col in bia_columns:
    Q1 = train[col].quantile(0.001)  # Lower quantile
    Q3 = train[col].quantile(0.999)  # Upper quantile

    # Replace with nan 
    train.loc[train[col] > Q3, col] = np.nan  # Replace above Q3 with NaN
    train.loc[train[col] < Q1, col] = np.nan  # Replace below Q1 with NaN
train

Unnamed: 0,Basic_Demos-Enroll_Season,Basic_Demos-Age,Basic_Demos-Sex,CGAS-Season,CGAS-CGAS_Score,Physical-Season,Physical-BMI,Physical-Height,Physical-Weight,Physical-Waist_Circumference,Physical-Diastolic_BP,Physical-HeartRate,Physical-Systolic_BP,Fitness_Endurance-Season,FGC-Season,FGC-FGC_CU,FGC-FGC_CU_Zone,FGC-FGC_GSND,FGC-FGC_GSND_Zone,FGC-FGC_GSD,FGC-FGC_GSD_Zone,FGC-FGC_PU,FGC-FGC_PU_Zone,FGC-FGC_SRL,FGC-FGC_SRL_Zone,FGC-FGC_SRR,FGC-FGC_SRR_Zone,FGC-FGC_TL,FGC-FGC_TL_Zone,BIA-Season,BIA-BIA_Activity_Level_num,BIA-BIA_BMC,BIA-BIA_BMI,BIA-BIA_BMR,BIA-BIA_DEE,BIA-BIA_ECW,BIA-BIA_FFM,BIA-BIA_FFMI,BIA-BIA_FMI,BIA-BIA_Fat,BIA-BIA_Frame_num,BIA-BIA_ICW,BIA-BIA_LDM,BIA-BIA_LST,BIA-BIA_SMM,BIA-BIA_TBW,PAQ_C-Season,PAQ_C-PAQ_C_Total,SDS-Season,SDS-SDS_Total_Raw,SDS-SDS_Total_T,PreInt_EduHx-Season,PreInt_EduHx-computerinternet_hoursday,Stat_0,Stat_1,Stat_2,Stat_3,Stat_4,Stat_5,Stat_6,Stat_7,Stat_8,Stat_9,Stat_10,Stat_11,Stat_12,Stat_13,Stat_14,Stat_15,Stat_16,Stat_17,Stat_18,Stat_19,Stat_20,Stat_21,Stat_22,Stat_23,Stat_24,Stat_25,Stat_26,Stat_27,Stat_28,Stat_29,Stat_30,Stat_31,Stat_32,Stat_33,Stat_34,Stat_35,Stat_36,Stat_37,Stat_38,Stat_39,Stat_40,Stat_41,Stat_42,Stat_43,Stat_44,Stat_45,Stat_46,Stat_47,Stat_48,Stat_49,Stat_50,Stat_51,Stat_52,Stat_53,Stat_54,Stat_55,Stat_56,Stat_57,Stat_58,Stat_59,Stat_60,Stat_61,Stat_62,Stat_63,Stat_64,Stat_65,Stat_66,Stat_67,Stat_68,Stat_69,Stat_70,Stat_71,Stat_72,Stat_73,Stat_74,Stat_75,Stat_76,Stat_77,Stat_78,Stat_79,Stat_80,Stat_81,Stat_82,Stat_83,Stat_84,Stat_85,Stat_86,Stat_87,Stat_88,Stat_89,Stat_90,Stat_91,Stat_92,Stat_93,Stat_94,Stat_95,sii
0,Fall,5,0,Winter,51.0,Fall,16.877316,46.0,50.8,,,,,,Fall,0.0,0.0,,,,,0.0,0.0,7.0,0.0,6.0,0.0,6.0,1.0,Fall,2.0,2.66855,16.8792,932.498,1492.00,8.25598,41.5862,13.8177,3.06143,9.21377,1.0,24.4349,8.89536,38.9177,19.5413,32.6909,,,,,,Fall,3.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,2.0
1,Summer,9,0,,,Fall,14.035590,48.0,46.0,22.0,75.0,70.0,122.0,,Fall,3.0,0.0,,,,,5.0,0.0,11.0,1.0,11.0,1.0,3.0,0.0,Winter,2.0,2.57949,14.0371,936.656,1498.65,6.01993,42.0291,12.8254,1.21172,3.97085,1.0,21.0352,14.97400,39.4497,15.4107,27.0552,Fall,2.340,Fall,46.0,64.0,Summer,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0
2,Summer,10,1,Fall,71.0,Fall,16.648696,56.5,75.6,,65.0,94.0,117.0,Fall,Fall,20.0,1.0,10.2,1.0,14.7,2.0,7.0,1.0,10.0,1.0,10.0,1.0,5.0,0.0,,,,,,,,,,,,,,,,,,Summer,2.170,Fall,38.0,54.0,Summer,2.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0
3,Winter,9,0,Fall,71.0,Summer,18.292347,56.0,81.6,,60.0,97.0,117.0,Summer,Summer,18.0,1.0,,,,,5.0,0.0,7.0,0.0,7.0,0.0,7.0,1.0,Summer,3.0,3.84191,18.2943,1131.430,1923.44,15.59250,62.7757,14.0740,4.22033,18.82430,2.0,30.4041,16.77900,58.9338,26.4798,45.9966,Winter,2.451,Summer,31.0,45.0,Winter,0.0,43330.0,43330.0,43330.0,43330.0,43330.0,43330.0,43330.0,43330.0,43330.0,43330.0,43330.0,43330.0,-0.316384,0.016009,-0.167890,0.047388,-10.580416,0.000000,42.296310,4053.579102,5.046215e+13,4.470182,3.0,53.201683,0.453665,0.502702,0.585710,0.106351,42.947170,0.000000,208.168976,112.404045,1.942842e+13,1.931421,0.0,14.244914,-1.746094,-2.905339,-1.048372,0.0,-89.833092,0.0,0.0,3824.000000,5.500000e+10,1.0,3.0,41.0,-0.684180,-0.309863,-0.649974,0.006432,-41.541863,0.0,2.392969,4028.666748,3.689000e+13,3.0,3.0,42.0,-0.366849,0.024974,-0.245378,0.023637,-15.086617,0.0,6.926828,4070.0,5.347750e+13,5.0,3.0,50.0,-0.010677,0.400677,0.204727,0.041420,12.220764,0.0,15.000000,4147.0,6.640875e+13,6.0,3.0,53.0,1.507865,1.666354,1.546979,4.004276,89.751656,0.0,2633.250000,4188.5,8.611000e+13,7.0,3.0,85.0,1.0
4,Spring,18,1,Summer,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
3955,Fall,13,0,Spring,60.0,Fall,16.362460,59.5,82.4,,71.0,70.0,104.0,,Fall,16.0,0.0,18.0,1.0,19.9,2.0,10.0,1.0,8.0,1.0,9.0,1.0,12.0,1.0,Fall,3.0,4.52277,16.3642,1206.880,2051.70,19.46110,70.8117,14.0629,2.30138,11.58830,1.0,33.3709,17.97970,66.2889,29.7790,52.8320,Winter,3.260,Winter,35.0,50.0,Fall,1.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1.0
3956,Winter,10,0,,,Spring,18.764678,53.5,76.4,27.0,60.0,78.0,118.0,,Spring,0.0,0.0,,,,,4.0,0.0,0.0,0.0,0.0,0.0,12.0,1.0,Spring,,,,,,,,,,,,,,,,,Winter,2.340,,,,Winter,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
3957,Fall,11,0,Spring,68.0,Winter,21.441500,60.0,109.8,,79.0,99.0,116.0,,Winter,15.0,1.0,18.5,2.0,15.8,2.0,0.0,0.0,10.0,1.0,10.0,1.0,14.0,1.0,Winter,2.0,4.41305,21.4438,1253.740,2005.99,20.48250,75.8033,14.8043,6.63952,33.99670,2.0,33.9805,21.34030,71.3903,28.7792,54.4630,Winter,2.729,Winter,56.0,77.0,Fall,0.0,416275.0,416275.0,416275.0,416275.0,416275.0,416275.0,416275.0,416275.0,416275.0,416275.0,416275.0,416275.0,0.377523,-0.136917,-0.190545,0.028601,-12.374899,0.020323,22.480034,3844.479248,4.328291e+13,3.968833,1.0,60.263729,0.523033,0.422859,0.538802,0.072386,38.895920,0.139045,110.340538,167.268799,2.493436e+13,1.899374,0.0,6.960978,-1.852794,-0.992487,-1.006157,0.0,-89.627525,0.0,0.0,3098.166748,0.000000e+00,1.0,1.0,48.0,0.015931,-0.431110,-0.616714,0.000683,-39.189468,0.0,1.958715,3741.000000,2.168000e+13,2.0,1.0,54.0,0.538555,-0.153108,-0.277119,0.008805,-16.722418,0.0,5.282995,3812.0,4.336000e+13,4.0,1.0,60.0,0.813215,0.086647,0.148035,0.025942,8.457803,0.0,13.859835,3964.0,6.492500e+13,5.0,1.0,66.0,1.622884,2.286455,1.468296,3.078876,89.693832,1.0,2605.750000,4185.0,8.639500e+13,7.0,1.0,72.0,1.0
3958,Spring,13,0,Spring,70.0,Winter,12.235895,70.7,87.0,,59.0,61.0,113.0,,Spring,,,,,,,,,,,,,,,Summer,4.0,6.66168,12.2372,1414.340,2970.12,26.53230,92.9092,13.0684,-0.83117,-5.90917,2.0,41.3715,25.00540,86.2475,45.4340,67.9038,Spring,3.300,Spring,33.0,47.0,Spring,1.0,399000.0,399000.0,399000.0,399000.0,399000.0,399000.0,399000.0,399000.0,399000.0,399000.0,399000.0,399000.0,0.044563,0.080560,0.339411,0.017076,27.160025,0.592331,7.501198,3851.028809,4.321721e+13,3.824000,1.0,312.557983,0.321881,0.346819,0.807518,0.065688,67.432198,0.481510,14.348840,165.152405,2.489514e+13,1.999010,0.0,6.677634,-1.708816,-2.080256,-1.010877,0.0,-89.846863,0.0,0.0,3098.166748,0.000000e+00,1.0,1.0,301.0,-0.016745,-0.016340,-0.373187,0.000558,-22.638031,0.0,2.135821,3747.000000,2.168000e+13,2.0,1.0,307.0,0.028056,0.009200,0.855105,0.009563,57.570095,1.0,4.523121,3818.0,4.336500e+13,4.0,1.0,313.0,0.069484,0.076909,1.008843,0.014023,87.467171,1.0,7.471756,3970.0,6.471500e+13,6.0,1.0,318.0,1.755602,2.166893,1.467054,3.417329,89.931534,1.0,1186.599976,4189.0,8.639500e+13,7.0,1.0,324.0,0.0


In [16]:
def feature_transformation(data):
    return data


In [17]:
# train = train[featuresCols]
train = train.dropna(subset='sii')
train

Unnamed: 0,Basic_Demos-Enroll_Season,Basic_Demos-Age,Basic_Demos-Sex,CGAS-Season,CGAS-CGAS_Score,Physical-Season,Physical-BMI,Physical-Height,Physical-Weight,Physical-Waist_Circumference,Physical-Diastolic_BP,Physical-HeartRate,Physical-Systolic_BP,Fitness_Endurance-Season,FGC-Season,FGC-FGC_CU,FGC-FGC_CU_Zone,FGC-FGC_GSND,FGC-FGC_GSND_Zone,FGC-FGC_GSD,FGC-FGC_GSD_Zone,FGC-FGC_PU,FGC-FGC_PU_Zone,FGC-FGC_SRL,FGC-FGC_SRL_Zone,FGC-FGC_SRR,FGC-FGC_SRR_Zone,FGC-FGC_TL,FGC-FGC_TL_Zone,BIA-Season,BIA-BIA_Activity_Level_num,BIA-BIA_BMC,BIA-BIA_BMI,BIA-BIA_BMR,BIA-BIA_DEE,BIA-BIA_ECW,BIA-BIA_FFM,BIA-BIA_FFMI,BIA-BIA_FMI,BIA-BIA_Fat,BIA-BIA_Frame_num,BIA-BIA_ICW,BIA-BIA_LDM,BIA-BIA_LST,BIA-BIA_SMM,BIA-BIA_TBW,PAQ_C-Season,PAQ_C-PAQ_C_Total,SDS-Season,SDS-SDS_Total_Raw,SDS-SDS_Total_T,PreInt_EduHx-Season,PreInt_EduHx-computerinternet_hoursday,Stat_0,Stat_1,Stat_2,Stat_3,Stat_4,Stat_5,Stat_6,Stat_7,Stat_8,Stat_9,Stat_10,Stat_11,Stat_12,Stat_13,Stat_14,Stat_15,Stat_16,Stat_17,Stat_18,Stat_19,Stat_20,Stat_21,Stat_22,Stat_23,Stat_24,Stat_25,Stat_26,Stat_27,Stat_28,Stat_29,Stat_30,Stat_31,Stat_32,Stat_33,Stat_34,Stat_35,Stat_36,Stat_37,Stat_38,Stat_39,Stat_40,Stat_41,Stat_42,Stat_43,Stat_44,Stat_45,Stat_46,Stat_47,Stat_48,Stat_49,Stat_50,Stat_51,Stat_52,Stat_53,Stat_54,Stat_55,Stat_56,Stat_57,Stat_58,Stat_59,Stat_60,Stat_61,Stat_62,Stat_63,Stat_64,Stat_65,Stat_66,Stat_67,Stat_68,Stat_69,Stat_70,Stat_71,Stat_72,Stat_73,Stat_74,Stat_75,Stat_76,Stat_77,Stat_78,Stat_79,Stat_80,Stat_81,Stat_82,Stat_83,Stat_84,Stat_85,Stat_86,Stat_87,Stat_88,Stat_89,Stat_90,Stat_91,Stat_92,Stat_93,Stat_94,Stat_95,sii
0,Fall,5,0,Winter,51.0,Fall,16.877316,46.0,50.8,,,,,,Fall,0.0,0.0,,,,,0.0,0.0,7.0,0.0,6.0,0.0,6.0,1.0,Fall,2.0,2.66855,16.8792,932.498,1492.00,8.25598,41.5862,13.8177,3.061430,9.21377,1.0,24.4349,8.89536,38.9177,19.5413,32.6909,,,,,,Fall,3.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,2.0
1,Summer,9,0,,,Fall,14.035590,48.0,46.0,22.0,75.0,70.0,122.0,,Fall,3.0,0.0,,,,,5.0,0.0,11.0,1.0,11.0,1.0,3.0,0.0,Winter,2.0,2.57949,14.0371,936.656,1498.65,6.01993,42.0291,12.8254,1.211720,3.97085,1.0,21.0352,14.97400,39.4497,15.4107,27.0552,Fall,2.340,Fall,46.0,64.0,Summer,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0
2,Summer,10,1,Fall,71.0,Fall,16.648696,56.5,75.6,,65.0,94.0,117.0,Fall,Fall,20.0,1.0,10.2,1.0,14.7,2.0,7.0,1.0,10.0,1.0,10.0,1.0,5.0,0.0,,,,,,,,,,,,,,,,,,Summer,2.170,Fall,38.0,54.0,Summer,2.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0
3,Winter,9,0,Fall,71.0,Summer,18.292347,56.0,81.6,,60.0,97.0,117.0,Summer,Summer,18.0,1.0,,,,,5.0,0.0,7.0,0.0,7.0,0.0,7.0,1.0,Summer,3.0,3.84191,18.2943,1131.430,1923.44,15.59250,62.7757,14.0740,4.220330,18.82430,2.0,30.4041,16.77900,58.9338,26.4798,45.9966,Winter,2.451,Summer,31.0,45.0,Winter,0.0,43330.0,43330.0,43330.0,43330.0,43330.0,43330.0,43330.0,43330.0,43330.0,43330.0,43330.0,43330.0,-0.316384,0.016009,-0.167890,0.047388,-10.580416,0.000000,42.296310,4053.579102,5.046215e+13,4.470182,3.0,53.201683,0.453665,0.502702,0.585710,0.106351,42.947170,0.000000,208.168976,112.404045,1.942842e+13,1.931421,0.0,14.244914,-1.746094,-2.905339,-1.048372,0.0,-89.833092,0.0,0.0,3824.000000,5.500000e+10,1.0,3.0,41.0,-0.684180,-0.309863,-0.649974,0.006432,-41.541863,0.0,2.392969,4028.666748,3.689000e+13,3.0,3.0,42.0,-0.366849,0.024974,-0.245378,0.023637,-15.086617,0.0,6.926828,4070.0,5.347750e+13,5.0,3.0,50.0,-0.010677,0.400677,0.204727,0.041420,12.220764,0.0,15.000000,4147.000000,6.640875e+13,6.0,3.0,53.0,1.507865,1.666354,1.546979,4.004276,89.751656,0.0,2633.250000,4188.5,8.611000e+13,7.0,3.0,85.0,1.0
5,Spring,13,1,Winter,50.0,Summer,22.279952,59.5,112.2,,60.0,73.0,102.0,,Summer,12.0,0.0,16.5,2.0,17.9,2.0,6.0,0.0,10.0,1.0,11.0,1.0,8.0,0.0,Summer,2.0,4.33036,30.1865,1330.970,1996.45,30.21240,84.0285,16.6877,13.498800,67.97150,2.0,32.9141,20.90200,79.6982,35.3804,63.1265,Spring,4.110,Summer,40.0,56.0,Spring,0.0,396396.0,396396.0,396396.0,396396.0,396396.0,396396.0,396396.0,396396.0,396396.0,396396.0,396396.0,396396.0,-0.004272,0.016859,-0.631731,0.011926,-55.630768,0.655708,16.771982,3838.189453,4.321212e+13,3.909848,3.0,79.435593,0.351545,0.303812,0.623476,0.024331,50.303635,0.468723,95.327438,155.573868,2.497264e+13,1.946892,0.0,6.634319,-1.038711,-1.522690,-1.018787,0.0,-88.761833,0.0,0.0,3098.166748,0.000000e+00,1.0,3.0,68.0,-0.052803,-0.044517,-1.009344,0.008622,-88.386049,0.0,0.500000,3747.000000,2.154000e+13,2.0,3.0,74.0,-0.020622,-0.028179,-1.007728,0.009831,-86.119919,1.0,0.879005,3812.0,4.331000e+13,4.0,3.0,79.0,-0.019081,0.020307,-0.294459,0.010668,-17.483364,1.0,6.141348,3951.187561,6.485500e+13,6.0,3.0,85.0,1.034351,1.946303,1.146284,2.952888,89.476036,1.0,2597.800049,4175.0,8.639500e+13,7.0,3.0,91.0,1.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
3953,Fall,8,0,,,Fall,17.139810,52.5,67.2,25.0,60.0,65.0,112.0,,Fall,0.0,0.0,,,,,0.0,0.0,8.0,1.0,10.0,1.0,12.0,1.0,Fall,3.0,3.20303,17.1417,1035.270,1759.96,11.00630,52.5331,13.4004,3.741300,14.66690,1.0,25.7118,15.81500,49.3301,20.2645,36.7181,Fall,3.440,Fall,41.0,58.0,Fall,2.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0
3954,Summer,7,1,,,Summer,13.927006,48.5,46.6,23.0,65.0,75.0,105.0,,Summer,0.0,0.0,,,,,0.0,0.0,9.0,0.0,8.5,0.0,4.5,0.0,Fall,1.0,2.36680,13.6457,966.287,1256.17,9.98802,45.1853,13.2315,0.414263,1.41470,1.0,20.0572,15.14000,42.8185,18.0937,30.0453,,,Summer,48.0,67.0,Summer,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1.0
3955,Fall,13,0,Spring,60.0,Fall,16.362460,59.5,82.4,,71.0,70.0,104.0,,Fall,16.0,0.0,18.0,1.0,19.9,2.0,10.0,1.0,8.0,1.0,9.0,1.0,12.0,1.0,Fall,3.0,4.52277,16.3642,1206.880,2051.70,19.46110,70.8117,14.0629,2.301380,11.58830,1.0,33.3709,17.97970,66.2889,29.7790,52.8320,Winter,3.260,Winter,35.0,50.0,Fall,1.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1.0
3957,Fall,11,0,Spring,68.0,Winter,21.441500,60.0,109.8,,79.0,99.0,116.0,,Winter,15.0,1.0,18.5,2.0,15.8,2.0,0.0,0.0,10.0,1.0,10.0,1.0,14.0,1.0,Winter,2.0,4.41305,21.4438,1253.740,2005.99,20.48250,75.8033,14.8043,6.639520,33.99670,2.0,33.9805,21.34030,71.3903,28.7792,54.4630,Winter,2.729,Winter,56.0,77.0,Fall,0.0,416275.0,416275.0,416275.0,416275.0,416275.0,416275.0,416275.0,416275.0,416275.0,416275.0,416275.0,416275.0,0.377523,-0.136917,-0.190545,0.028601,-12.374899,0.020323,22.480034,3844.479248,4.328291e+13,3.968833,1.0,60.263729,0.523033,0.422859,0.538802,0.072386,38.895920,0.139045,110.340538,167.268799,2.493436e+13,1.899374,0.0,6.960978,-1.852794,-0.992487,-1.006157,0.0,-89.627525,0.0,0.0,3098.166748,0.000000e+00,1.0,1.0,48.0,0.015931,-0.431110,-0.616714,0.000683,-39.189468,0.0,1.958715,3741.000000,2.168000e+13,2.0,1.0,54.0,0.538555,-0.153108,-0.277119,0.008805,-16.722418,0.0,5.282995,3812.0,4.336000e+13,4.0,1.0,60.0,0.813215,0.086647,0.148035,0.025942,8.457803,0.0,13.859835,3964.000000,6.492500e+13,5.0,1.0,66.0,1.622884,2.286455,1.468296,3.078876,89.693832,1.0,2605.750000,4185.0,8.639500e+13,7.0,1.0,72.0,1.0


In [18]:
cat_c = ['Basic_Demos-Enroll_Season', 'CGAS-Season', 'Physical-Season', 'Fitness_Endurance-Season', 
          'FGC-Season', 'BIA-Season', 
         'PAQ_A-Season', 
         'PAQ_C-Season', 'SDS-Season', 'PreInt_EduHx-Season']
final_cat_columns = [col for col in cat_c if col in train.columns]

def update(df):
    for c in final_cat_columns: 
        df[c] = df[c].fillna('Missing')
        df[c] = df[c].astype('category')
    return df

train = update(train)
test = update(test)


In [19]:
def create_mapping(column, dataset):
    unique_values = dataset[column].unique()
# enumerate adds index to an iterable. unique_values = ['A','B','C'] => enumerate returns [(0, 'A'), (1, 'B'), (2, 'C')]
    return {value: idx for idx, value in enumerate(unique_values)}

# Similar to Label Encoder
for col in final_cat_columns:
    all_values = pd.concat([train[col], test[col]]).unique()
    mapping = {value: idx for idx, value in enumerate(all_values)}

    train[col] = train[col].replace(mapping).astype(int)
    test[col] = test[col].replace(mapping).astype(int)

In [20]:
# Dropping features have importance = 0 when training Light model based on different seeds

columns_drop = ['Stat_39', 'Stat_45', 'Stat_41', 'Stat_89', 'Stat_6', 'Stat_42', 
                 'Stat_7', 'Stat_10', 'Stat_9', 'Stat_11'
                , 'Stat_93', 'Stat_8'
               ]
train = train.drop(columns = columns_drop)
test = test.drop(columns = columns_drop)


In [21]:
SEED = 42
n_splits = 5

In [22]:
# Low importance features across different seeds
low_imp_features = []

In [23]:
# High importance features across different seeds
high_imp_features = []

In [24]:
%%time


#We need Confusion matrix, weight matrix and expected matrix
def quadratic_weighted_kappa(y_true, y_pred):
    return cohen_kappa_score(y_true, y_pred, weights='quadratic')


def threshold_Rounder(oof_non_rounded, thresholds):
    return np.where(oof_non_rounded < thresholds[0], 0,
                    np.where(oof_non_rounded < thresholds[1], 1,
                             np.where(oof_non_rounded < thresholds[2], 2, 3)))


# Optimization libraries like scipy.optimize.minimize work by minimizing a function. 
# Since QWK is a metric where higher is better, we negate it to allow the optimizer to "maximize" QWK indirectly.
def evaluate_predictions(thresholds, y_true, oof_non_rounded):
    rounded_p = threshold_Rounder(oof_non_rounded, thresholds)
    return -quadratic_weighted_kappa(y_true, rounded_p)

# TrainML, is a machine learning pipeline that performs model training, cross-validation, evaluation, 
# and test set prediction for a classification or regression task. 

def TrainML(model_class, test_data
            # , k_values=[5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15]
           ):
    
    X = train.drop(['sii'], axis=1)
    y = train['sii']

    # best_kappa = -np.inf
    # best_k = None
    # best_model = None
    # best_submission = None

    # for n_splits in k_values:
    #     print(f"\nEvaluating for k = {n_splits} folds...")

    # Cross-validation, ensuring that the folds have the same distribution of target classes. 
    SKF = StratifiedKFold(n_splits=n_splits, shuffle=True, random_state=SEED)
    
    # Store QWK scores for training and validation sets.
    train_S = []
    test_S = []

    # predictions made by the model for the validation set during each fold of cross-validation.
    oof_non_rounded = np.zeros(len(y), dtype=float) 
    # discrete predictions derived from oof_non_rounded using rounding logic
    oof_rounded = np.zeros(len(y), dtype=int) 
    # Stores the model's predictions for the test dataset during each fold of cross-validation
    test_preds = np.zeros((len(test_data), n_splits))

    for fold, (train_idx, test_idx) in enumerate(tqdm(SKF.split(X, y), desc="Training Folds", total=n_splits)):
        # train and test index are the index of this fold in the original training set
        # Data used for training in this fold
        X_train, X_val = X.iloc[train_idx], X.iloc[test_idx]
        # Data used for validation in this fold
        y_train, y_val = y.iloc[train_idx], y.iloc[test_idx]
        
        
        # Creates a new instance of an estimator with the same parameters as the original one 
        # but without any of the fitted data or state. Ensures each fold starts with a clean estimator.
        model = clone(model_class)
        model.fit(X_train, y_train)

        
        # Predict after fit to ensure model is trained correctly
        y_train_pred = model.predict(X_train)

        y_train_pred_rounded = y_train_pred.round(0).astype(int)
        
        y_val_pred = model.predict(X_val)

        # stores continuous data
        oof_non_rounded[test_idx] = y_val_pred
        # round the predicted value
        y_val_pred_rounded = y_val_pred.round(0).astype(int)
        oof_rounded[test_idx] = y_val_pred_rounded

        # Calcute QWK for train and validation set
        train_kappa = quadratic_weighted_kappa(y_train, y_train_pred_rounded)
        val_kappa = quadratic_weighted_kappa(y_val, y_val_pred_rounded)

        # Stores QWK score each fold
        train_S.append(train_kappa)
        test_S.append(val_kappa)

        
        test_preds[:, fold] = model.predict(test_data)
        print(test_preds[:, fold])
        
        print(f"Fold {fold+1} - Train QWK: {train_kappa:.4f}, Validation QWK: {val_kappa:.4f}")
        clear_output(wait=True)


    print(f"Mean Train QWK --> {np.mean(train_S):.4f}")
    print(f"Mean Validation QWK ---> {np.mean(test_S):.4f}")

    #Minimize the kappa score, which find the best Threshold Rounder  
    KappaOPtimizer = minimize(evaluate_predictions,
                              x0=[0.5, 1.5, 2.5], args=(y, oof_non_rounded), 
                              method='Nelder-Mead') # Nelder-Mead | # Powell

    # If not converge, raise error
    assert KappaOPtimizer.success, "Optimization did not converge."

# rounded the oof_non_rounded which has a bunch of predicted continuous variables for the validation set at each fold
    oof_tuned = threshold_Rounder(oof_non_rounded, KappaOPtimizer.x)
    tKappa = quadratic_weighted_kappa(y, oof_tuned)

    

    print(f"----> || Optimized QWK SCORE :: {Fore.CYAN}{Style.BRIGHT} {tKappa:.3f}{Style.RESET_ALL}")

# Rounded the test predict variables with optimized ThresHold_Rounder
    tpm = test_preds.mean(axis=1)
    tpTuned = threshold_Rounder(tpm, KappaOPtimizer.x)
    
    submission = pd.DataFrame({
        'id': sample['id'],
        'sii': tpTuned
    })

        # if tKappa > best_kappa:
        #     best_kappa = tKappa
        #     best_k = n_splits
        #     best_model = model
        #     best_submission = submission

    # print(f"Best k value: {best_k} with QWK Score: {best_kappa:.4f}")

    return submission,model

CPU times: user 5 µs, sys: 0 ns, total: 5 µs
Wall time: 9.06 µs


# Hyperparameter Optimization using Optuna  

## Purpose of Hyperparameter Tuning  
To improve model performance, we used **Optuna** to optimize key hyperparameters for our model.  
The primary goal was to maximize the **QWK (Quadratic Weighted Kappa)** score while ensuring the model generalizes well without overfitting.

---

## Optuna Hyperparameter Tuning Process  

1. **Search Parameters**:  
   Optuna was configured to suggest optimal values for the following hyperparameters:  
   - **num_leaves**  
   - **max_depth**  
   - **learning_rate**  
   - **feature_fraction**  
   - **bagging_fraction**  
   - **bagging_freq**  
   - **lambda_l1** (L1 regularization)  
   - **lambda_l2** (L2 regularization)  
   - **min_data_in_leaf**  

2. **Cross-Validation Strategy**:  
   - **K-Fold Cross-Validation** was applied to split the data into multiple training and testing sets.  
   - The **average QWK score** across the folds was used to evaluate model performance.  

3. **Search Space Limitation**:  
   - Based on references from **Kaggle competitions** and iterative experiments, we adopted a **narrowed search space**.  
   - This ensures efficient exploration while focusing on high-performing parameter ranges.  
## Reason for Trials  
We limited the **number of trials to 50** for the following reasons:  
- **Efficient runtime**: Prevent excessively long computation times.  
- **Stable performance**: 50 trials provided consistent and optimal results without diminishing returns.  

---

## Result  
- With the optimized hyperparameters, the model achieved its **best QWK score**.  
- The **training score** was also reduced, minimizing overfitting and ensuring **better generalization** on unseen data.

### Optimal Hyperparameters  
After 50 trials (sufficient to balance time and performance), the following hyperparameters were identified as optimal:  

{
    'num_leaves': 484, 
    'max_depth': 11, 
    'learning_rate': 0.04533585929025977, 
    'feature_fraction': 0.8110477902071817, 
    'bagging_fraction': 0.7265461551046623, 
    'bagging_freq': 2, 
    'lambda_l1': 5.338437863405547, 
    'lambda_l2': 4.499492326361118e-06, 
    'min_data_in_leaf': 13
} data.  
2326361118e-06, 
    'min_data_in_leaf': 13
}


In [25]:
import optuna
import lightgbm as lgb
from sklearn.metrics import cohen_kappa_score
from sklearn.model_selection import StratifiedKFold
import numpy as np

def quadratic_weighted_kappa(y_true, y_pred):
    return cohen_kappa_score(y_true, y_pred, weights='quadratic')


def objective(trial):
    params = {
        'objective': 'regression',
        'metric': 'mae',  
        'boosting_type': 'gbdt',
        'num_leaves': trial.suggest_int('num_leaves', 400, 500), 
        'max_depth': trial.suggest_int('max_depth', 10, 15),
        'learning_rate': trial.suggest_uniform('learning_rate', 0.03, 0.05), 
        'feature_fraction': trial.suggest_uniform('feature_fraction', 0.7, 0.9),  
        'bagging_fraction': trial.suggest_uniform('bagging_fraction', 0.7, 0.9),  
        'bagging_freq': trial.suggest_int('bagging_freq', 2, 3),  
        'lambda_l1': trial.suggest_uniform('lambda_l1', 4, 6), 
        'lambda_l2': trial.suggest_loguniform('lambda_l2', 1e-6, 1e-4),  
        'min_data_in_leaf': trial.suggest_int('min_data_in_leaf', 10, 15), 
    }

    X = train.drop(['sii'], axis=1)
    y = train['sii']

    n_splits = 5
    SKF = StratifiedKFold(n_splits=n_splits, shuffle=True, random_state=42)
    
    kappa_scores = []
    
    for train_idx, val_idx in SKF.split(X, y):
        X_train, X_val = X.iloc[train_idx], X.iloc[val_idx]
        y_train, y_val = y.iloc[train_idx], y.iloc[val_idx]
        
        model = lgb.LGBMRegressor(**params, random_state=42)
        model.fit(X_train, y_train)
        
        y_pred = model.predict(X_val)
        y_pred_rounded = np.round(y_pred).astype(int)  # Làm tròn dự đoán cho QWK
        kappa = quadratic_weighted_kappa(y_val, y_pred_rounded)
        
        kappa_scores.append(kappa)
    
    # Trả về điểm số trung bình của QWK trên các fold
    return np.mean(kappa_scores)

In [26]:
study = optuna.create_study(direction='maximize')  
study.optimize(objective, n_trials=50)  

print("Best parameters:", study.best_params)
print("Best QWK score:", study.best_value)

[I 2024-12-18 14:32:00,875] A new study created in memory with name: no-name-844849d8-b232-4cbd-823e-35801470c26d


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001870 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001994 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002021 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:32:03,956] Trial 0 finished with value: 0.37271249619244584 and parameters: {'num_leaves': 494, 'max_depth': 12, 'learning_rate': 0.03203993350910327, 'feature_fraction': 0.7227863256058192, 'bagging_fraction': 0.7769704370575458, 'bagging_freq': 3, 'lambda_l1': 4.996715291910336, 'lambda_l2': 2.870870283961034e-06, 'min_data_in_leaf': 13}. Best is trial 0 with value: 0.37271249619244584.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002004 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001996 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002736 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:32:07,988] Trial 1 finished with value: 0.3845275852077261 and parameters: {'num_leaves': 443, 'max_depth': 12, 'learning_rate': 0.04723993930644106, 'feature_fraction': 0.7284449408321994, 'bagging_fraction': 0.7658810922914697, 'bagging_freq': 3, 'lambda_l1': 4.1467269905334145, 'lambda_l2': 1.1306392744418763e-06, 'min_data_in_leaf': 13}. Best is trial 1 with value: 0.3845275852077261.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001979 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002031 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002049 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:32:11,925] Trial 2 finished with value: 0.3787766370200577 and parameters: {'num_leaves': 405, 'max_depth': 11, 'learning_rate': 0.032366883271355326, 'feature_fraction': 0.8375824729001298, 'bagging_fraction': 0.7590095334185382, 'bagging_freq': 3, 'lambda_l1': 4.257094380015129, 'lambda_l2': 1.4176490823385383e-05, 'min_data_in_leaf': 10}. Best is trial 1 with value: 0.3845275852077261.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001929 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002165 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002240 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:32:14,666] Trial 3 finished with value: 0.37245927535742107 and parameters: {'num_leaves': 471, 'max_depth': 14, 'learning_rate': 0.0300915206560529, 'feature_fraction': 0.7270870722559943, 'bagging_fraction': 0.75696912747646, 'bagging_freq': 2, 'lambda_l1': 5.129594442937534, 'lambda_l2': 2.2471226031760927e-05, 'min_data_in_leaf': 15}. Best is trial 1 with value: 0.3845275852077261.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002099 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002037 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001976 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:32:17,538] Trial 4 finished with value: 0.37478801529803896 and parameters: {'num_leaves': 454, 'max_depth': 14, 'learning_rate': 0.039461255648342596, 'feature_fraction': 0.736720203400067, 'bagging_fraction': 0.7403281669718513, 'bagging_freq': 2, 'lambda_l1': 4.728815783892609, 'lambda_l2': 6.3559670592671125e-06, 'min_data_in_leaf': 15}. Best is trial 1 with value: 0.3845275852077261.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001932 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002131 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002013 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:32:20,231] Trial 5 finished with value: 0.3944730914408609 and parameters: {'num_leaves': 479, 'max_depth': 15, 'learning_rate': 0.045710517953144875, 'feature_fraction': 0.7016855098713247, 'bagging_fraction': 0.7281910550496355, 'bagging_freq': 2, 'lambda_l1': 5.041656824397862, 'lambda_l2': 2.115778729719539e-06, 'min_data_in_leaf': 14}. Best is trial 5 with value: 0.3944730914408609.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001981 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002050 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002251 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:32:23,808] Trial 6 finished with value: 0.387457299000532 and parameters: {'num_leaves': 446, 'max_depth': 11, 'learning_rate': 0.0366495117399283, 'feature_fraction': 0.7679881240534797, 'bagging_fraction': 0.8562081418274192, 'bagging_freq': 3, 'lambda_l1': 4.464689604428841, 'lambda_l2': 5.2404346348138065e-05, 'min_data_in_leaf': 12}. Best is trial 5 with value: 0.3944730914408609.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002319 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002004 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002151 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:32:26,914] Trial 7 finished with value: 0.3874309564959549 and parameters: {'num_leaves': 490, 'max_depth': 15, 'learning_rate': 0.042764444059428544, 'feature_fraction': 0.7558487977350188, 'bagging_fraction': 0.7648753988900922, 'bagging_freq': 2, 'lambda_l1': 4.394148205354118, 'lambda_l2': 2.9111579324390027e-05, 'min_data_in_leaf': 14}. Best is trial 5 with value: 0.3944730914408609.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001995 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002084 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002046 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:32:30,834] Trial 8 finished with value: 0.3884622837110562 and parameters: {'num_leaves': 416, 'max_depth': 13, 'learning_rate': 0.04234090421341109, 'feature_fraction': 0.8301808244954427, 'bagging_fraction': 0.7857404687526378, 'bagging_freq': 3, 'lambda_l1': 4.095968487713227, 'lambda_l2': 3.294030438245316e-05, 'min_data_in_leaf': 11}. Best is trial 5 with value: 0.3944730914408609.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001962 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002003 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002104 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:32:34,823] Trial 9 finished with value: 0.3869006634955382 and parameters: {'num_leaves': 451, 'max_depth': 15, 'learning_rate': 0.03429361478974163, 'feature_fraction': 0.8549402236862549, 'bagging_fraction': 0.8308257915925854, 'bagging_freq': 3, 'lambda_l1': 4.0532768580180445, 'lambda_l2': 1.9652119625100106e-06, 'min_data_in_leaf': 12}. Best is trial 5 with value: 0.3944730914408609.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001947 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002293 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002223 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:32:38,247] Trial 10 finished with value: 0.3932927895349 and parameters: {'num_leaves': 479, 'max_depth': 10, 'learning_rate': 0.049408908991398104, 'feature_fraction': 0.8872797624939308, 'bagging_fraction': 0.7021450244137029, 'bagging_freq': 2, 'lambda_l1': 5.722044374361018, 'lambda_l2': 5.842481355266098e-06, 'min_data_in_leaf': 14}. Best is trial 5 with value: 0.3944730914408609.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.003514 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002093 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002063 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:32:41,281] Trial 11 finished with value: 0.3908272150111915 and parameters: {'num_leaves': 474, 'max_depth': 10, 'learning_rate': 0.04980302295203925, 'feature_fraction': 0.8942355076254693, 'bagging_fraction': 0.7034904543140595, 'bagging_freq': 2, 'lambda_l1': 5.85863805615595, 'lambda_l2': 5.502518052341985e-06, 'min_data_in_leaf': 14}. Best is trial 5 with value: 0.3944730914408609.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001899 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002025 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002007 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:32:44,021] Trial 12 finished with value: 0.3812046935417415 and parameters: {'num_leaves': 475, 'max_depth': 10, 'learning_rate': 0.04630939523955934, 'feature_fraction': 0.7997869665441356, 'bagging_fraction': 0.7012538326588661, 'bagging_freq': 2, 'lambda_l1': 5.8521457862914215, 'lambda_l2': 3.8445088466634135e-06, 'min_data_in_leaf': 14}. Best is trial 5 with value: 0.3944730914408609.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001987 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002115 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002053 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:32:47,165] Trial 13 finished with value: 0.39060457924597003 and parameters: {'num_leaves': 498, 'max_depth': 13, 'learning_rate': 0.048650864425662035, 'feature_fraction': 0.8864143454202299, 'bagging_fraction': 0.7261343922900009, 'bagging_freq': 2, 'lambda_l1': 5.4634408078348216, 'lambda_l2': 1.008722189757911e-06, 'min_data_in_leaf': 14}. Best is trial 5 with value: 0.3944730914408609.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.003760 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002036 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001994 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:32:50,446] Trial 14 finished with value: 0.3986849269684639 and parameters: {'num_leaves': 466, 'max_depth': 11, 'learning_rate': 0.044768339073847974, 'feature_fraction': 0.7859077064413899, 'bagging_fraction': 0.8985646295588963, 'bagging_freq': 2, 'lambda_l1': 5.489643152666449, 'lambda_l2': 8.456093687363228e-06, 'min_data_in_leaf': 15}. Best is trial 14 with value: 0.3986849269684639.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001928 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002004 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001975 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:32:53,503] Trial 15 finished with value: 0.39011809191004554 and parameters: {'num_leaves': 464, 'max_depth': 11, 'learning_rate': 0.044555814357998366, 'feature_fraction': 0.7020475999055407, 'bagging_fraction': 0.8962865522972089, 'bagging_freq': 2, 'lambda_l1': 5.200212118132602, 'lambda_l2': 9.435020255632075e-05, 'min_data_in_leaf': 15}. Best is trial 14 with value: 0.3986849269684639.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002019 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002212 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002017 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:32:56,670] Trial 16 finished with value: 0.3922967691718674 and parameters: {'num_leaves': 433, 'max_depth': 14, 'learning_rate': 0.04050338629279775, 'feature_fraction': 0.7900418120197549, 'bagging_fraction': 0.8155407538298, 'bagging_freq': 2, 'lambda_l1': 5.402306718335476, 'lambda_l2': 1.1033250825784206e-05, 'min_data_in_leaf': 15}. Best is trial 14 with value: 0.3986849269684639.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001972 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002057 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002070 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:33:00,387] Trial 17 finished with value: 0.398096730991863 and parameters: {'num_leaves': 486, 'max_depth': 12, 'learning_rate': 0.04493367378062049, 'feature_fraction': 0.77050126890997, 'bagging_fraction': 0.8994847499184835, 'bagging_freq': 2, 'lambda_l1': 4.819263320315036, 'lambda_l2': 1.9983947248851254e-06, 'min_data_in_leaf': 13}. Best is trial 14 with value: 0.3986849269684639.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002288 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000693 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002104 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train 

[I 2024-12-18 14:33:04,565] Trial 18 finished with value: 0.39286996586560674 and parameters: {'num_leaves': 463, 'max_depth': 12, 'learning_rate': 0.043451364714652, 'feature_fraction': 0.7765044148421871, 'bagging_fraction': 0.8970055190696132, 'bagging_freq': 2, 'lambda_l1': 4.774808215638422, 'lambda_l2': 1.605541075243152e-05, 'min_data_in_leaf': 11}. Best is trial 14 with value: 0.3986849269684639.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002423 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002311 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002041 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:33:08,158] Trial 19 finished with value: 0.3941401570303003 and parameters: {'num_leaves': 488, 'max_depth': 11, 'learning_rate': 0.03969921223508699, 'feature_fraction': 0.8211823940508359, 'bagging_fraction': 0.8654619259993155, 'bagging_freq': 2, 'lambda_l1': 5.421507317043827, 'lambda_l2': 6.8963730415350035e-06, 'min_data_in_leaf': 13}. Best is trial 14 with value: 0.3986849269684639.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001974 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.003301 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001999 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:33:12,664] Trial 20 finished with value: 0.38557023394261347 and parameters: {'num_leaves': 434, 'max_depth': 13, 'learning_rate': 0.04083326872892219, 'feature_fraction': 0.8117976010950954, 'bagging_fraction': 0.8732122408496821, 'bagging_freq': 2, 'lambda_l1': 4.740884702214372, 'lambda_l2': 1.5536655664003324e-06, 'min_data_in_leaf': 12}. Best is trial 14 with value: 0.3986849269684639.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002307 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002113 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002018 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:33:16,038] Trial 21 finished with value: 0.3895026593500839 and parameters: {'num_leaves': 483, 'max_depth': 12, 'learning_rate': 0.04582046307719741, 'feature_fraction': 0.7536046446923601, 'bagging_fraction': 0.8422500862310786, 'bagging_freq': 2, 'lambda_l1': 4.934468872727416, 'lambda_l2': 2.38639569731608e-06, 'min_data_in_leaf': 13}. Best is trial 14 with value: 0.3986849269684639.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002214 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002009 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002035 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:33:18,975] Trial 22 finished with value: 0.3826745815215638 and parameters: {'num_leaves': 464, 'max_depth': 11, 'learning_rate': 0.044705248566316955, 'feature_fraction': 0.7037587322679838, 'bagging_fraction': 0.8076618575824966, 'bagging_freq': 2, 'lambda_l1': 5.200431995048798, 'lambda_l2': 3.870494772251127e-06, 'min_data_in_leaf': 14}. Best is trial 14 with value: 0.3986849269684639.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002705 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002026 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002059 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:33:22,161] Trial 23 finished with value: 0.3931822807226852 and parameters: {'num_leaves': 500, 'max_depth': 13, 'learning_rate': 0.04698323172656714, 'feature_fraction': 0.7721157613203832, 'bagging_fraction': 0.8810448896603443, 'bagging_freq': 2, 'lambda_l1': 5.6268771563450315, 'lambda_l2': 1.5822128175048307e-06, 'min_data_in_leaf': 15}. Best is trial 14 with value: 0.3986849269684639.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002380 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002084 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002083 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:33:25,694] Trial 24 finished with value: 0.3777016820921069 and parameters: {'num_leaves': 483, 'max_depth': 12, 'learning_rate': 0.037429277376671524, 'feature_fraction': 0.7922041137685876, 'bagging_fraction': 0.8532405542257304, 'bagging_freq': 2, 'lambda_l1': 4.946777383808059, 'lambda_l2': 3.3993039551702475e-06, 'min_data_in_leaf': 13}. Best is trial 14 with value: 0.3986849269684639.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002055 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002005 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002109 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:33:29,184] Trial 25 finished with value: 0.3852772743816274 and parameters: {'num_leaves': 469, 'max_depth': 15, 'learning_rate': 0.047934781251010125, 'feature_fraction': 0.7540287539430328, 'bagging_fraction': 0.886177863335589, 'bagging_freq': 2, 'lambda_l1': 4.501345331981247, 'lambda_l2': 8.633953628109342e-06, 'min_data_in_leaf': 14}. Best is trial 14 with value: 0.3986849269684639.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002051 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002030 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002026 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:33:32,663] Trial 26 finished with value: 0.3888659623530102 and parameters: {'num_leaves': 457, 'max_depth': 14, 'learning_rate': 0.044487761988944795, 'feature_fraction': 0.8562418263866503, 'bagging_fraction': 0.8269822284535645, 'bagging_freq': 2, 'lambda_l1': 4.618613868816297, 'lambda_l2': 1.923914480483493e-06, 'min_data_in_leaf': 15}. Best is trial 14 with value: 0.3986849269684639.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002001 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002193 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002101 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:33:35,746] Trial 27 finished with value: 0.4031979760172506 and parameters: {'num_leaves': 484, 'max_depth': 11, 'learning_rate': 0.04533585929025977, 'feature_fraction': 0.8110477902071817, 'bagging_fraction': 0.7265461551046623, 'bagging_freq': 2, 'lambda_l1': 5.338437863405547, 'lambda_l2': 4.499492326361118e-06, 'min_data_in_leaf': 13}. Best is trial 27 with value: 0.4031979760172506.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001988 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002034 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002026 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:33:39,321] Trial 28 finished with value: 0.39233848575243885 and parameters: {'num_leaves': 488, 'max_depth': 11, 'learning_rate': 0.041774853141178, 'feature_fraction': 0.8083261363178115, 'bagging_fraction': 0.7932210565825445, 'bagging_freq': 2, 'lambda_l1': 5.298012726866787, 'lambda_l2': 4.32115948485392e-06, 'min_data_in_leaf': 11}. Best is trial 27 with value: 0.4031979760172506.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002037 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002040 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.003112 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:33:43,563] Trial 29 finished with value: 0.39033745040439594 and parameters: {'num_leaves': 494, 'max_depth': 10, 'learning_rate': 0.03827472356282211, 'feature_fraction': 0.7815078174506835, 'bagging_fraction': 0.8683289622057699, 'bagging_freq': 3, 'lambda_l1': 5.582643580784553, 'lambda_l2': 2.9612770073290177e-06, 'min_data_in_leaf': 12}. Best is trial 27 with value: 0.4031979760172506.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001979 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002032 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002227 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:33:47,567] Trial 30 finished with value: 0.3760643434436102 and parameters: {'num_leaves': 459, 'max_depth': 12, 'learning_rate': 0.04366710841852225, 'feature_fraction': 0.8435789894095016, 'bagging_fraction': 0.8897649057402397, 'bagging_freq': 2, 'lambda_l1': 5.952551830245417, 'lambda_l2': 8.464445385531675e-06, 'min_data_in_leaf': 10}. Best is trial 27 with value: 0.4031979760172506.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001935 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002046 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002036 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:33:50,638] Trial 31 finished with value: 0.3995332353478968 and parameters: {'num_leaves': 479, 'max_depth': 11, 'learning_rate': 0.045655878627798345, 'feature_fraction': 0.8094179182368659, 'bagging_fraction': 0.718519740019229, 'bagging_freq': 2, 'lambda_l1': 5.08346424405795, 'lambda_l2': 2.3556037459965286e-06, 'min_data_in_leaf': 13}. Best is trial 27 with value: 0.4031979760172506.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002090 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002157 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002664 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:33:53,670] Trial 32 finished with value: 0.38517287866703 and parameters: {'num_leaves': 483, 'max_depth': 11, 'learning_rate': 0.04540203067750981, 'feature_fraction': 0.8134027301144849, 'bagging_fraction': 0.7186422427085872, 'bagging_freq': 2, 'lambda_l1': 5.308269958070206, 'lambda_l2': 2.7108136971954177e-06, 'min_data_in_leaf': 13}. Best is trial 27 with value: 0.4031979760172506.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001970 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002542 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002399 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:33:56,912] Trial 33 finished with value: 0.38632071499420834 and parameters: {'num_leaves': 468, 'max_depth': 12, 'learning_rate': 0.04778643782609253, 'feature_fraction': 0.79737640948894, 'bagging_fraction': 0.7450208321891283, 'bagging_freq': 2, 'lambda_l1': 4.895236378666901, 'lambda_l2': 1.2466327652041125e-06, 'min_data_in_leaf': 13}. Best is trial 27 with value: 0.4031979760172506.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001990 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002118 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002059 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:34:00,302] Trial 34 finished with value: 0.3864683904344024 and parameters: {'num_leaves': 494, 'max_depth': 11, 'learning_rate': 0.046929960792109246, 'feature_fraction': 0.8279070839002899, 'bagging_fraction': 0.7766122472251971, 'bagging_freq': 2, 'lambda_l1': 5.063289101077154, 'lambda_l2': 4.9462662335996496e-06, 'min_data_in_leaf': 13}. Best is trial 27 with value: 0.4031979760172506.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002072 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002076 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002045 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:34:03,526] Trial 35 finished with value: 0.3848845097182493 and parameters: {'num_leaves': 477, 'max_depth': 12, 'learning_rate': 0.0435623158435117, 'feature_fraction': 0.783117286410837, 'bagging_fraction': 0.7461921113869853, 'bagging_freq': 3, 'lambda_l1': 4.8384322065762735, 'lambda_l2': 1.4854091334665919e-05, 'min_data_in_leaf': 12}. Best is trial 27 with value: 0.4031979760172506.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001974 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002048 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002064 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:34:06,454] Trial 36 finished with value: 0.3942147167930673 and parameters: {'num_leaves': 485, 'max_depth': 10, 'learning_rate': 0.0413720481314098, 'feature_fraction': 0.7666208465728545, 'bagging_fraction': 0.7292020536990009, 'bagging_freq': 2, 'lambda_l1': 5.264670236026727, 'lambda_l2': 1.410258336825843e-06, 'min_data_in_leaf': 13}. Best is trial 27 with value: 0.4031979760172506.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002533 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002015 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002103 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:34:09,528] Trial 37 finished with value: 0.39556516928888125 and parameters: {'num_leaves': 470, 'max_depth': 11, 'learning_rate': 0.04847595910072519, 'feature_fraction': 0.7391431025196583, 'bagging_fraction': 0.777541902829887, 'bagging_freq': 2, 'lambda_l1': 5.546540839153176, 'lambda_l2': 1.1029952116250476e-05, 'min_data_in_leaf': 12}. Best is trial 27 with value: 0.4031979760172506.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001990 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002124 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002706 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:34:12,554] Trial 38 finished with value: 0.39527720711885717 and parameters: {'num_leaves': 492, 'max_depth': 11, 'learning_rate': 0.046135077385433, 'feature_fraction': 0.8053143688336468, 'bagging_fraction': 0.7121548711644035, 'bagging_freq': 2, 'lambda_l1': 5.1190746543166155, 'lambda_l2': 3.053324750017268e-06, 'min_data_in_leaf': 13}. Best is trial 27 with value: 0.4031979760172506.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001959 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.003852 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002094 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:34:16,579] Trial 39 finished with value: 0.39785473483874834 and parameters: {'num_leaves': 444, 'max_depth': 12, 'learning_rate': 0.04269375597559851, 'feature_fraction': 0.7605902302240076, 'bagging_fraction': 0.7326397484119901, 'bagging_freq': 3, 'lambda_l1': 4.246889506919647, 'lambda_l2': 7.12185276104734e-06, 'min_data_in_leaf': 11}. Best is trial 27 with value: 0.4031979760172506.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001965 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002088 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002188 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:34:19,922] Trial 40 finished with value: 0.4007424802365029 and parameters: {'num_leaves': 479, 'max_depth': 10, 'learning_rate': 0.04527935563826528, 'feature_fraction': 0.7875888154728745, 'bagging_fraction': 0.7561672335367349, 'bagging_freq': 2, 'lambda_l1': 5.71197169639354, 'lambda_l2': 2.293146435964413e-06, 'min_data_in_leaf': 10}. Best is trial 27 with value: 0.4031979760172506.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002050 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002038 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002008 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:34:23,256] Trial 41 finished with value: 0.3900202003328235 and parameters: {'num_leaves': 477, 'max_depth': 10, 'learning_rate': 0.0454869331079458, 'feature_fraction': 0.7856617005502068, 'bagging_fraction': 0.7480975721283402, 'bagging_freq': 2, 'lambda_l1': 5.499080632012515, 'lambda_l2': 2.283256441655423e-06, 'min_data_in_leaf': 10}. Best is trial 27 with value: 0.4031979760172506.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001991 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002035 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002050 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:34:26,418] Trial 42 finished with value: 0.38933654427768133 and parameters: {'num_leaves': 481, 'max_depth': 10, 'learning_rate': 0.04435229901337465, 'feature_fraction': 0.8188972657084821, 'bagging_fraction': 0.7556680507492282, 'bagging_freq': 2, 'lambda_l1': 5.707037146390576, 'lambda_l2': 1.7782769419730777e-06, 'min_data_in_leaf': 12}. Best is trial 27 with value: 0.4031979760172506.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002123 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002085 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002061 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:34:29,536] Trial 43 finished with value: 0.38766076482981554 and parameters: {'num_leaves': 472, 'max_depth': 11, 'learning_rate': 0.04661727025033865, 'feature_fraction': 0.7469419234779885, 'bagging_fraction': 0.7155078332001987, 'bagging_freq': 2, 'lambda_l1': 5.691697090331867, 'lambda_l2': 4.7774960877402495e-06, 'min_data_in_leaf': 10}. Best is trial 27 with value: 0.4031979760172506.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002117 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002065 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002072 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:34:32,775] Trial 44 finished with value: 0.3758499439057674 and parameters: {'num_leaves': 405, 'max_depth': 10, 'learning_rate': 0.03440617159214165, 'feature_fraction': 0.8366870413327101, 'bagging_fraction': 0.7351033604603565, 'bagging_freq': 2, 'lambda_l1': 4.6347230586880235, 'lambda_l2': 2.4748042399602256e-06, 'min_data_in_leaf': 13}. Best is trial 27 with value: 0.4031979760172506.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002029 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001998 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002052 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:34:36,100] Trial 45 finished with value: 0.3944056700854176 and parameters: {'num_leaves': 486, 'max_depth': 11, 'learning_rate': 0.03020495921307897, 'feature_fraction': 0.7995358094468639, 'bagging_fraction': 0.7665806393231639, 'bagging_freq': 2, 'lambda_l1': 5.3834944004618634, 'lambda_l2': 3.6242853047505553e-06, 'min_data_in_leaf': 11}. Best is trial 27 with value: 0.4031979760172506.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.001973 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002099 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002051 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:34:38,981] Trial 46 finished with value: 0.3913527019719178 and parameters: {'num_leaves': 474, 'max_depth': 10, 'learning_rate': 0.04233014275963911, 'feature_fraction': 0.7665673246128879, 'bagging_fraction': 0.7178905633392377, 'bagging_freq': 2, 'lambda_l1': 4.993403716787289, 'lambda_l2': 1.2261494952383096e-06, 'min_data_in_leaf': 14}. Best is trial 27 with value: 0.4031979760172506.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002027 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002037 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002093 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:34:41,796] Trial 47 finished with value: 0.38881138992587594 and parameters: {'num_leaves': 480, 'max_depth': 11, 'learning_rate': 0.0489660988295018, 'feature_fraction': 0.7192693463906547, 'bagging_fraction': 0.7553907362739091, 'bagging_freq': 2, 'lambda_l1': 5.144844860210567, 'lambda_l2': 2.1855401903111696e-05, 'min_data_in_leaf': 14}. Best is trial 27 with value: 0.4031979760172506.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002009 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002097 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002027 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:34:45,601] Trial 48 finished with value: 0.3797849231693233 and parameters: {'num_leaves': 451, 'max_depth': 10, 'learning_rate': 0.04488435035551296, 'feature_fraction': 0.792660008062601, 'bagging_fraction': 0.877205618367105, 'bagging_freq': 2, 'lambda_l1': 5.824683468025137, 'lambda_l2': 1.9490586253288278e-06, 'min_data_in_leaf': 12}. Best is trial 27 with value: 0.4031979760172506.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.003242 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21896
[LightGBM] [Info] Number of data points in the train set: 2188, number of used features: 137
[LightGBM] [Info] Start training from score 0.579982
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002063 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21880
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start training from score 0.581087
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.002087 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 21967
[LightGBM] [Info] Number of data points in the train set: 2189, number of used features: 137
[LightGBM] [Info] Start 

[I 2024-12-18 14:34:48,951] Trial 49 finished with value: 0.40272366582353936 and parameters: {'num_leaves': 497, 'max_depth': 11, 'learning_rate': 0.04748707138438789, 'feature_fraction': 0.7753133273807322, 'bagging_fraction': 0.8522001537154474, 'bagging_freq': 2, 'lambda_l1': 5.796158884528135, 'lambda_l2': 5.578615501615373e-06, 'min_data_in_leaf': 14}. Best is trial 27 with value: 0.4031979760172506.


Best parameters: {'num_leaves': 484, 'max_depth': 11, 'learning_rate': 0.04533585929025977, 'feature_fraction': 0.8110477902071817, 'bagging_fraction': 0.7265461551046623, 'bagging_freq': 2, 'lambda_l1': 5.338437863405547, 'lambda_l2': 4.499492326361118e-06, 'min_data_in_leaf': 13}
Best QWK score: 0.4031979760172506
