In [18]:
import pandas as pd
import optuna
import lightgbm as lgb
from sklearn.model_selection import train_test_split,cross_val_score,GridSearchCV
from sklearn.feature_extraction.text import TfidfVectorizer
from sklearn.metrics import classification_report,accuracy_score

In [19]:
# laoding the cleaned data
data = pd.read_csv(r"C:\Users\Varun\Downloads\Saurav\MLOPS_Chrome_plugin\data\preprocessed_data.csv")

# drop the rows with NaN values
df = data.dropna()

In [20]:
# Separating the input and output features
X = df.clean_comment
y = df.category

In [21]:
# Spliting the train and test data
X_train,X_test,y_train,y_test = train_test_split(X,y,train_size = 0.2,random_state = 42)

In [48]:
# Applying the Tfidf with trigram and max_features = 10000
tf_idf = TfidfVectorizer(ngram_range = (1,3),max_features = 5000)

In [49]:
# Fitting the vectorizer on training data and transforming the test data
X_train_tfidf = tf_idf.fit_transform(X_train)
X_test_tfidf = tf_idf.transform(X_test)

In [50]:
# Function to optimize the LightGBM hyperparameters
def objective(trial):
    param = {
        # Core Parameters
        'objective': 'multiclass', # Change to 'multiclass' for multi-class
        'num_class': 3,
        'learning_rate': trial.suggest_float('learning_rate', 1e-3, 1e-1),
        'n_estimators': trial.suggest_int('n_estimators', 50, 500), 
        'max_depth': trial.suggest_int('max_depth', 3, 20),
        'metric' : 'multi_logloss',
        'is_unbalance' : True,
        'class_weight' : 'balanced',
    }

    # defining the model with trial parameters
    model = lgb.LGBMClassifier(**param)

    # perform cross-validation
    scores = cross_val_score(model,X_train_tfidf,y_train,cv = 3,scoring = "accuracy")

    # return the average score across folds
    return scores.mean()

In [51]:
# craete an Optuna study to optimize the hyperparameters
study = optuna.create_study(direction = "maximize")
study.optimize(objective,n_trials = 50)

[I 2025-10-21 22:20:22,675] A new study created in memory with name: no-name-5c054144-acbf-4e70-83e1-d1878b18632a


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004500 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004906 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.005091 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612


[I 2025-10-21 22:20:25,782] Trial 0 finished with value: 0.7258592471358428 and parameters: {'learning_rate': 0.08525182728477844, 'n_estimators': 273, 'max_depth': 19}. Best is trial 0 with value: 0.7258592471358428.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003721 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004649 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Star



[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.005502 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612


[I 2025-10-21 22:20:26,434] Trial 1 finished with value: 0.6194762684124385 and parameters: {'learning_rate': 0.013055514419443363, 'n_estimators': 66, 'max_depth': 7}. Best is trial 0 with value: 0.7258592471358428.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003748 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.003830 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003853 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612


[I 2025-10-21 22:20:27,178] Trial 2 finished with value: 0.7291325695581015 and parameters: {'learning_rate': 0.080381503365253, 'n_estimators': 280, 'max_depth': 3}. Best is trial 2 with value: 0.7291325695581015.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003614 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003732 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.003634 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612


[I 2025-10-21 22:20:27,944] Trial 3 finished with value: 0.623567921440262 and parameters: {'learning_rate': 0.011589406526687475, 'n_estimators': 90, 'max_depth': 7}. Best is trial 2 with value: 0.7291325695581015.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003638 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.005268 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004016 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612


[I 2025-10-21 22:20:28,480] Trial 4 finished with value: 0.6913529732678669 and parameters: {'learning_rate': 0.049488996916742724, 'n_estimators': 91, 'max_depth': 5}. Best is trial 2 with value: 0.7291325695581015.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004511 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.005513 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Star



[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003785 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612






[I 2025-10-21 22:20:32,136] Trial 5 finished with value: 0.7306328423349701 and parameters: {'learning_rate': 0.05314731107182183, 'n_estimators': 364, 'max_depth': 16}. Best is trial 5 with value: 0.7306328423349701.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.012454 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004392 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003977 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Star





[I 2025-10-21 22:20:34,562] Trial 6 finished with value: 0.7287234042553191 and parameters: {'learning_rate': 0.08672199254528612, 'n_estimators': 228, 'max_depth': 15}. Best is trial 5 with value: 0.7306328423349701.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003951 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003748 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Star



[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004166 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612






[I 2025-10-21 22:20:36,050] Trial 7 finished with value: 0.7355428259683578 and parameters: {'learning_rate': 0.07196155557792265, 'n_estimators': 147, 'max_depth': 15}. Best is trial 7 with value: 0.7355428259683578.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.005346 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003749 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Star



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.003592 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612






[I 2025-10-21 22:20:36,958] Trial 8 finished with value: 0.5830605564648118 and parameters: {'learning_rate': 0.005436535651090346, 'n_estimators': 283, 'max_depth': 3}. Best is trial 7 with value: 0.7355428259683578.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.005452 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004027 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004590 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Star





[I 2025-10-21 22:20:38,910] Trial 9 finished with value: 0.7369067103109656 and parameters: {'learning_rate': 0.05810008048690408, 'n_estimators': 334, 'max_depth': 7}. Best is trial 9 with value: 0.7369067103109656.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004855 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.005377 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003796 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Star





[I 2025-10-21 22:20:42,273] Trial 10 finished with value: 0.7354064375340971 and parameters: {'learning_rate': 0.03666541417202929, 'n_estimators': 452, 'max_depth': 10}. Best is trial 9 with value: 0.7369067103109656.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003893 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003754 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.003729 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612


[I 2025-10-21 22:20:43,742] Trial 11 finished with value: 0.7332242225859247 and parameters: {'learning_rate': 0.06115514856403145, 'n_estimators': 166, 'max_depth': 12}. Best is trial 9 with value: 0.7369067103109656.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003845 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004531 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.005321 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Star





[I 2025-10-21 22:20:46,534] Trial 12 finished with value: 0.7309056192034916 and parameters: {'learning_rate': 0.06861802600697192, 'n_estimators': 400, 'max_depth': 11}. Best is trial 9 with value: 0.7369067103109656.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004581 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004043 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Star







[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.021513 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612


[I 2025-10-21 22:20:48,121] Trial 13 finished with value: 0.731860338243317 and parameters: {'learning_rate': 0.09986080071204867, 'n_estimators': 166, 'max_depth': 14}. Best is trial 9 with value: 0.7369067103109656.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004523 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003720 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003832 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612


[I 2025-10-21 22:20:52,094] Trial 14 finished with value: 0.7321331151118385 and parameters: {'learning_rate': 0.03809562210055058, 'n_estimators': 354, 'max_depth': 19}. Best is trial 9 with value: 0.7369067103109656.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003574 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.003914 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.003594 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612






[I 2025-10-21 22:20:53,507] Trial 15 finished with value: 0.7339061647572285 and parameters: {'learning_rate': 0.07151375935653191, 'n_estimators': 187, 'max_depth': 9}. Best is trial 9 with value: 0.7369067103109656.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003666 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.005567 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.005538 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612


[I 2025-10-21 22:20:57,598] Trial 16 finished with value: 0.7352700490998364 and parameters: {'learning_rate': 0.029971466934592114, 'n_estimators': 331, 'max_depth': 17}. Best is trial 9 with value: 0.7369067103109656.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.005157 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004109 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004174 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612


[I 2025-10-21 22:21:01,775] Trial 17 finished with value: 0.7254500818330606 and parameters: {'learning_rate': 0.05308424453809238, 'n_estimators': 497, 'max_depth': 13}. Best is trial 9 with value: 0.7369067103109656.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004605 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.003981 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.005605 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612


[I 2025-10-21 22:21:03,211] Trial 18 finished with value: 0.7354064375340972 and parameters: {'learning_rate': 0.09616956489530276, 'n_estimators': 214, 'max_depth': 8}. Best is trial 9 with value: 0.7369067103109656.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003909 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003997 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Star



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.004406 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612


[I 2025-10-21 22:21:03,776] Trial 19 finished with value: 0.7184942716857611 and parameters: {'learning_rate': 0.07288950756686399, 'n_estimators': 111, 'max_depth': 5}. Best is trial 9 with value: 0.7369067103109656.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.003856 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.005544 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.005111 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Star





[I 2025-10-21 22:21:05,700] Trial 20 finished with value: 0.7366339334424441 and parameters: {'learning_rate': 0.061370544742506444, 'n_estimators': 134, 'max_depth': 20}. Best is trial 9 with value: 0.7369067103109656.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004941 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004197 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.005300 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612






[I 2025-10-21 22:21:07,622] Trial 21 finished with value: 0.7343153300600109 and parameters: {'learning_rate': 0.06259999209099554, 'n_estimators': 133, 'max_depth': 20}. Best is trial 9 with value: 0.7369067103109656.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.007210 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.005392 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Star







[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.005146 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612


[I 2025-10-21 22:21:10,467] Trial 22 finished with value: 0.7343153300600109 and parameters: {'learning_rate': 0.04596819519520353, 'n_estimators': 243, 'max_depth': 17}. Best is trial 9 with value: 0.7369067103109656.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.005200 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.005928 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Star



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.004774 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612


[I 2025-10-21 22:21:11,405] Trial 23 finished with value: 0.7298145117294054 and parameters: {'learning_rate': 0.0622054161992334, 'n_estimators': 56, 'max_depth': 18}. Best is trial 9 with value: 0.7369067103109656.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.004832 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.005868 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.005343 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612






[I 2025-10-21 22:21:12,992] Trial 24 finished with value: 0.7349972722313147 and parameters: {'learning_rate': 0.0783509216461605, 'n_estimators': 134, 'max_depth': 15}. Best is trial 9 with value: 0.7369067103109656.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.005786 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004372 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Star







[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003706 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612


[I 2025-10-21 22:21:15,314] Trial 25 finished with value: 0.7332242225859247 and parameters: {'learning_rate': 0.05951575292448512, 'n_estimators': 312, 'max_depth': 12}. Best is trial 9 with value: 0.7369067103109656.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.005253 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003736 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Star



[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004061 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612






[I 2025-10-21 22:21:17,514] Trial 26 finished with value: 0.7345881069285324 and parameters: {'learning_rate': 0.04288169681403778, 'n_estimators': 199, 'max_depth': 20}. Best is trial 9 with value: 0.7369067103109656.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004387 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.010109 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003725 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612


[I 2025-10-21 22:21:19,485] Trial 27 finished with value: 0.7313147845062739 and parameters: {'learning_rate': 0.0251467801309796, 'n_estimators': 254, 'max_depth': 10}. Best is trial 9 with value: 0.7369067103109656.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.005192 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004159 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.005452 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612


[I 2025-10-21 22:21:21,013] Trial 28 finished with value: 0.7351336606655755 and parameters: {'learning_rate': 0.0678209894253804, 'n_estimators': 404, 'max_depth': 5}. Best is trial 9 with value: 0.7369067103109656.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.003575 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004032 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612








[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004593 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612


[I 2025-10-21 22:21:22,457] Trial 29 finished with value: 0.7352700490998364 and parameters: {'learning_rate': 0.08092074472570399, 'n_estimators': 154, 'max_depth': 14}. Best is trial 9 with value: 0.7369067103109656.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003585 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003739 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.005301 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612


[I 2025-10-21 22:21:26,497] Trial 30 finished with value: 0.7193126022913257 and parameters: {'learning_rate': 0.08599563671593274, 'n_estimators': 415, 'max_depth': 18}. Best is trial 9 with value: 0.7369067103109656.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.005358 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004502 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Star



[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.005835 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612






[I 2025-10-21 22:21:28,033] Trial 31 finished with value: 0.7317239498090561 and parameters: {'learning_rate': 0.05552827577271821, 'n_estimators': 211, 'max_depth': 8}. Best is trial 9 with value: 0.7369067103109656.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.005239 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.006067 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003657 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Star





[I 2025-10-21 22:21:29,124] Trial 32 finished with value: 0.7359519912711402 and parameters: {'learning_rate': 0.09771590670189566, 'n_estimators': 191, 'max_depth': 7}. Best is trial 9 with value: 0.7369067103109656.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.004283 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.004497 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003649 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612


[I 2025-10-21 22:21:29,872] Trial 33 finished with value: 0.7325422804146209 and parameters: {'learning_rate': 0.0893082965896364, 'n_estimators': 130, 'max_depth': 7}. Best is trial 9 with value: 0.7369067103109656.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004132 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003961 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.003600 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612


[I 2025-10-21 22:21:31,248] Trial 34 finished with value: 0.7382705946535734 and parameters: {'learning_rate': 0.07792795490058824, 'n_estimators': 294, 'max_depth': 6}. Best is trial 34 with value: 0.7382705946535734.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004231 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004253 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.005170 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612


[I 2025-10-21 22:21:32,534] Trial 35 finished with value: 0.7352700490998364 and parameters: {'learning_rate': 0.09017012423735557, 'n_estimators': 299, 'max_depth': 6}. Best is trial 34 with value: 0.7382705946535734.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004317 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.005993 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Star



[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004115 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612






[I 2025-10-21 22:21:33,447] Trial 36 finished with value: 0.7315875613747954 and parameters: {'learning_rate': 0.07924402602800609, 'n_estimators': 267, 'max_depth': 4}. Best is trial 34 with value: 0.7382705946535734.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003852 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003714 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.005308 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612






[I 2025-10-21 22:21:35,146] Trial 37 finished with value: 0.7340425531914895 and parameters: {'learning_rate': 0.09706914406444994, 'n_estimators': 329, 'max_depth': 6}. Best is trial 34 with value: 0.7382705946535734.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003813 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004195 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004639 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612


[I 2025-10-21 22:21:35,868] Trial 38 finished with value: 0.7302236770321877 and parameters: {'learning_rate': 0.0913799657322529, 'n_estimators': 88, 'max_depth': 8}. Best is trial 34 with value: 0.7382705946535734.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.006315 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.004075 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.005429 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612


[I 2025-10-21 22:21:36,930] Trial 39 finished with value: 0.7332242225859247 and parameters: {'learning_rate': 0.07569346336765372, 'n_estimators': 377, 'max_depth': 3}. Best is trial 34 with value: 0.7382705946535734.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.005537 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.005308 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.005770 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612


[I 2025-10-21 22:21:38,319] Trial 40 finished with value: 0.7319967266775778 and parameters: {'learning_rate': 0.06577854604472856, 'n_estimators': 232, 'max_depth': 6}. Best is trial 34 with value: 0.7382705946535734.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.003611 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003851 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612


[I 2025-10-21 22:21:38,998] Trial 41 finished with value: 0.7152209492635025 and parameters: {'learning_rate': 0.0568565836339356, 'n_estimators': 80, 'max_depth': 9}. Best is trial 34 with value: 0.7382705946535734.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003690 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.005170 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Star



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.005007 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612


[I 2025-10-21 22:21:39,697] Trial 42 finished with value: 0.7303600654664484 and parameters: {'learning_rate': 0.08450801408069379, 'n_estimators': 108, 'max_depth': 7}. Best is trial 34 with value: 0.7382705946535734.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.005652 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.003669 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004991 s







[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003650 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612


[I 2025-10-21 22:21:41,928] Trial 43 finished with value: 0.7319967266775778 and parameters: {'learning_rate': 0.07284985276898417, 'n_estimators': 291, 'max_depth': 11}. Best is trial 34 with value: 0.7382705946535734.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.003935 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.005257 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612








[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.004317 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612


[I 2025-10-21 22:21:43,325] Trial 44 finished with value: 0.7310420076377523 and parameters: {'learning_rate': 0.051159482371338424, 'n_estimators': 173, 'max_depth': 9}. Best is trial 34 with value: 0.7382705946535734.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.004893 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.005656 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.004431 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612


[I 2025-10-21 22:21:44,534] Trial 45 finished with value: 0.7296781232951446 and parameters: {'learning_rate': 0.06603472212486725, 'n_estimators': 262, 'max_depth': 4}. Best is trial 34 with value: 0.7382705946535734.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.005880 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.006022 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Star







[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004839 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612


[I 2025-10-21 22:21:47,972] Trial 46 finished with value: 0.7309056192034915 and parameters: {'learning_rate': 0.04803434795733115, 'n_estimators': 337, 'max_depth': 16}. Best is trial 34 with value: 0.7382705946535734.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004023 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004947 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Star







[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003771 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612


[I 2025-10-21 22:21:49,239] Trial 47 finished with value: 0.7324058919803601 and parameters: {'learning_rate': 0.08343499264314805, 'n_estimators': 151, 'max_depth': 10}. Best is trial 34 with value: 0.7382705946535734.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003710 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.004199 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Star



[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003650 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612






[I 2025-10-21 22:21:50,981] Trial 48 finished with value: 0.7344517184942717 and parameters: {'learning_rate': 0.07082398432803655, 'n_estimators': 193, 'max_depth': 13}. Best is trial 34 with value: 0.7382705946535734.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003844 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15745
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 761
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.005723 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 16121
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 784
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Star



[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.003873 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 15640
[LightGBM] [Info] Number of data points in the train set: 4888, number of used features: 773
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612






[I 2025-10-21 22:21:52,181] Trial 49 finished with value: 0.7334969994544464 and parameters: {'learning_rate': 0.07587938334907489, 'n_estimators': 357, 'max_depth': 4}. Best is trial 34 with value: 0.7382705946535734.




In [52]:
# Extracts the best_parameters
best_params = study.best_params
best_params

{'learning_rate': 0.07792795490058824, 'n_estimators': 294, 'max_depth': 6}

In [65]:
# Best Model 
best_model = lgb.LGBMClassifier(

        objective = "multiclass",
        num_class = 3,
        metric    = "multi_logloss",
     is_unbalance = True,
     class_weight = "balanced",
    learning_rate = 0.08,
        max_depth = 20,
     n_estimators = 282
)

In [66]:
# fitting the best model
best_model.fit(X_train_tfidf,y_train)

[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.008066 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 26751
[LightGBM] [Info] Number of data points in the train set: 7332, number of used features: 1189
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612
[LightGBM] [Info] Start training from score -1.098612


In [67]:
# Prediction on train set
y_train_pred = best_model.predict(X_train_tfidf)



In [68]:
# Calculate the accuracy on train set
train_score = accuracy_score(y_train,y_train_pred)
train_score

0.918848881614839

In [69]:
# Classification report 
train_report = classification_report(y_train,y_train_pred)
print(train_report)

              precision    recall  f1-score   support

          -1       0.93      0.90      0.92      1730
           0       0.84      0.99      0.91      2429
           1       0.99      0.88      0.93      3173

    accuracy                           0.92      7332
   macro avg       0.92      0.92      0.92      7332
weighted avg       0.93      0.92      0.92      7332



In [70]:
# Prediction on test data
y_pred = best_model.predict(X_test_tfidf)



In [71]:
# Accuracy on test set
accuracy = accuracy_score(y_test,y_pred)
accuracy

0.7725196045005114

In [72]:
# Classification report 
train_report = classification_report(y_test,y_pred)
print(train_report)

              precision    recall  f1-score   support

          -1       0.67      0.63      0.65      6518
           0       0.76      0.90      0.82     10215
           1       0.84      0.75      0.79     12597

    accuracy                           0.77     29330
   macro avg       0.76      0.76      0.75     29330
weighted avg       0.78      0.77      0.77     29330

