In [1]:
import pandas as pd

df = pd.read_csv(r"C:\Users\anime\OneDrive\Desktop\Data Science Projects\Youtube Comment Analysis\youtube_comment_analyser\data\processed\reddit_preprocessing.csv")
df

Unnamed: 0,clean_comment,category
0,family mormon never tried explain still stare ...,1
1,buddhism much lot compatible christianity espe...,1
2,seriously say thing first get complex explain ...,-1
3,learned want teach different focus goal not wr...,0
4,benefit may want read living buddha living chr...,1
...,...,...
36788,jesus,0
36789,kya bhai pure saal chutiya banaya modi aur jab...,1
36790,downvote karna tha par upvote hogaya,0
36791,haha nice,1


In [2]:
df =  df.dropna(subset=["clean_comment"])
df.shape

(36661, 2)

In [None]:
import pandas as pd
from sklearn.feature_extraction.text import TfidfVectorizer
from sklearn.model_selection import train_test_split, cross_val_score
from sklearn.metrics import accuracy_score, classification_report
from imblearn.over_sampling import SMOTE
import mlflow
import mlflow.sklearn
import os
import optuna
from lightgbm import LGBMClassifier
import matplotlib.pyplot as plt
from imblearn.under_sampling import RandomUnderSampler
from sklearn.model_selection import StratifiedKFold
import numpy as np

  from .autonotebook import tqdm as notebook_tqdm


In [None]:
mlflow.set_tracking_uri(os.getenv("MLFLOW_TRACKING_URI"))
mlflow.set_experiment("LightGBM detailed HP tuning Balanced class weights")

2025/04/06 13:11:55 INFO mlflow.tracking.fluent: Experiment with name 'LightGBM detailed HP tuning Balanced class weights' does not exist. Creating a new experiment.


<Experiment: artifact_location='s3://datascienceanimesh/101796172817218503', creation_time=1743925315513, experiment_id='101796172817218503', last_update_time=1743925315513, lifecycle_stage='active', name='LightGBM detailed HP tuning Balanced class weights', tags={}>

In [6]:
import pandas as pd
import numpy as np
import optuna
import mlflow
import mlflow.sklearn
from sklearn.model_selection import train_test_split, cross_val_score, StratifiedKFold
from sklearn.feature_extraction.text import TfidfVectorizer
from lightgbm import LGBMClassifier
from sklearn.metrics import accuracy_score, classification_report

# === Preprocessing ===

df['category'] = df['category'].map({-1: 2, 0: 0, 1: 1})
df = df.dropna(subset=['category'])

X_train_raw, X_test_raw, y_train, y_test = train_test_split(
    df['clean_comment'], df['category'], test_size=0.2, random_state=42, stratify=df['category']
)

vectorizer = TfidfVectorizer(ngram_range=(1, 3), max_features=1000)
X_train = vectorizer.fit_transform(X_train_raw)
X_test = vectorizer.transform(X_test_raw)

# === Logging Function ===

def log_mlflow(model_name, model, X_train, X_test, y_train, y_test, params, trial_number):
    with mlflow.start_run():
        mlflow.set_tag("mlflow.runName", f"Trial_{trial_number}_{model_name}_TFIDF_Trigrams")
        mlflow.set_tag("experiment_type", "algorithm_comparison")

        mlflow.log_param("algo_name", model_name)
        for key, value in params.items():
            mlflow.log_param(key, value)

        model.fit(X_train, y_train)
        y_pred = model.predict(X_test)

        accuracy = accuracy_score(y_test, y_pred)
        mlflow.log_metric("accuracy", accuracy)

        classification_rep = classification_report(y_test, y_pred, output_dict=True)
        for label, metrics in classification_rep.items():
            if isinstance(metrics, dict):
                for metric, value in metrics.items():
                    mlflow.log_metric(f"{label}_{metric}", value)

        mlflow.sklearn.log_model(model, f"{model_name}_model")

# === Optuna Objective Function ===

def objective(trial):
    params = {
        "objective": "multiclass",
        "num_class": 3,
        "learning_rate": trial.suggest_float("learning_rate", 1e-3, 1e-1),
        "n_estimators": trial.suggest_int("n_estimators", 50, 500),
        "max_depth": trial.suggest_int("max_depth", 3, 20),
        'reg_alpha': trial.suggest_float('reg_alpha', 1e-4, 10.0, log=True),
        'reg_lambda': trial.suggest_float('reg_lambda', 1e-4, 10.0, log=True),
        "metric": "multi_logloss",
        "class_weight": "balanced",
        "random_state": 42
    }

    model = LGBMClassifier(**params)
    cv = StratifiedKFold(n_splits=3, shuffle=True, random_state=42)
    scores = cross_val_score(model, X_train, y_train, cv=cv, scoring='accuracy')

    return scores.mean()

# === Run Experiment ===

def run_optuna_experiment():
    study = optuna.create_study(direction="maximize")
    study.optimize(objective, n_trials=30)

    best_params = study.best_params
    best_model = LGBMClassifier(
        n_estimators=best_params['n_estimators'],
        learning_rate=best_params['learning_rate'],
        max_depth=best_params['max_depth'],
        objective="multiclass",
        num_class=3,
        class_weight="balanced",
        random_state=42
    )

    best_model.fit(X_train, y_train)

    # Log best model with MLflow
    log_mlflow("LightGBM", best_model, X_train, X_test, y_train, y_test, best_params, study.best_trial.number)

# Execute
run_optuna_experiment()


[I 2025-04-06 13:45:44,325] A new study created in memory with name: no-name-de83033f-7dda-4d61-8fa6-8f7bf5a3a609


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.013872 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43989
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 961
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.020763 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.




[LightGBM] [Info] Total Bins 43942
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 958
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.019453 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43888
[LightGBM] [Info] Number of data points in the train set: 15154, number of used features: 960
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776






[I 2025-04-06 13:45:48,397] Trial 0 finished with value: 0.8718430182729863 and parameters: {'learning_rate': 0.039190326280721825, 'n_estimators': 257, 'max_depth': 6, 'reg_alpha': 0.37119563876876144, 'reg_lambda': 0.00015530572260014962}. Best is trial 0 with value: 0.8718430182729863.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.012299 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43989
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 961
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.013468 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43942
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 958
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] S







[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.012423 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43888
[LightGBM] [Info] Number of data points in the train set: 15154, number of used features: 960
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776


[I 2025-04-06 13:45:50,432] Trial 1 finished with value: 0.852617404642154 and parameters: {'learning_rate': 0.0467223022692332, 'n_estimators': 58, 'max_depth': 18, 'reg_alpha': 3.15042942473613, 'reg_lambda': 0.00013906910866117502}. Best is trial 0 with value: 0.8718430182729863.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.020802 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43989
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 961
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.012623 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43942
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 958
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.023527 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43888
[LightGBM] [Info] Number of data points in the train set: 15154, number of used features: 960
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776


[I 2025-04-06 13:45:51,920] Trial 2 finished with value: 0.6540688541440344 and parameters: {'learning_rate': 0.0016885099494965898, 'n_estimators': 103, 'max_depth': 4, 'reg_alpha': 0.000263105168193079, 'reg_lambda': 0.0014322156623057167}. Best is trial 0 with value: 0.8718430182729863.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.021649 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43989
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 961
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.013995 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43942
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 958
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776








[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.022019 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43888
[LightGBM] [Info] Number of data points in the train set: 15154, number of used features: 960
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776


[I 2025-04-06 13:46:01,879] Trial 3 finished with value: 0.8850415506513744 and parameters: {'learning_rate': 0.02354743359617505, 'n_estimators': 424, 'max_depth': 8, 'reg_alpha': 0.00011835118048036246, 'reg_lambda': 0.0004408013314769716}. Best is trial 3 with value: 0.8850415506513744.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.021175 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43989
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 961
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.017855 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43942
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 958
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.028657 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43888
[LightGBM] [Info] Number of data points in the train set: 15154, number of used features: 960
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776


[I 2025-04-06 13:46:09,083] Trial 4 finished with value: 0.901099724397047 and parameters: {'learning_rate': 0.08144486903004376, 'n_estimators': 304, 'max_depth': 9, 'reg_alpha': 0.00038634827976187096, 'reg_lambda': 0.055964002210524486}. Best is trial 4 with value: 0.901099724397047.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.018583 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43989
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 961
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.028191 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43942
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 958
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.017527 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43888
[LightGBM] [Info] Number of data points in the train set: 15154, number of used features: 960
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776






[I 2025-04-06 13:46:17,203] Trial 5 finished with value: 0.8707432102571292 and parameters: {'learning_rate': 0.02278910711334188, 'n_estimators': 327, 'max_depth': 8, 'reg_alpha': 0.0001180272506402551, 'reg_lambda': 0.30880106262268975}. Best is trial 4 with value: 0.901099724397047.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.017882 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43989
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 961
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.017443 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43942
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 958
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.018576 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43888
[LightGBM] [Info] Number of data points in the train set: 15154, number of used features: 960
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776


[I 2025-04-06 13:46:26,054] Trial 6 finished with value: 0.8539813435749651 and parameters: {'learning_rate': 0.019897302505853833, 'n_estimators': 322, 'max_depth': 10, 'reg_alpha': 0.44138467184174507, 'reg_lambda': 9.398564320675542}. Best is trial 4 with value: 0.901099724397047.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.019728 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43989
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 961
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.018498 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43942
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 958
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.021493 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43888
[LightGBM] [Info] Number of data points in the train set: 15154, number of used features: 960
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776


[I 2025-04-06 13:46:34,460] Trial 7 finished with value: 0.8995159202549705 and parameters: {'learning_rate': 0.0783481257153346, 'n_estimators': 459, 'max_depth': 8, 'reg_alpha': 1.2132065651013368, 'reg_lambda': 0.0018740364997732093}. Best is trial 4 with value: 0.901099724397047.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.032109 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43989
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 961
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.019284 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43942
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 958
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.017587 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43888
[LightGBM] [Info] Number of data points in the train set: 15154, number of used features: 960
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776


[I 2025-04-06 13:46:42,173] Trial 8 finished with value: 0.8985919730494717 and parameters: {'learning_rate': 0.09347301397992329, 'n_estimators': 221, 'max_depth': 16, 'reg_alpha': 0.006221932605206866, 'reg_lambda': 0.002411039186983275}. Best is trial 4 with value: 0.901099724397047.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.019169 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43989
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 961
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.020144 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43942
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 958
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776








[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.022101 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43888
[LightGBM] [Info] Number of data points in the train set: 15154, number of used features: 960
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776


[I 2025-04-06 13:46:44,515] Trial 9 finished with value: 0.8568409210667699 and parameters: {'learning_rate': 0.07826055712096597, 'n_estimators': 63, 'max_depth': 13, 'reg_alpha': 5.303926533053495, 'reg_lambda': 0.3413597914239731}. Best is trial 4 with value: 0.901099724397047.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.027509 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43989
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 961
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.018448 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43942
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 958
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.017944 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43888
[LightGBM] [Info] Number of data points in the train set: 15154, number of used features: 960
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776


[I 2025-04-06 13:46:51,096] Trial 10 finished with value: 0.9000438452908929 and parameters: {'learning_rate': 0.06659592485971687, 'n_estimators': 193, 'max_depth': 13, 'reg_alpha': 0.003382101406196237, 'reg_lambda': 0.023639590039999735}. Best is trial 4 with value: 0.901099724397047.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.017622 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43989
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 961
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.021083 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43942
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 958
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.025503 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43888
[LightGBM] [Info] Number of data points in the train set: 15154, number of used features: 960
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776


[I 2025-04-06 13:46:57,018] Trial 11 finished with value: 0.8995599130401537 and parameters: {'learning_rate': 0.06709674169144739, 'n_estimators': 169, 'max_depth': 13, 'reg_alpha': 0.0023090675763629757, 'reg_lambda': 0.04356819815407308}. Best is trial 4 with value: 0.901099724397047.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.018876 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43989
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 961
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.028907 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43942
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 958
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.020025 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43888
[LightGBM] [Info] Number of data points in the train set: 15154, number of used features: 960
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776


[I 2025-04-06 13:47:03,878] Trial 12 finished with value: 0.8999558539136645 and parameters: {'learning_rate': 0.06419623102922378, 'n_estimators': 176, 'max_depth': 15, 'reg_alpha': 0.00226724651737524, 'reg_lambda': 0.022434232029696362}. Best is trial 4 with value: 0.901099724397047.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.020395 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43989
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 961
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.019409 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43942
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 958
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.035473 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43888
[LightGBM] [Info] Number of data points in the train set: 15154, number of used features: 960
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776


[I 2025-04-06 13:47:18,313] Trial 13 finished with value: 0.8945005162764711 and parameters: {'learning_rate': 0.0920770704238568, 'n_estimators': 374, 'max_depth': 20, 'reg_alpha': 0.030143779391763194, 'reg_lambda': 0.022569382999414862}. Best is trial 4 with value: 0.901099724397047.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.019024 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43989
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 961
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.018772 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43942
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 958
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.029124 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43888
[LightGBM] [Info] Number of data points in the train set: 15154, number of used features: 960
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776


[I 2025-04-06 13:47:26,889] Trial 14 finished with value: 0.9004397687438184 and parameters: {'learning_rate': 0.059145987679707065, 'n_estimators': 294, 'max_depth': 11, 'reg_alpha': 0.0009296407769070868, 'reg_lambda': 0.2600771674491967}. Best is trial 4 with value: 0.901099724397047.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.020788 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43989
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 961
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.018452 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43942
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 958
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.019336 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43888
[LightGBM] [Info] Number of data points in the train set: 15154, number of used features: 960
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776


[I 2025-04-06 13:47:34,881] Trial 15 finished with value: 0.8985480499466303 and parameters: {'learning_rate': 0.05402223179849441, 'n_estimators': 299, 'max_depth': 10, 'reg_alpha': 0.0008244975376978107, 'reg_lambda': 0.81105794628091}. Best is trial 4 with value: 0.901099724397047.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.021218 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43989
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 961
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.029151 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43942
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 958
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.018814 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43888
[LightGBM] [Info] Number of data points in the train set: 15154, number of used features: 960
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776


[I 2025-04-06 13:47:38,535] Trial 16 finished with value: 0.8789702733735828 and parameters: {'learning_rate': 0.08034053886191013, 'n_estimators': 377, 'max_depth': 3, 'reg_alpha': 0.051825052981132165, 'reg_lambda': 3.199655356614412}. Best is trial 4 with value: 0.901099724397047.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.019041 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43989
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 961
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.021965 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43942
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 958
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.020529 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43888
[LightGBM] [Info] Number of data points in the train set: 15154, number of used features: 960
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776


[I 2025-04-06 13:47:46,891] Trial 17 finished with value: 0.9003518005940373 and parameters: {'learning_rate': 0.05585768345947247, 'n_estimators': 264, 'max_depth': 11, 'reg_alpha': 0.0007164711499911326, 'reg_lambda': 0.09001807253737719}. Best is trial 4 with value: 0.901099724397047.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.020081 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43989
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 961
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.019397 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43942
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 958
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.029675 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43888
[LightGBM] [Info] Number of data points in the train set: 15154, number of used features: 960
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776


[I 2025-04-06 13:47:53,489] Trial 18 finished with value: 0.9014956826911432 and parameters: {'learning_rate': 0.09999880250422176, 'n_estimators': 363, 'max_depth': 6, 'reg_alpha': 0.02215567900216331, 'reg_lambda': 0.007320946065820303}. Best is trial 18 with value: 0.9014956826911432.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.021659 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43989
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 961
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.025273 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43942
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 958
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.019859 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43888
[LightGBM] [Info] Number of data points in the train set: 15154, number of used features: 960
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776


[I 2025-04-06 13:48:01,861] Trial 19 finished with value: 0.9014956826911432 and parameters: {'learning_rate': 0.09891383916297276, 'n_estimators': 495, 'max_depth': 5, 'reg_alpha': 0.022456834296823547, 'reg_lambda': 0.007141464264235266}. Best is trial 18 with value: 0.9014956826911432.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.033642 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43989
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 961
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.025258 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43942
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 958
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.020417 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43888
[LightGBM] [Info] Number of data points in the train set: 15154, number of used features: 960
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776


[I 2025-04-06 13:48:09,841] Trial 20 finished with value: 0.9014956943048668 and parameters: {'learning_rate': 0.09753761576880648, 'n_estimators': 492, 'max_depth': 5, 'reg_alpha': 0.0264687959991935, 'reg_lambda': 0.006685854418852646}. Best is trial 20 with value: 0.9014956943048668.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.019367 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43989
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 961
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.021350 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43942
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 958
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.026278 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43888
[LightGBM] [Info] Number of data points in the train set: 15154, number of used features: 960
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776


[I 2025-04-06 13:48:17,509] Trial 21 finished with value: 0.9019796439761915 and parameters: {'learning_rate': 0.09990876157398487, 'n_estimators': 500, 'max_depth': 5, 'reg_alpha': 0.027114917538161865, 'reg_lambda': 0.0071763991623728365}. Best is trial 21 with value: 0.9019796439761915.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.022556 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43989
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 961
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.020579 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43942
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 958
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.026411 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43888
[LightGBM] [Info] Number of data points in the train set: 15154, number of used features: 960
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776


[I 2025-04-06 13:48:26,363] Trial 22 finished with value: 0.9004397397095092 and parameters: {'learning_rate': 0.09929028752026714, 'n_estimators': 495, 'max_depth': 6, 'reg_alpha': 0.09676052709908568, 'reg_lambda': 0.004065098845367495}. Best is trial 21 with value: 0.9019796439761915.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.035819 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43989
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 961
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.020698 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43942
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 958
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.022462 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43888
[LightGBM] [Info] Number of data points in the train set: 15154, number of used features: 960
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776


[I 2025-04-06 13:48:31,067] Trial 23 finished with value: 0.897008209555428 and parameters: {'learning_rate': 0.08746359502644935, 'n_estimators': 434, 'max_depth': 3, 'reg_alpha': 0.012826535270192323, 'reg_lambda': 0.005286268888847246}. Best is trial 21 with value: 0.9019796439761915.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.020479 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43989
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 961
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.022211 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43942
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 958
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.023061 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43888
[LightGBM] [Info] Number of data points in the train set: 15154, number of used features: 960
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776


[I 2025-04-06 13:48:38,682] Trial 24 finished with value: 0.9011437287959536 and parameters: {'learning_rate': 0.08906046267934892, 'n_estimators': 404, 'max_depth': 6, 'reg_alpha': 0.11363517650171567, 'reg_lambda': 0.0008892797321549664}. Best is trial 21 with value: 0.9019796439761915.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.040239 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43989
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 961
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.022914 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43942
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 958
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.022599 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43888
[LightGBM] [Info] Number of data points in the train set: 15154, number of used features: 960
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776


[I 2025-04-06 13:48:45,992] Trial 25 finished with value: 0.9010557548393109 and parameters: {'learning_rate': 0.09908417510832485, 'n_estimators': 466, 'max_depth': 5, 'reg_alpha': 0.19962894566665784, 'reg_lambda': 0.010449172103380621}. Best is trial 21 with value: 0.9019796439761915.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.021294 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43989
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 961
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.023741 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43942
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 958
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.023171 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43888
[LightGBM] [Info] Number of data points in the train set: 15154, number of used features: 960
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776


[I 2025-04-06 13:48:54,793] Trial 26 finished with value: 0.900923718415143 and parameters: {'learning_rate': 0.07250668827333073, 'n_estimators': 363, 'max_depth': 7, 'reg_alpha': 0.01008988671370274, 'reg_lambda': 0.0004799830625362204}. Best is trial 21 with value: 0.9019796439761915.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.022203 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43989
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 961
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.030287 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43942
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 958
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.022706 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43888
[LightGBM] [Info] Number of data points in the train set: 15154, number of used features: 960
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776


[I 2025-04-06 13:49:01,358] Trial 27 finished with value: 0.9007917342527314 and parameters: {'learning_rate': 0.08512362317387909, 'n_estimators': 458, 'max_depth': 4, 'reg_alpha': 0.06189445679865331, 'reg_lambda': 0.008125173081954158}. Best is trial 21 with value: 0.9019796439761915.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.027737 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43989
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 961
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.028680 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43942
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 958
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.039597 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 43888
[LightGBM] [Info] Number of data points in the train set: 15154, number of used features: 960
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776


[I 2025-04-06 13:49:09,050] Trial 28 finished with value: 0.9015396928969119 and parameters: {'learning_rate': 0.09337157228505982, 'n_estimators': 500, 'max_depth': 4, 'reg_alpha': 0.015590102169279958, 'reg_lambda': 0.012945328617750315}. Best is trial 21 with value: 0.9019796439761915.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.027012 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43989
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 961
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.022405 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43942
[LightGBM] [Info] Number of data points in the train set: 15153, number of used features: 958
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.032370 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 43888
[LightGBM] [Info] Number of data points in the train set: 15154, number of used features: 960
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776


[I 2025-04-06 13:49:14,914] Trial 29 finished with value: 0.8630441592795255 and parameters: {'learning_rate': 0.03510506348147473, 'n_estimators': 497, 'max_depth': 3, 'reg_alpha': 0.5670234893906688, 'reg_lambda': 0.09232793718512286}. Best is trial 21 with value: 0.9019796439761915.


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.038501 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 62268
[LightGBM] [Info] Number of data points in the train set: 22730, number of used features: 963
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.019374 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 62268
[LightGBM] [Info] Number of data points in the train set: 22730, number of used features: 963
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -0.693147
[LightGBM] [Info] Start training from score -34.538776




🏃 View run Trial_21_LightGBM_TFIDF_Trigrams at: http://ec2-13-49-0-142.eu-north-1.compute.amazonaws.com:5000/#/experiments/101796172817218503/runs/bc01f90f4903451493edc843f74c41c0
🧪 View experiment at: http://ec2-13-49-0-142.eu-north-1.compute.amazonaws.com:5000/#/experiments/101796172817218503
