In [14]:
import pandas as pd
import numpy as np
from sklearn.model_selection import TimeSeriesSplit
from sklearn.metrics import mean_squared_error
import lightgbm as lgb
import optuna
import joblib

In [15]:
# Cargar datos
sellin = pd.read_csv("datasets/sell-in.csv", sep='\t')
productos = pd.read_csv("datasets/tb_productos.csv", sep='\t')
stocks = pd.read_csv("datasets/tb_stocks.csv", sep='\t')
productos = productos.drop_duplicates(subset=['product_id'], keep='first')

# Merge inicial
df = sellin.merge(productos, on="product_id", how="left").merge(stocks, on=["product_id", "periodo"], how="left")
df['periodo_dt'] = pd.to_datetime(df['periodo'].astype(str), format='%Y%m')

In [16]:
# Feature engineering
vida_producto = df.groupby("product_id")["periodo_dt"].agg(["min", "max"]).reset_index()
periodos_producto = [(p, row["product_id"]) for _, row in vida_producto.iterrows() 
                     for p in pd.date_range(row["min"], row["max"], freq="MS")]
df_pp = pd.DataFrame(periodos_producto, columns=["periodo_dt", "product_id"])
df_pp['periodo'] = df_pp['periodo_dt'].dt.strftime('%Y%m').astype(int)
df_pp = df_pp.merge(productos, on="product_id", how="left").merge(stocks, on=["product_id", "periodo"], how="left")

ventas = df.groupby(['periodo', 'product_id']).agg({'tn':'sum'}).reset_index()
df_pp = df_pp.merge(ventas, on=['periodo', 'product_id'], how='left')
df_pp['tn'] = df_pp['tn'].fillna(0)

df_pp['periodo_dt'] = pd.to_datetime(df_pp['periodo'].astype(str), format='%Y%m')
df_pp['month'] = df_pp['periodo_dt'].dt.month
df_pp['quarter'] = df_pp['periodo_dt'].dt.quarter
df_pp['year'] = df_pp['periodo_dt'].dt.year
df_pp['stock_ratio'] = df_pp.apply(lambda x: x['tn']/x['stock_final'] if x['stock_final']>0 else 0, axis=1)
df_pp['stock_ratio'] = df_pp['stock_ratio'].replace([np.inf, -np.inf], 0).fillna(0)

df_pp = df_pp.sort_values(['product_id','periodo_dt'])
for lag in range(1,4):
    df_pp[f'tn_lag_{lag}'] = df_pp.groupby('product_id')['tn'].shift(lag)
df_pp['tn_diff'] = df_pp['tn'] - df_pp['tn_lag_1']

df_pp['tn_target'] = df_pp.groupby('product_id')['tn'].shift(-2)
train_data = df_pp[~df_pp['periodo'].isin([201911,201912])]
test_data = df_pp[df_pp['periodo'] == 201912]

In [29]:
df_pp.shape

(31522, 19)

In [26]:
import lightgbm as lgb
from sklearn.model_selection import TimeSeriesSplit
from sklearn.metrics import mean_squared_error
import optuna
import numpy as np
import pandas as pd

# Suponemos que df_pp ya est√° cargado con features y target
X = df_pp.drop(columns=['periodo_dt', 'tn_target', 'tn'], errors='ignore')
y = df_pp['tn_target']

# Identificar columnas categ√≥ricas
cols_categoricas = X.select_dtypes(include=['object', 'category']).columns.tolist()
print(f"Columnas categ√≥ricas: {cols_categoricas}")

# Codificar columnas categ√≥ricas autom√°ticamente
for col in cols_categoricas:
    X[col] = X[col].astype('category').cat.codes



if y.isnull().any():
    print(f"‚ö†Ô∏è Target tiene {y.isnull().sum()} NaN. Eliminando esas filas.")
    mask = ~y.isnull()
    X = X[mask]
    y = y[mask]


# Verificar tama√±o final
if X.empty or y.empty:
    print("‚ùå X o y est√°n vac√≠os despu√©s de la limpieza. Revisa tu dataset.")
else:
    print(f"‚úÖ Datos listos: X shape={X.shape}, y shape={y.shape}")

    # Optuna + TimeSeriesSplit
    def objective(trial):
        params = {
            'objective': 'regression',
            'metric': 'rmse',
            'num_leaves': trial.suggest_int('num_leaves', 20, 150),
            'max_depth': trial.suggest_int('max_depth', 3, 15),
            'learning_rate': trial.suggest_float('learning_rate', 1e-3, 0.1, log=True),
            'n_estimators': trial.suggest_int('n_estimators', 100, 1000),
            'subsample': trial.suggest_float('subsample', 0.6, 1.0),
            'colsample_bytree': trial.suggest_float('colsample_bytree', 0.6, 1.0),
            'reg_alpha': trial.suggest_float('reg_alpha', 1e-8, 10.0, log=True),
            'reg_lambda': trial.suggest_float('reg_lambda', 1e-8, 10.0, log=True)
        }

        tscv = TimeSeriesSplit(n_splits=3)
        rmses = []
        for fold, (train_idx, val_idx) in enumerate(tscv.split(X)):
            X_train, X_val = X.iloc[train_idx], X.iloc[val_idx]
            y_train, y_val = y.iloc[train_idx], y.iloc[val_idx]

            if X_train.empty or X_val.empty:
                print(f"‚ö†Ô∏è Fold {fold+1}: conjunto vac√≠o. Saltando.")
                continue

            model = lgb.LGBMRegressor(**params)
            model.fit(
                X_train, y_train,
                eval_set=[(X_val, y_val)],
                callbacks=[lgb.early_stopping(50), lgb.log_evaluation(0)]
            )
            preds = model.predict(X_val)
            rmse = mean_squared_error(y_val, preds, squared=False)
            rmses.append(rmse)

        if len(rmses) == 0:
            return np.inf
        return np.mean(rmses)

    study = optuna.create_study(direction='minimize')
    study.optimize(objective, n_trials=50)
    print("‚úÖ Mejores par√°metros:", study.best_params)

    # Entrenamiento final
    final_model = lgb.LGBMRegressor(**study.best_params)
    final_model.fit(X, y)
    print("‚úÖ Modelo entrenado con los mejores par√°metros.")


[I 2025-05-30 12:26:41,977] A new study created in memory with name: no-name-ed76e028-8ade-44b2-ab1d-67bbce3691e8


Columnas categ√≥ricas: ['cat1', 'cat2', 'cat3', 'brand']
‚úÖ Datos listos: X shape=(31522, 16), y shape=(31522,)
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000310 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Did not meet early stopping. Best iteration is:
[210]	valid_0's rmse: 74.9826
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000407 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds




Did not meet early stopping. Best iteration is:
[210]	valid_0's rmse: 43.8578
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000383 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds




Did not meet early stopping. Best iteration is:
[210]	valid_0's rmse: 31.365


[I 2025-05-30 12:26:42,837] Trial 0 finished with value: 50.06846168148483 and parameters: {'num_leaves': 107, 'max_depth': 8, 'learning_rate': 0.0025299934894699766, 'n_estimators': 210, 'subsample': 0.9421279523847893, 'colsample_bytree': 0.6460437051336029, 'reg_alpha': 0.00013936228783999752, 'reg_lambda': 8.575277853457741e-07}. Best is trial 0 with value: 50.06846168148483.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000349 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Did not meet early stopping. Best iteration is:
[197]	valid_0's rmse: 16.226
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000355 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds




Did not meet early stopping. Best iteration is:
[197]	valid_0's rmse: 8.33896
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000399 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds
Did not meet early stopping. Best iteration is:
[197]	valid_0's rmse: 5.11226


[I 2025-05-30 12:26:43,361] Trial 1 finished with value: 9.892408256710786 and parameters: {'num_leaves': 50, 'max_depth': 14, 'learning_rate': 0.020167875678519357, 'n_estimators': 197, 'subsample': 0.7542661003984398, 'colsample_bytree': 0.6837755656127211, 'reg_alpha': 1.1748193939551659e-05, 'reg_lambda': 0.001144995144538462}. Best is trial 1 with value: 9.892408256710786.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000363 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Did not meet early stopping. Best iteration is:
[763]	valid_0's rmse: 22.2224
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000297 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds




Did not meet early stopping. Best iteration is:
[763]	valid_0's rmse: 11.7706
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000397 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds




Did not meet early stopping. Best iteration is:
[763]	valid_0's rmse: 7.18277


[I 2025-05-30 12:26:44,195] Trial 2 finished with value: 13.725255746234014 and parameters: {'num_leaves': 131, 'max_depth': 4, 'learning_rate': 0.004544903818360334, 'n_estimators': 763, 'subsample': 0.8637502375201896, 'colsample_bytree': 0.9833618568984238, 'reg_alpha': 0.08068123403609838, 'reg_lambda': 1.2318532283653631e-08}. Best is trial 1 with value: 9.892408256710786.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000240 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Early stopping, best iteration is:
[653]	valid_0's rmse: 11.7909
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000302 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds




Early stopping, best iteration is:
[706]	valid_0's rmse: 6.34133
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000489 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds


[I 2025-05-30 12:26:45,104] Trial 3 finished with value: 7.312670630789184 and parameters: {'num_leaves': 78, 'max_depth': 6, 'learning_rate': 0.02844381166540833, 'n_estimators': 756, 'subsample': 0.8415366386043193, 'colsample_bytree': 0.6051251223732466, 'reg_alpha': 0.0038785559283679087, 'reg_lambda': 2.0810500678074004}. Best is trial 3 with value: 7.312670630789184.


Early stopping, best iteration is:
[264]	valid_0's rmse: 3.80573
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000247 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Did not meet early stopping. Best iteration is:
[928]	valid_0's rmse: 48.0326
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000581 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds




Did not meet early stopping. Best iteration is:
[928]	valid_0's rmse: 27.5786
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000470 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds


[I 2025-05-30 12:26:49,615] Trial 4 finished with value: 31.627108448189187 and parameters: {'num_leaves': 114, 'max_depth': 11, 'learning_rate': 0.001180251284644215, 'n_estimators': 928, 'subsample': 0.8865868185419932, 'colsample_bytree': 0.8071903038447372, 'reg_alpha': 1.1383772108291506e-08, 'reg_lambda': 1.6084700681887801e-06}. Best is trial 3 with value: 7.312670630789184.


Did not meet early stopping. Best iteration is:
[928]	valid_0's rmse: 19.2701
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000281 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds




Did not meet early stopping. Best iteration is:
[650]	valid_0's rmse: 13.645
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000381 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds


[I 2025-05-30 12:26:50,062] Trial 5 finished with value: 8.801613996896975 and parameters: {'num_leaves': 52, 'max_depth': 3, 'learning_rate': 0.03834065694765223, 'n_estimators': 662, 'subsample': 0.9467308505762196, 'colsample_bytree': 0.9869870528050996, 'reg_alpha': 0.0001793382230877243, 'reg_lambda': 3.542961870661167e-06}. Best is trial 3 with value: 7.312670630789184.


Did not meet early stopping. Best iteration is:
[657]	valid_0's rmse: 7.21922
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000539 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds
Early stopping, best iteration is:
[248]	valid_0's rmse: 5.54066
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000250 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Did not meet early stopping. Best iteration is:
[



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000382 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds
Early stopping, best iteration is:
[347]	valid_0's rmse: 6.09553




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000473 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds


[I 2025-05-30 12:26:51,298] Trial 6 finished with value: 6.931502808665581 and parameters: {'num_leaves': 113, 'max_depth': 9, 'learning_rate': 0.02288606580112655, 'n_estimators': 596, 'subsample': 0.970496517666358, 'colsample_bytree': 0.8876507367195468, 'reg_alpha': 3.748901743178493e-06, 'reg_lambda': 0.060425783547114705}. Best is trial 6 with value: 6.931502808665581.


Early stopping, best iteration is:
[272]	valid_0's rmse: 2.81831
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000243 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Did not meet early stopping. Best iteration is:
[259]	valid_0's rmse: 14.5712
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000315 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds




Did not meet early stopping. Best iteration is:
[259]	valid_0's rmse: 7.42728
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000421 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds






[I 2025-05-30 12:26:52,492] Trial 7 finished with value: 8.552784796018617 and parameters: {'num_leaves': 138, 'max_depth': 9, 'learning_rate': 0.014465816958087253, 'n_estimators': 259, 'subsample': 0.9793893856357903, 'colsample_bytree': 0.6331933222459999, 'reg_alpha': 3.810334958942528e-08, 'reg_lambda': 0.2184487612260492}. Best is trial 6 with value: 6.931502808665581.


Did not meet early stopping. Best iteration is:
[259]	valid_0's rmse: 3.65989
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000332 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Did not meet early stopping. Best iteration is:
[370]	valid_0's rmse: 11.7389
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000505 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds




Early stopping, best iteration is:
[229]	valid_0's rmse: 6.20686
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000682 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds






[I 2025-05-30 12:26:55,584] Trial 8 finished with value: 7.329036947810596 and parameters: {'num_leaves': 41, 'max_depth': 10, 'learning_rate': 0.047471698897291394, 'n_estimators': 381, 'subsample': 0.8716984426579222, 'colsample_bytree': 0.9604745701890152, 'reg_alpha': 0.00777057477305393, 'reg_lambda': 0.02610035456919774}. Best is trial 6 with value: 6.931502808665581.


Early stopping, best iteration is:
[109]	valid_0's rmse: 4.04133
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000355 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Did not meet early stopping. Best iteration is:
[812]	valid_0's rmse: 63.0297
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000469 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds




Did not meet early stopping. Best iteration is:
[812]	valid_0's rmse: 35.5861
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000646 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds






[I 2025-05-30 12:26:59,787] Trial 9 finished with value: 41.186350261576614 and parameters: {'num_leaves': 24, 'max_depth': 4, 'learning_rate': 0.0010789414781458698, 'n_estimators': 812, 'subsample': 0.6675184997829582, 'colsample_bytree': 0.821137715831215, 'reg_alpha': 0.0028516476371153736, 'reg_lambda': 4.8746924201954585}. Best is trial 6 with value: 6.931502808665581.


Did not meet early stopping. Best iteration is:
[812]	valid_0's rmse: 24.9432
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000330 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Early stopping, best iteration is:
[211]	valid_0's rmse: 11.5184
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000520 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds




Early stopping, best iteration is:
[109]	valid_0's rmse: 6.1476
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000654 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds






[I 2025-05-30 12:27:04,473] Trial 10 finished with value: 6.8008396901891315 and parameters: {'num_leaves': 82, 'max_depth': 14, 'learning_rate': 0.09910602393306885, 'n_estimators': 465, 'subsample': 0.7516818320305622, 'colsample_bytree': 0.8805528749195524, 'reg_alpha': 5.501944583225293, 'reg_lambda': 0.0014400848484712268}. Best is trial 10 with value: 6.8008396901891315.


Early stopping, best iteration is:
[230]	valid_0's rmse: 2.73651
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000513 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Early stopping, best iteration is:
[239]	valid_0's rmse: 11.4106




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000574 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds
Early stopping, best iteration is:
[178]	valid_0's rmse: 5.86998
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000774 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds






[I 2025-05-30 12:27:08,791] Trial 11 finished with value: 6.763822533057813 and parameters: {'num_leaves': 89, 'max_depth': 15, 'learning_rate': 0.093060960320009, 'n_estimators': 512, 'subsample': 0.7433427891259236, 'colsample_bytree': 0.8832386252428115, 'reg_alpha': 3.1146542452187793, 'reg_lambda': 0.0013450573280751573}. Best is trial 11 with value: 6.763822533057813.


Early stopping, best iteration is:
[64]	valid_0's rmse: 3.01093
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000534 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Early stopping, best iteration is:
[166]	valid_0's rmse: 11.4815
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000591 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds




Early stopping, best iteration is:
[219]	valid_0's rmse: 5.90925
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000986 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds






[I 2025-05-30 12:27:12,911] Trial 12 finished with value: 6.820234529561472 and parameters: {'num_leaves': 81, 'max_depth': 15, 'learning_rate': 0.09447839772944991, 'n_estimators': 480, 'subsample': 0.7313207320089976, 'colsample_bytree': 0.8813357994252418, 'reg_alpha': 5.355445712249637, 'reg_lambda': 0.000527204441999419}. Best is trial 11 with value: 6.763822533057813.


Early stopping, best iteration is:
[67]	valid_0's rmse: 3.06999
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000387 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Early stopping, best iteration is:
[207]	valid_0's rmse: 11.9281




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000485 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds
Early stopping, best iteration is:
[250]	valid_0's rmse: 5.67041
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000884 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds






[I 2025-05-30 12:27:17,413] Trial 13 finished with value: 6.860497015490726 and parameters: {'num_leaves': 91, 'max_depth': 13, 'learning_rate': 0.09984422604761081, 'n_estimators': 407, 'subsample': 0.6128893376694848, 'colsample_bytree': 0.7277673304682762, 'reg_alpha': 7.278864294014847, 'reg_lambda': 5.008348916801774e-05}. Best is trial 11 with value: 6.763822533057813.


Early stopping, best iteration is:
[62]	valid_0's rmse: 2.98293
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000486 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Did not meet early stopping. Best iteration is:
[520]	valid_0's rmse: 15.2794
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000608 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds




Did not meet early stopping. Best iteration is:
[520]	valid_0's rmse: 7.80124
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000674 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds


[I 2025-05-30 12:27:29,617] Trial 14 finished with value: 9.225703120813503 and parameters: {'num_leaves': 67, 'max_depth': 12, 'learning_rate': 0.007476663172061002, 'n_estimators': 520, 'subsample': 0.7649428584308113, 'colsample_bytree': 0.8998189342371525, 'reg_alpha': 0.37022495651005644, 'reg_lambda': 0.010249577803759857}. Best is trial 11 with value: 6.763822533057813.


Did not meet early stopping. Best iteration is:
[520]	valid_0's rmse: 4.59646
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000571 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Did not meet early stopping. Best iteration is:
[335]	valid_0's rmse: 11.5771




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000311 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds
Early stopping, best iteration is:
[177]	valid_0's rmse: 5.73781
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000423 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds


[I 2025-05-30 12:27:31,134] Trial 15 finished with value: 6.7199948470877615 and parameters: {'num_leaves': 96, 'max_depth': 15, 'learning_rate': 0.05003872255264645, 'n_estimators': 337, 'subsample': 0.7015067326914649, 'colsample_bytree': 0.8407160177782262, 'reg_alpha': 0.2287691533608913, 'reg_lambda': 6.434171596026327e-05}. Best is trial 15 with value: 6.7199948470877615.


Early stopping, best iteration is:
[121]	valid_0's rmse: 2.84511
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000272 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Did not meet early stopping. Best iteration is:
[333]	valid_0's rmse: 11.4203




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000368 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds
Early stopping, best iteration is:
[230]	valid_0's rmse: 5.72283
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000409 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds


[I 2025-05-30 12:27:32,042] Trial 16 finished with value: 6.684901249540459 and parameters: {'num_leaves': 98, 'max_depth': 15, 'learning_rate': 0.052546534466147356, 'n_estimators': 353, 'subsample': 0.6784126910294298, 'colsample_bytree': 0.7519597475226781, 'reg_alpha': 0.2514076975746861, 'reg_lambda': 3.877819451884712e-05}. Best is trial 16 with value: 6.684901249540459.


Early stopping, best iteration is:
[120]	valid_0's rmse: 2.91155
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000239 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Did not meet early stopping. Best iteration is:
[117]	valid_0's rmse: 12.8018
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000287 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds
Did not meet early stopping. Best iteration is:
[

[I 2025-05-30 12:27:32,576] Trial 17 finished with value: 7.270527841835 and parameters: {'num_leaves': 103, 'max_depth': 12, 'learning_rate': 0.047684099113942564, 'n_estimators': 117, 'subsample': 0.6797000433871047, 'colsample_bytree': 0.7541907372433334, 'reg_alpha': 0.04881891863462018, 'reg_lambda': 3.202358759972291e-05}. Best is trial 16 with value: 6.684901249540459.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000421 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds
Did not meet early stopping. Best iteration is:
[117]	valid_0's rmse: 2.98727
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000266 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Did not meet early stopping. Best iteration is:
[316]	valid_0's rmse: 15.4856
[LightGBM] [Info] Auto-choosing col-



Did not meet early stopping. Best iteration is:
[316]	valid_0's rmse: 8.03835
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000486 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds


[I 2025-05-30 12:27:34,307] Trial 18 finished with value: 9.36991810307778 and parameters: {'num_leaves': 127, 'max_depth': 13, 'learning_rate': 0.010588548497043007, 'n_estimators': 316, 'subsample': 0.6467288136056719, 'colsample_bytree': 0.7566681010231738, 'reg_alpha': 0.2950444152734245, 'reg_lambda': 7.491604084499718e-08}. Best is trial 16 with value: 6.684901249540459.


Did not meet early stopping. Best iteration is:
[316]	valid_0's rmse: 4.58581
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000227 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Did not meet early stopping. Best iteration is:
[286]	valid_0's rmse: 11.4037
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000304 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds


[I 2025-05-30 12:27:34,837] Trial 19 finished with value: 6.83578941557128 and parameters: {'num_leaves': 147, 'max_depth': 7, 'learning_rate': 0.06315717648692007, 'n_estimators': 314, 'subsample': 0.7000566051824085, 'colsample_bytree': 0.8410388508538222, 'reg_alpha': 0.40450197630903373, 'reg_lambda': 3.5196307834119455e-05}. Best is trial 16 with value: 6.684901249540459.


Did not meet early stopping. Best iteration is:
[277]	valid_0's rmse: 6.05158
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000498 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds
Early stopping, best iteration is:
[93]	valid_0's rmse: 3.05207
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000256 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Did not meet early stopping. Best iteration is:
[3



Did not meet early stopping. Best iteration is:
[374]	valid_0's rmse: 12.8707
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000410 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds


[I 2025-05-30 12:27:36,524] Trial 20 finished with value: 15.011310903572884 and parameters: {'num_leaves': 99, 'max_depth': 11, 'learning_rate': 0.006063752900931478, 'n_estimators': 374, 'subsample': 0.8011731598780854, 'colsample_bytree': 0.7041326878304884, 'reg_alpha': 0.017494869763096218, 'reg_lambda': 5.717375074576184e-06}. Best is trial 16 with value: 6.684901249540459.


Did not meet early stopping. Best iteration is:
[374]	valid_0's rmse: 8.34093
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000275 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Early stopping, best iteration is:
[343]	valid_0's rmse: 11.0651
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000301 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds




Early stopping, best iteration is:
[168]	valid_0's rmse: 5.92534
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000461 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds






[I 2025-05-30 12:27:37,564] Trial 21 finished with value: 6.5306567008784215 and parameters: {'num_leaves': 69, 'max_depth': 15, 'learning_rate': 0.061470173889324055, 'n_estimators': 602, 'subsample': 0.710796918776192, 'colsample_bytree': 0.9376747498717732, 'reg_alpha': 0.45165042423539836, 'reg_lambda': 0.00018406997413870804}. Best is trial 21 with value: 6.5306567008784215.


Early stopping, best iteration is:
[377]	valid_0's rmse: 2.60151
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000306 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Early stopping, best iteration is:
[368]	valid_0's rmse: 11.2607
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000464 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds




Early stopping, best iteration is:
[289]	valid_0's rmse: 5.99083




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000457 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds


[I 2025-05-30 12:27:38,608] Trial 22 finished with value: 6.889585545451644 and parameters: {'num_leaves': 69, 'max_depth': 15, 'learning_rate': 0.03324038425406622, 'n_estimators': 681, 'subsample': 0.6047550529774617, 'colsample_bytree': 0.9377084903337818, 'reg_alpha': 0.8416123327210978, 'reg_lambda': 6.907834758254953e-05}. Best is trial 21 with value: 6.5306567008784215.


Early stopping, best iteration is:
[169]	valid_0's rmse: 3.41719
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000318 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Did not meet early stopping. Best iteration is:
[115]	valid_0's rmse: 12.5239




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000326 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds
Did not meet early stopping. Best iteration is:
[114]	valid_0's rmse: 6.21453
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000433 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds


[I 2025-05-30 12:27:39,039] Trial 23 finished with value: 7.317697364643581 and parameters: {'num_leaves': 68, 'max_depth': 14, 'learning_rate': 0.05499031546089735, 'n_estimators': 115, 'subsample': 0.7080630911742561, 'colsample_bytree': 0.769721668518928, 'reg_alpha': 0.0014453923598202498, 'reg_lambda': 0.0001007384836581504}. Best is trial 21 with value: 6.5306567008784215.


Did not meet early stopping. Best iteration is:
[114]	valid_0's rmse: 3.21466
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000230 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Did not meet early stopping. Best iteration is:
[585]	valid_0's rmse: 11.9457
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000304 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds




Did not meet early stopping. Best iteration is:
[577]	valid_0's rmse: 5.84317
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000493 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds


[I 2025-05-30 12:27:40,806] Trial 24 finished with value: 6.873167974249212 and parameters: {'num_leaves': 96, 'max_depth': 13, 'learning_rate': 0.018693327146156364, 'n_estimators': 586, 'subsample': 0.6425490174498426, 'colsample_bytree': 0.8422052527110033, 'reg_alpha': 0.03923690291751442, 'reg_lambda': 2.935509405020229e-07}. Best is trial 21 with value: 6.5306567008784215.


Early stopping, best iteration is:
[344]	valid_0's rmse: 2.83064
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000280 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Did not meet early stopping. Best iteration is:
[411]	valid_0's rmse: 11.5577




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000414 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds
Did not meet early stopping. Best iteration is:
[386]	valid_0's rmse: 5.72805




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000473 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds


[I 2025-05-30 12:27:42,269] Trial 25 finished with value: 6.6935636128763605 and parameters: {'num_leaves': 120, 'max_depth': 15, 'learning_rate': 0.029502143071608644, 'n_estimators': 417, 'subsample': 0.7927808915532576, 'colsample_bytree': 0.9277411709202209, 'reg_alpha': 0.11375510539860594, 'reg_lambda': 1.1513961068048012e-05}. Best is trial 21 with value: 6.5306567008784215.


Early stopping, best iteration is:
[211]	valid_0's rmse: 2.79491
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000395 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Did not meet early stopping. Best iteration is:
[432]	valid_0's rmse: 10.9848




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000370 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds
Early stopping, best iteration is:
[181]	valid_0's rmse: 5.72421
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000635 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds


[I 2025-05-30 12:27:43,119] Trial 26 finished with value: 6.525691232054896 and parameters: {'num_leaves': 121, 'max_depth': 12, 'learning_rate': 0.06759583453576361, 'n_estimators': 437, 'subsample': 0.7861392057142206, 'colsample_bytree': 0.9325626481664575, 'reg_alpha': 1.2230768448462095, 'reg_lambda': 0.007263607648264275}. Best is trial 26 with value: 6.525691232054896.


Early stopping, best iteration is:
[89]	valid_0's rmse: 2.8681
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000261 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Early stopping, best iteration is:
[335]	valid_0's rmse: 11.5085




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000321 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds
Early stopping, best iteration is:
[139]	valid_0's rmse: 5.8519
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000720 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds


[I 2025-05-30 12:27:43,914] Trial 27 finished with value: 6.754969421056817 and parameters: {'num_leaves': 123, 'max_depth': 12, 'learning_rate': 0.059659570065257704, 'n_estimators': 633, 'subsample': 0.7997685399550791, 'colsample_bytree': 0.9250613653226901, 'reg_alpha': 1.6368793178056449, 'reg_lambda': 0.009990337363037817}. Best is trial 26 with value: 6.525691232054896.


Early stopping, best iteration is:
[98]	valid_0's rmse: 2.90453
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000247 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Early stopping, best iteration is:
[327]	valid_0's rmse: 11.2908
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000368 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds




Early stopping, best iteration is:
[133]	valid_0's rmse: 6.27099
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000514 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds
Early stopping, best iteration is:
[82]	valid_0's rmse: 3.624


[I 2025-05-30 12:27:44,514] Trial 28 finished with value: 7.06192532444226 and parameters: {'num_leaves': 60, 'max_depth': 11, 'learning_rate': 0.06988415300367372, 'n_estimators': 999, 'subsample': 0.7241524981741747, 'colsample_bytree': 0.9562347380236931, 'reg_alpha': 0.0005228751575010237, 'reg_lambda': 0.0041481729017549766}. Best is trial 26 with value: 6.525691232054896.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000320 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Did not meet early stopping. Best iteration is:
[223]	valid_0's rmse: 18.0129
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000463 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds




Did not meet early stopping. Best iteration is:
[223]	valid_0's rmse: 9.41266
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000478 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds


[I 2025-05-30 12:27:45,629] Trial 29 finished with value: 11.047766733744337 and parameters: {'num_leaves': 109, 'max_depth': 13, 'learning_rate': 0.013319184195676683, 'n_estimators': 223, 'subsample': 0.6594992684179961, 'colsample_bytree': 0.6802116465100432, 'reg_alpha': 2.9303199056741685e-05, 'reg_lambda': 0.2563406328444075}. Best is trial 26 with value: 6.525691232054896.


Did not meet early stopping. Best iteration is:
[223]	valid_0's rmse: 5.71774
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000346 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Did not meet early stopping. Best iteration is:
[263]	valid_0's rmse: 56.863
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000310 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds




Did not meet early stopping. Best iteration is:
[263]	valid_0's rmse: 33.0699
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000517 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds


[I 2025-05-30 12:27:47,262] Trial 30 finished with value: 37.76117262033154 and parameters: {'num_leaves': 136, 'max_depth': 14, 'learning_rate': 0.003291362410044067, 'n_estimators': 263, 'subsample': 0.8247540259086401, 'colsample_bytree': 0.7855135034442529, 'reg_alpha': 0.016056359035223577, 'reg_lambda': 0.0003490523053249062}. Best is trial 26 with value: 6.525691232054896.


Did not meet early stopping. Best iteration is:
[263]	valid_0's rmse: 23.3506
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000257 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Did not meet early stopping. Best iteration is:
[447]	valid_0's rmse: 11.3447
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000305 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds




Early stopping, best iteration is:
[256]	valid_0's rmse: 5.71281
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000486 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds


[I 2025-05-30 12:27:48,503] Trial 31 finished with value: 6.618527550283381 and parameters: {'num_leaves': 117, 'max_depth': 15, 'learning_rate': 0.037498649228288945, 'n_estimators': 453, 'subsample': 0.7945793589113805, 'colsample_bytree': 0.915614319937519, 'reg_alpha': 0.0727273939240413, 'reg_lambda': 6.9809209681895365e-06}. Best is trial 26 with value: 6.525691232054896.


Early stopping, best iteration is:
[172]	valid_0's rmse: 2.79811
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000285 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Did not meet early stopping. Best iteration is:
[435]	valid_0's rmse: 11.3026
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000384 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds




Early stopping, best iteration is:
[239]	valid_0's rmse: 5.78685




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000470 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds


[I 2025-05-30 12:27:49,692] Trial 32 finished with value: 6.65872599798237 and parameters: {'num_leaves': 117, 'max_depth': 14, 'learning_rate': 0.03807654319156044, 'n_estimators': 436, 'subsample': 0.7740945892855403, 'colsample_bytree': 0.9148896815701894, 'reg_alpha': 0.9954805950566166, 'reg_lambda': 0.0002158881550158855}. Best is trial 26 with value: 6.525691232054896.


Early stopping, best iteration is:
[158]	valid_0's rmse: 2.88675
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000254 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Did not meet early stopping. Best iteration is:
[454]	valid_0's rmse: 11.3498
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000372 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds




Did not meet early stopping. Best iteration is:
[446]	valid_0's rmse: 5.82223
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000174 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds


[I 2025-05-30 12:27:51,182] Trial 33 finished with value: 6.638391708606869 and parameters: {'num_leaves': 118, 'max_depth': 14, 'learning_rate': 0.036715176638306375, 'n_estimators': 456, 'subsample': 0.7748038489717731, 'colsample_bytree': 0.9984204597548869, 'reg_alpha': 2.763051342979529, 'reg_lambda': 0.00023173041118769937}. Best is trial 26 with value: 6.525691232054896.


Early stopping, best iteration is:
[191]	valid_0's rmse: 2.74319
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000307 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Did not meet early stopping. Best iteration is:
[538]	valid_0's rmse: 11.4154
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000316 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds




Early stopping, best iteration is:
[446]	valid_0's rmse: 5.70708
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000479 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds


[I 2025-05-30 12:27:53,078] Trial 34 finished with value: 6.604396347043122 and parameters: {'num_leaves': 141, 'max_depth': 14, 'learning_rate': 0.023842804494135707, 'n_estimators': 570, 'subsample': 0.8294641311736256, 'colsample_bytree': 0.9992413266583288, 'reg_alpha': 1.3380352520009962, 'reg_lambda': 6.78384606120031e-07}. Best is trial 26 with value: 6.525691232054896.


Early stopping, best iteration is:
[254]	valid_0's rmse: 2.69073
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000253 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Did not meet early stopping. Best iteration is:
[556]	valid_0's rmse: 11.6941




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000349 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds
Early stopping, best iteration is:
[397]	valid_0's rmse: 5.74114
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000463 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds




Early stopping, best iteration is:
[256]	valid_0's rmse: 2.72756


[I 2025-05-30 12:27:55,015] Trial 35 finished with value: 6.720950535813891 and parameters: {'num_leaves': 148, 'max_depth': 13, 'learning_rate': 0.022412457793239395, 'n_estimators': 556, 'subsample': 0.8370658142509787, 'colsample_bytree': 0.9660705015216718, 'reg_alpha': 0.06517508322593776, 'reg_lambda': 4.60270484728343e-07}. Best is trial 26 with value: 6.525691232054896.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000313 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Early stopping, best iteration is:
[458]	valid_0's rmse: 11.8459
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000400 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds




Did not meet early stopping. Best iteration is:
[679]	valid_0's rmse: 5.86197




[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000187 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds


[I 2025-05-30 12:27:57,558] Trial 36 finished with value: 6.812285207024984 and parameters: {'num_leaves': 137, 'max_depth': 12, 'learning_rate': 0.01703392542580652, 'n_estimators': 704, 'subsample': 0.906707815484432, 'colsample_bytree': 0.9447771659100639, 'reg_alpha': 0.9968951058571971, 'reg_lambda': 1.3077538779233563e-08}. Best is trial 26 with value: 6.525691232054896.


Early stopping, best iteration is:
[364]	valid_0's rmse: 2.72894
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000285 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Early stopping, best iteration is:
[352]	valid_0's rmse: 11.1388
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000432 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds




Early stopping, best iteration is:
[125]	valid_0's rmse: 5.69989
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000688 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds


[I 2025-05-30 12:27:58,446] Trial 37 finished with value: 6.5692773335768875 and parameters: {'num_leaves': 128, 'max_depth': 14, 'learning_rate': 0.07214600295650511, 'n_estimators': 812, 'subsample': 0.8210891217347276, 'colsample_bytree': 0.9826532084416363, 'reg_alpha': 9.770386512072635e-07, 'reg_lambda': 1.4807179515327287e-06}. Best is trial 26 with value: 6.525691232054896.


Early stopping, best iteration is:
[85]	valid_0's rmse: 2.86916
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000298 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Early stopping, best iteration is:
[380]	valid_0's rmse: 11.0981




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000343 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds
Early stopping, best iteration is:
[134]	valid_0's rmse: 5.86596


[I 2025-05-30 12:27:59,183] Trial 38 finished with value: 6.569896506913428 and parameters: {'num_leaves': 128, 'max_depth': 10, 'learning_rate': 0.08012980747769322, 'n_estimators': 854, 'subsample': 0.8967164302214947, 'colsample_bytree': 0.9803740988579297, 'reg_alpha': 8.605760410874156e-07, 'reg_lambda': 1.6754880719069437e-06}. Best is trial 26 with value: 6.525691232054896.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000616 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds
Early stopping, best iteration is:
[71]	valid_0's rmse: 2.74565
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000411 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Early stopping, best iteration is:
[391]	valid_0's rmse: 11.0854
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the o



Early stopping, best iteration is:
[283]	valid_0's rmse: 5.87122


[I 2025-05-30 12:28:00,082] Trial 39 finished with value: 6.543244777011494 and parameters: {'num_leaves': 130, 'max_depth': 10, 'learning_rate': 0.0737738515334203, 'n_estimators': 825, 'subsample': 0.9247827974579985, 'colsample_bytree': 0.9796023139062187, 'reg_alpha': 9.189038440728754e-07, 'reg_lambda': 8.60884484791256e-08}. Best is trial 26 with value: 6.525691232054896.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000481 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds
Early stopping, best iteration is:
[83]	valid_0's rmse: 2.67314
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000356 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Early stopping, best iteration is:
[406]	valid_0's rmse: 11.8044
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the o



Early stopping, best iteration is:
[542]	valid_0's rmse: 5.83398
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000673 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds


[I 2025-05-30 12:28:00,949] Trial 40 finished with value: 6.875350089045649 and parameters: {'num_leaves': 110, 'max_depth': 8, 'learning_rate': 0.07222509909499499, 'n_estimators': 884, 'subsample': 0.9475135488291649, 'colsample_bytree': 0.9771675959269472, 'reg_alpha': 2.8171559173344515e-07, 'reg_lambda': 7.197940686089242e-08}. Best is trial 26 with value: 6.525691232054896.


Early stopping, best iteration is:
[77]	valid_0's rmse: 2.98763
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000312 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Early stopping, best iteration is:
[386]	valid_0's rmse: 10.9515
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000409 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds




Early stopping, best iteration is:
[127]	valid_0's rmse: 5.87851
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000185 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds


[I 2025-05-30 12:28:01,714] Trial 41 finished with value: 6.518257139179563 and parameters: {'num_leaves': 130, 'max_depth': 10, 'learning_rate': 0.0804244285375761, 'n_estimators': 823, 'subsample': 0.9191352930911614, 'colsample_bytree': 0.9648408938282216, 'reg_alpha': 9.91685428573453e-07, 'reg_lambda': 1.717478696941733e-06}. Best is trial 41 with value: 6.518257139179563.


Early stopping, best iteration is:
[82]	valid_0's rmse: 2.7248
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000317 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Did not meet early stopping. Best iteration is:
[765]	valid_0's rmse: 35.0404
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000469 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds




Did not meet early stopping. Best iteration is:
[765]	valid_0's rmse: 20.0623
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000484 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds


[I 2025-05-30 12:28:06,402] Trial 42 finished with value: 22.95441133609465 and parameters: {'num_leaves': 129, 'max_depth': 10, 'learning_rate': 0.0019326575321908493, 'n_estimators': 765, 'subsample': 0.9178851842888274, 'colsample_bytree': 0.9510050339974127, 'reg_alpha': 1.2343037170543235e-05, 'reg_lambda': 1.0468997697744974e-07}. Best is trial 41 with value: 6.518257139179563.


Did not meet early stopping. Best iteration is:
[765]	valid_0's rmse: 13.7606
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000350 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Early stopping, best iteration is:
[275]	valid_0's rmse: 11.0696
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000396 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds




Early stopping, best iteration is:
[113]	valid_0's rmse: 5.87691
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000460 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds


[I 2025-05-30 12:28:07,024] Trial 43 finished with value: 6.5483212595272375 and parameters: {'num_leaves': 132, 'max_depth': 9, 'learning_rate': 0.0690557454758165, 'n_estimators': 951, 'subsample': 0.9990610701757812, 'colsample_bytree': 0.965200860860459, 'reg_alpha': 3.1621603905720944e-07, 'reg_lambda': 1.5994584612492646e-08}. Best is trial 41 with value: 6.518257139179563.


Early stopping, best iteration is:
[81]	valid_0's rmse: 2.69849
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000357 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds




Early stopping, best iteration is:
[235]	valid_0's rmse: 11.5455
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000342 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds




Early stopping, best iteration is:
[183]	valid_0's rmse: 6.19106
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000551 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds


[I 2025-05-30 12:28:07,591] Trial 44 finished with value: 7.073654729958181 and parameters: {'num_leaves': 46, 'max_depth': 8, 'learning_rate': 0.07954379457376676, 'n_estimators': 971, 'subsample': 0.8577965250791914, 'colsample_bytree': 0.8640829172125556, 'reg_alpha': 5.217210990238481e-08, 'reg_lambda': 1.1837966117654667e-08}. Best is trial 41 with value: 6.518257139179563.


Early stopping, best iteration is:
[133]	valid_0's rmse: 3.48441
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000319 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Early stopping, best iteration is:
[393]	valid_0's rmse: 11.4208




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000396 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds
Early stopping, best iteration is:
[160]	valid_0's rmse: 6.04353
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000961 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds


[I 2025-05-30 12:28:08,541] Trial 45 finished with value: 6.715793832175159 and parameters: {'num_leaves': 145, 'max_depth': 9, 'learning_rate': 0.042563970712285584, 'n_estimators': 924, 'subsample': 0.9971565120749547, 'colsample_bytree': 0.9043246939100541, 'reg_alpha': 5.618254324759246e-05, 'reg_lambda': 4.632538624799466e-08}. Best is trial 41 with value: 6.518257139179563.


Early stopping, best iteration is:
[134]	valid_0's rmse: 2.68304
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000306 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Did not meet early stopping. Best iteration is:
[725]	valid_0's rmse: 11.2201
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000462 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds




Early stopping, best iteration is:
[216]	valid_0's rmse: 6.03375
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000578 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds




Early stopping, best iteration is:
[209]	valid_0's rmse: 2.70072


[I 2025-05-30 12:28:09,873] Trial 46 finished with value: 6.651534159271841 and parameters: {'num_leaves': 133, 'max_depth': 9, 'learning_rate': 0.0275190838928977, 'n_estimators': 738, 'subsample': 0.9313466930137847, 'colsample_bytree': 0.9655188167673776, 'reg_alpha': 1.3502982662585628e-07, 'reg_lambda': 2.429500713823747e-07}. Best is trial 41 with value: 6.518257139179563.


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000365 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Early stopping, best iteration is:
[328]	valid_0's rmse: 11.456
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000556 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds




Early stopping, best iteration is:
[430]	valid_0's rmse: 5.96697
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000503 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds


[I 2025-05-30 12:28:10,640] Trial 47 finished with value: 6.8903796152373085 and parameters: {'num_leaves': 140, 'max_depth': 7, 'learning_rate': 0.062400799307377935, 'n_estimators': 920, 'subsample': 0.9657181833034952, 'colsample_bytree': 0.9427530264131514, 'reg_alpha': 3.13645642504543e-06, 'reg_lambda': 2.4799030180659712e-08}. Best is trial 41 with value: 6.518257139179563.


Early stopping, best iteration is:
[92]	valid_0's rmse: 3.24813
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000318 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Early stopping, best iteration is:
[326]	valid_0's rmse: 11.4433




[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000345 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds


[I 2025-05-30 12:28:11,355] Trial 48 finished with value: 6.923155652307055 and parameters: {'num_leaves': 74, 'max_depth': 10, 'learning_rate': 0.08102847453944902, 'n_estimators': 815, 'subsample': 0.9891134300837775, 'colsample_bytree': 0.9669611840497322, 'reg_alpha': 1.0137640264307836e-08, 'reg_lambda': 0.10847931138711994}. Best is trial 41 with value: 6.518257139179563.


Early stopping, best iteration is:
[223]	valid_0's rmse: 6.06553
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000566 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds
Early stopping, best iteration is:
[72]	valid_0's rmse: 3.26061
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000275 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1942
[LightGBM] [Info] Number of data points in the train set: 7882, number of used features: 16
[LightGBM] [Info] Start training from score 134.240064
Training until validation scores don't improve for 50 rounds
Early stopping, best iteration is:
[388]	valid_0's rmse: 11.948



[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000405 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 1978
[LightGBM] [Info] Number of data points in the train set: 15762, number of used features: 16
[LightGBM] [Info] Start training from score 75.331341
Training until validation scores don't improve for 50 rounds


[I 2025-05-30 12:28:11,972] Trial 49 finished with value: 7.496030586026488 and parameters: {'num_leaves': 37, 'max_depth': 5, 'learning_rate': 0.04485811502729954, 'n_estimators': 634, 'subsample': 0.8759515711439879, 'colsample_bytree': 0.8656833410912196, 'reg_alpha': 2.0419205412424155e-06, 'reg_lambda': 1.7657669987870907e-07}. Best is trial 41 with value: 6.518257139179563.


Early stopping, best iteration is:
[552]	valid_0's rmse: 6.35989
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000770 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2028
[LightGBM] [Info] Number of data points in the train set: 23642, number of used features: 16
[LightGBM] [Info] Start training from score 52.155359
Training until validation scores don't improve for 50 rounds
Early stopping, best iteration is:
[177]	valid_0's rmse: 4.17988
‚úÖ Mejores par√°metros: {'num_leaves': 130, 'max_depth': 10, 'learning_rate': 0.0804244285375761, 'n_estimators': 823, 'subsample': 0.9191352930911614, 'colsample_bytree': 0.9648408938282216, 'reg_alpha': 9.91685428573453e-07, 'reg_lambda': 1.717478696941733e-06}
[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000697 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 2072
[Ligh

In [21]:
print("Mejores par√°metros encontrados:", study.best_params)

Mejores par√°metros encontrados: {'num_leaves': 144, 'max_depth': 15, 'learning_rate': 0.07766119322368795, 'n_estimators': 728, 'subsample': 0.6188111024172903, 'colsample_bytree': 0.998780906695816, 'reg_alpha': 0.0029833791412988433, 'reg_lambda': 5.520787178879811e-07}


In [27]:
# üèÅ Entrenamiento final con los mejores hiperpar√°metros
final_model = lgb.LGBMRegressor(**study.best_params)
final_model.fit(X, y)
print("‚úÖ Modelo final entrenado.")

# üìÖ Preparar conjunto de prueba
X_test = test_data.drop(columns=['periodo_dt','tn_target','tn'], errors='ignore')

# Codificar columnas categ√≥ricas igual que en entrenamiento
cols_categoricas_test = X_test.select_dtypes(include=['object', 'category']).columns.tolist()
print(f"Columnas categ√≥ricas en test: {cols_categoricas_test}")

for col in cols_categoricas_test:
    X_test[col] = X_test[col].astype('category').cat.codes

# Convertir a float32 para consistencia
X_test = X_test.astype(np.float32)

# Filtrar solo productos a predecir
productos_a_predecir = pd.read_csv("datasets/product_id_apredecir201912.csv")
X_test = X_test[X_test['product_id'].isin(productos_a_predecir['product_id'])]

# Verificar que no est√© vac√≠o
if X_test.empty:
    print("‚ùå X_test est√° vac√≠o despu√©s del filtrado. Revisa los datos.")
else:
    # üîÆ Hacer predicciones
    preds = final_model.predict(X_test)

    # üìù Crear DataFrame con resultados
    result = pd.DataFrame({
        "product_id": X_test["product_id"].values,
        "tn": preds
    })

    # üíæ Guardar en CSV
    result.to_csv("./kaggle/optimized_lgb.csv", index=False)
    print("‚úÖ Predicciones guardadas en ./kaggle/optimized_lgb.csv")


[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000213 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 2072
[LightGBM] [Info] Number of data points in the train set: 31522, number of used features: 16
[LightGBM] [Info] Start training from score 39.421567
‚úÖ Modelo final entrenado.
Columnas categ√≥ricas en test: ['cat1', 'cat2', 'cat3', 'brand']
‚úÖ Predicciones guardadas en ./kaggle/optimized_lgb.csv


In [28]:
result['product_id'] = result['product_id'].astype(int)
result.to_csv("./kaggle/optimized_lgb.csv", index=False)
result

Unnamed: 0,product_id,tn
0,20001,21.206227
1,20002,22.163006
2,20003,12.595877
3,20004,22.879437
4,20005,-5.844806
...,...,...
775,21263,-0.141418
776,21265,-0.044921
777,21266,-0.044921
778,21267,-0.045546
