In [20]:
import matplotlib.pyplot as plt
import pandas as pd
import numpy as np

In [21]:
import xgboost as xgb
import lightgbm as gbm
from sklearn.ensemble import RandomForestClassifier, AdaBoostClassifier
from sklearn.linear_model import LogisticRegression

In [22]:
from sklearn.model_selection import train_test_split, cross_val_score, cross_validate, StratifiedKFold, GridSearchCV
from sklearn.metrics import f1_score, classification_report, confusion_matrix, make_scorer

from functools import partial

In [23]:
train = pd.read_parquet('../data/processed/train.parquet')
test = pd.read_parquet('../data/processed/test.parquet')

In [24]:
metric = partial(f1_score, average='macro')
score = make_scorer(f1_score, average='macro')

In [26]:
from imblearn.over_sampling import SMOTE
resampler = SMOTE(random_state=0, k_neighbors=3)
X, y = train.loc[:, ~train.columns.isin(['revenue', "id"])], train.revenue

In [27]:
X_train, X_test, y_train, y_test = train_test_split(X,y, stratify=y, test_size=0.2, random_state=42)
X_train, X_val, y_train, y_val = train_test_split(X_train, y_train, stratify=y_train, test_size=0.2, random_state=42)

In [28]:
import lightgbm as lgb
import numpy as np
import sklearn.datasets
import sklearn.metrics
from sklearn.model_selection import train_test_split

import optuna

In [29]:
# FYI: Objective functions can take additional arguments
# (https://optuna.readthedocs.io/en/stable/faq.html#objective-func-additional-args).
def objective(trial):
    data, target = sklearn.datasets.load_breast_cancer(return_X_y=True)
    train_x, valid_x, train_y, valid_y = train_test_split(data, target, test_size=0.25)
    dtrain = lgb.Dataset(train_x, label=train_y)

    param = {
        "objective": "binary",
        "metric": "binary_logloss",
        "verbosity": -1,
        "boosting_type": "gbdt",
        "lambda_l1": trial.suggest_float("lambda_l1", 1e-8, 10.0, log=True),
        "lambda_l2": trial.suggest_float("lambda_l2", 1e-8, 10.0, log=True),
        "num_leaves": trial.suggest_int("num_leaves", 2, 256),
        "feature_fraction": trial.suggest_float("feature_fraction", 0.4, 1.0),
        "bagging_fraction": trial.suggest_float("bagging_fraction", 0.4, 1.0),
        "bagging_freq": trial.suggest_int("bagging_freq", 1, 7),
        "min_child_samples": trial.suggest_int("min_child_samples", 5, 100),
    }

    gbm = lgb.train(param, dtrain)
    preds = gbm.predict(valid_x)
    pred_labels = np.rint(preds)
    accuracy = sklearn.metrics.accuracy_score(valid_y, pred_labels)
    return accuracy

In [30]:
def objective_challenge(trial):

    param = {
        "n_estimators":trial.suggest_int("n_estimators", 300, 500, step=50),
        "objective": "binary",
        "random_state": 42,
        "verbosity": 0,
        "boosting_type": "goss",
        "lambda_l1": trial.suggest_float("lambda_l1", 1e-8, 10.0, log=True),
        "lambda_l2": trial.suggest_float("lambda_l2", 1e-8, 10.0, log=True),
        "max_depth": trial.suggest_int("max_depth", 8,25, step=3),
        "num_leaves": trial.suggest_int("num_leaves", 2, 256),
    }

    fit_params = {
        "eval_set":[(X_train, y_train), (X_val, y_val)], 
        "early_stopping_rounds":15,
        "eval_metric":[lambda y_true, y_pred: ("F1_MACRO", metric(y_true, np.round(y_pred)), True)],
        "feature_name":X_train.columns.tolist(),
        "categorical_feature":["Month", "TrafficType", "Browser", "SpecialDay", "OperatingSystems", "Region", "VisitorType", "Weekend"]
    }
    
    gbm = lgb.LGBMClassifier(**param, verbose=0)
    
    # In a better scenario, I might use this code.
#     f1_cross = cross_val_score(
#         gbm, X_train, y_train, 
#         cv=StratifiedKFold(3), 
#         scoring=score,
#         fit_params=fit_params
#     )
#     return np.mean(f1_cross)

    gbm.fit(X_train, y_train, **fit_params)
    
    return metric(y_val, gbm.predict(X_val))

In [31]:
study = optuna.create_study(direction="maximize")
study.optimize(objective_challenge, n_trials=120)

print("Number of finished trials: {}".format(len(study.trials)))

print("Best trial:")
trial = study.best_trial

print("  Value: {}".format(trial.value))

print("  Params: ")
for key, value in trial.params.items():
    print("    {}: {}".format(key, value))

[I 2021-03-08 12:34:46,634] A new study created in memory with name: no-name-ddd80cbb-9996-462e-960a-7b9a835b56be
  low=low, old_high=old_high, high=high, step=step
New categorical_feature is ['Browser', 'Month', 'OperatingSystems', 'Region', 'SpecialDay', 'TrafficType', 'VisitorType', 'Weekend']
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.




[1]	training's binary_logloss: 0.37714	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386198	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341294	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357678	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314111	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336961	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292058	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320339	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.27341	training's F1_MACRO: 0.597253	valid_1's binary_logloss: 0.305812	valid_1's F1_MACRO: 0.559225
[6]	training's binary_logloss: 0.256625	training's F1_MACRO: 0.698571	valid_1's binary_logloss: 0.29468	valid_1's F1_MACRO: 0.646087
[7]	training's binary_logloss: 0.24193	training's F1_MACRO: 0.7534	valid_1's binary_logloss: 0.284935	valid_1's F1_MACRO: 0.688834
[8]	tra

[I 2021-03-08 12:34:50,922] Trial 0 finished with value: 0.807009447544516 and parameters: {'n_estimators': 300, 'lambda_l1': 6.133071198921238e-07, 'lambda_l2': 9.151875734603427e-07, 'max_depth': 20, 'num_leaves': 213}. Best is trial 0 with value: 0.807009447544516.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377866	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386276	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.342421	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.358297	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314817	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.337505	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292509	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.321316	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.274007	training's F1_MACRO: 0.582966	valid_1's binary_logloss: 0.308315	valid_1's F1_MACRO: 0.555825
[6]	training's binary_logloss: 0.257184	training's F1_MACRO: 0.690297	valid_1's binary_logloss: 0.296673	valid_1's F1_MACRO: 0.646971
[7]	training'

[I 2021-03-08 12:34:56,286] Trial 1 finished with value: 0.8003705845248108 and parameters: {'n_estimators': 300, 'lambda_l1': 2.7734928507610107e-06, 'lambda_l2': 0.046323395551936715, 'max_depth': 14, 'num_leaves': 221}. Best is trial 0 with value: 0.807009447544516.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.380762	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.389008	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.346592	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.360993	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.320156	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.340198	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.298648	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.323561	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.280832	training's F1_MACRO: 0.467809	valid_1's binary_logloss: 0.309801	valid_1's F1_MACRO: 0.463072
[6]	training's binary_logloss: 0.264034	training's F1_MACRO: 0.668995	valid_1's binary_logloss: 0.298167	valid_1's F1_MACRO: 0.652886
[7]	training'

[I 2021-03-08 12:35:01,714] Trial 2 finished with value: 0.81677257483596 and parameters: {'n_estimators': 400, 'lambda_l1': 5.030505346246275e-07, 'lambda_l2': 0.3742497979538916, 'max_depth': 11, 'num_leaves': 191}. Best is trial 2 with value: 0.81677257483596.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377312	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386158	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341574	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357902	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314132	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336528	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292124	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.32051	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273594	training's F1_MACRO: 0.590719	valid_1's binary_logloss: 0.307177	valid_1's F1_MACRO: 0.571061
[6]	training's binary_logloss: 0.25682	training's F1_MACRO: 0.697307	valid_1's binary_logloss: 0.295386	valid_1's F1_MACRO: 0.653363
[7]	training's 

[I 2021-03-08 12:35:06,607] Trial 3 finished with value: 0.8050942773517227 and parameters: {'n_estimators': 300, 'lambda_l1': 0.0018470991576140473, 'lambda_l2': 6.821404453380125e-07, 'max_depth': 14, 'num_leaves': 218}. Best is trial 2 with value: 0.81677257483596.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377187	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386238	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341351	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357646	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314176	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336603	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292122	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320053	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273499	training's F1_MACRO: 0.585998	valid_1's binary_logloss: 0.305633	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256682	training's F1_MACRO: 0.70154	valid_1's binary_logloss: 0.294412	valid_1's F1_MACRO: 0.658751
[7]	training's

[I 2021-03-08 12:35:11,215] Trial 4 finished with value: 0.8097304744682683 and parameters: {'n_estimators': 450, 'lambda_l1': 2.421234135344689e-07, 'lambda_l2': 0.003944092453689924, 'max_depth': 17, 'num_leaves': 129}. Best is trial 2 with value: 0.81677257483596.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377164	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386221	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341331	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357632	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.31416	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336613	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292113	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.32008	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273492	training's F1_MACRO: 0.587892	valid_1's binary_logloss: 0.305754	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256683	training's F1_MACRO: 0.70154	valid_1's binary_logloss: 0.294541	valid_1's F1_MACRO: 0.658751
[7]	training's b

[I 2021-03-08 12:35:18,491] Trial 5 finished with value: 0.807009447544516 and parameters: {'n_estimators': 400, 'lambda_l1': 0.007277599447534378, 'lambda_l2': 2.879267902102317e-06, 'max_depth': 23, 'num_leaves': 122}. Best is trial 2 with value: 0.81677257483596.


You can set `force_col_wise=true` to remove the overhead.
[1]	training's binary_logloss: 0.377221	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386265	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341393	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357678	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.31421	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336859	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292148	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320272	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273502	training's F1_MACRO: 0.589778	valid_1's binary_logloss: 0.305734	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.25665	training's F1_MACRO: 0.696303	valid_1's binary_logloss: 0.294448	valid_1's F1_MACRO: 0.655617
[7]	training's binary_logloss: 0.242004	training's F1_MACRO: 0.758858	valid_1's

[I 2021-03-08 12:35:23,327] Trial 6 finished with value: 0.8113686902075627 and parameters: {'n_estimators': 400, 'lambda_l1': 4.820323998449861e-06, 'lambda_l2': 0.006821879980297473, 'max_depth': 20, 'num_leaves': 166}. Best is trial 2 with value: 0.81677257483596.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377883	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.385766	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.342126	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.3574	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314894	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.33652	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292958	training's F1_MACRO: 0.459373	valid_1's binary_logloss: 0.319079	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.274449	training's F1_MACRO: 0.601866	valid_1's binary_logloss: 0.306552	valid_1's F1_MACRO: 0.574269
[6]	training's binary_logloss: 0.25757	training's F1_MACRO: 0.700058	valid_1's binary_logloss: 0.294909	valid_1's F1_MACRO: 0.660942
[7]	training's bi

[I 2021-03-08 12:35:28,213] Trial 7 finished with value: 0.8197518825622048 and parameters: {'n_estimators': 400, 'lambda_l1': 6.416593051802503e-07, 'lambda_l2': 1.736720097074857e-08, 'max_depth': 11, 'num_leaves': 248}. Best is trial 7 with value: 0.8197518825622048.


You can set `force_col_wise=true` to remove the overhead.
[1]	training's binary_logloss: 0.377141	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386199	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341294	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.3576	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314115	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336555	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292061	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320001	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273437	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305586	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256616	training's F1_MACRO: 0.699797	valid_1's binary_logloss: 0.294194	valid_1's F1_MACRO: 0.656527
[7]	training's binary_logloss: 0.24199	training's F1_MACRO: 0.754337	valid_1's 

[I 2021-03-08 12:35:30,244] Trial 8 finished with value: 0.81299365072143 and parameters: {'n_estimators': 400, 'lambda_l1': 0.00011748051393132616, 'lambda_l2': 3.16467232856096e-05, 'max_depth': 20, 'num_leaves': 211}. Best is trial 7 with value: 0.8197518825622048.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.379932	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386454	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.346602	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.358192	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.321742	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.338038	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.301176	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320536	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.284646	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.307236	valid_1's F1_MACRO: 0.458219
[6]	training's binary_logloss: 0.269551	training's F1_MACRO: 0.683487	valid_1's binary_logloss: 0.29534	valid_1's F1_MACRO: 0.662453
[7]	training's

[I 2021-03-08 12:35:33,457] Trial 9 finished with value: 0.7978930316994833 and parameters: {'n_estimators': 350, 'lambda_l1': 2.369961396673891e-05, 'lambda_l2': 2.4062293119841455e-08, 'max_depth': 20, 'num_leaves': 39}. Best is trial 7 with value: 0.8197518825622048.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.389585	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.393086	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.361398	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.366076	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.340146	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.346082	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.32338	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.329433	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.3091	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.315938	valid_1's F1_MACRO: 0.458219
[6]	training's binary_logloss: 0.297747	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.304919	valid_1's F1_MACRO: 0.458219
[7]	training's b

[I 2021-03-08 12:35:39,372] Trial 10 finished with value: 0.8077621635953864 and parameters: {'n_estimators': 500, 'lambda_l1': 9.471699202243148, 'lambda_l2': 1.2009314899333601e-08, 'max_depth': 8, 'num_leaves': 38}. Best is trial 7 with value: 0.8197518825622048.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.39099	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.393402	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.362351	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.366386	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.340136	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.345773	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.321597	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.328887	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.30608	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.314511	valid_1's F1_MACRO: 0.458219
[6]	training's binary_logloss: 0.291898	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.302096	valid_1's F1_MACRO: 0.458219
[7]	training's 

[I 2021-03-08 12:35:43,859] Trial 11 finished with value: 0.8086079457961195 and parameters: {'n_estimators': 450, 'lambda_l1': 1.2261045395595822e-08, 'lambda_l2': 7.533285456879808, 'max_depth': 8, 'num_leaves': 247}. Best is trial 7 with value: 0.8197518825622048.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.386523	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.389526	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.355952	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.361919	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.331953	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.341276	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.311804	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.32522	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.295438	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.311638	valid_1's F1_MACRO: 0.458219
[6]	training's binary_logloss: 0.280433	training's F1_MACRO: 0.566815	valid_1's binary_logloss: 0.299944	valid_1's F1_MACRO: 0.559225
[7]	training's

[I 2021-03-08 12:35:47,517] Trial 12 finished with value: 0.7986079809094524 and parameters: {'n_estimators': 350, 'lambda_l1': 1.0013760692409686e-08, 'lambda_l2': 2.60024355676058, 'max_depth': 11, 'num_leaves': 167}. Best is trial 7 with value: 0.8197518825622048.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.381333	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.389076	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.347113	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.361011	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.320622	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.340224	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.299323	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.325184	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.280534	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.31093	valid_1's F1_MACRO: 0.458219
[6]	training's binary_logloss: 0.264241	training's F1_MACRO: 0.655865	valid_1's binary_logloss: 0.299008	valid_1's F1_MACRO: 0.633996
[7]	training's

[I 2021-03-08 12:35:52,358] Trial 13 finished with value: 0.788271832071769 and parameters: {'n_estimators': 450, 'lambda_l1': 8.12308496784239e-08, 'lambda_l2': 0.4195418141542772, 'max_depth': 11, 'num_leaves': 253}. Best is trial 7 with value: 0.8197518825622048.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377885	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.385768	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.342128	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357355	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.3149	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336416	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292979	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.318825	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.274473	training's F1_MACRO: 0.601866	valid_1's binary_logloss: 0.306423	valid_1's F1_MACRO: 0.571061
[6]	training's binary_logloss: 0.257594	training's F1_MACRO: 0.70349	valid_1's binary_logloss: 0.294785	valid_1's F1_MACRO: 0.664025
[7]	training's b

[I 2021-03-08 12:35:56,706] Trial 14 finished with value: 0.8046156880230484 and parameters: {'n_estimators': 350, 'lambda_l1': 3.195323608580574e-08, 'lambda_l2': 0.00018648742747349648, 'max_depth': 11, 'num_leaves': 172}. Best is trial 7 with value: 0.8197518825622048.


You can set `force_col_wise=true` to remove the overhead.
[1]	training's binary_logloss: 0.381304	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.388221	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.347452	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.360754	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.321677	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.339868	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.300938	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.322473	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.283764	training's F1_MACRO: 0.532829	valid_1's binary_logloss: 0.310027	valid_1's F1_MACRO: 0.504867
[6]	training's binary_logloss: 0.267753	training's F1_MACRO: 0.670327	valid_1's binary_logloss: 0.298133	valid_1's F1_MACRO: 0.646397
[7]	training's binary_logloss: 0.254063	training's F1_MACRO: 0.723284	valid_1

[I 2021-03-08 12:36:01,731] Trial 15 finished with value: 0.8042493152596779 and parameters: {'n_estimators': 500, 'lambda_l1': 0.07145503397467905, 'lambda_l2': 0.24658031542636139, 'max_depth': 8, 'num_leaves': 256}. Best is trial 7 with value: 0.8197518825622048.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377913	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.385768	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.342249	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357403	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.31514	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336519	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.293219	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.318958	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.274758	training's F1_MACRO: 0.598179	valid_1's binary_logloss: 0.306583	valid_1's F1_MACRO: 0.567147
[6]	training's binary_logloss: 0.257926	training's F1_MACRO: 0.702754	valid_1's binary_logloss: 0.294747	valid_1's F1_MACRO: 0.664025
[7]	training's

[I 2021-03-08 12:36:06,923] Trial 16 finished with value: 0.8100015491329731 and parameters: {'n_estimators': 450, 'lambda_l1': 3.9371200529717024e-05, 'lambda_l2': 0.0019675209117817716, 'max_depth': 11, 'num_leaves': 100}. Best is trial 7 with value: 0.8197518825622048.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377306	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386137	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341565	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.35788	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314119	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336507	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292109	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320486	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273577	training's F1_MACRO: 0.590719	valid_1's binary_logloss: 0.307154	valid_1's F1_MACRO: 0.571061
[6]	training's binary_logloss: 0.256845	training's F1_MACRO: 0.697307	valid_1's binary_logloss: 0.295392	valid_1's F1_MACRO: 0.653363
[7]	training's

[I 2021-03-08 12:36:12,031] Trial 17 finished with value: 0.7957248274749901 and parameters: {'n_estimators': 350, 'lambda_l1': 9.410070458105057e-07, 'lambda_l2': 2.456925513399731e-05, 'max_depth': 14, 'num_leaves': 183}. Best is trial 7 with value: 0.8197518825622048.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.391978	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.394331	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.363972	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.367656	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.342044	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.347525	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.32407	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.330769	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.30872	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.316672	valid_1's F1_MACRO: 0.458219
[6]	training's binary_logloss: 0.294859	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.304643	valid_1's F1_MACRO: 0.458219
[7]	training's 

[I 2021-03-08 12:36:16,728] Trial 18 finished with value: 0.8105430787449364 and parameters: {'n_estimators': 400, 'lambda_l1': 1.278535014544274e-05, 'lambda_l2': 9.693557882425107, 'max_depth': 11, 'num_leaves': 193}. Best is trial 7 with value: 0.8197518825622048.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377142	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386215	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341296	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357616	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314118	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336571	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292065	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320018	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273443	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305599	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256578	training's F1_MACRO: 0.699797	valid_1's binary_logloss: 0.29418	valid_1's F1_MACRO: 0.656527
[7]	training's

[I 2021-03-08 12:36:22,715] Trial 19 finished with value: 0.8204229930775999 and parameters: {'n_estimators': 400, 'lambda_l1': 0.0005370925926025783, 'lambda_l2': 6.041042048136747e-08, 'max_depth': 17, 'num_leaves': 135}. Best is trial 19 with value: 0.8204229930775999.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377751	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386096	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.34246	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357899	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.315426	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.337193	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.293296	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320618	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.274964	training's F1_MACRO: 0.585818	valid_1's binary_logloss: 0.30817	valid_1's F1_MACRO: 0.571061
[6]	training's binary_logloss: 0.259101	training's F1_MACRO: 0.696045	valid_1's binary_logloss: 0.297168	valid_1's F1_MACRO: 0.661863
[7]	training's 

[I 2021-03-08 12:36:26,312] Trial 20 finished with value: 0.8025320075674249 and parameters: {'n_estimators': 450, 'lambda_l1': 0.06798181056470698, 'lambda_l2': 4.694141125982079e-08, 'max_depth': 17, 'num_leaves': 86}. Best is trial 19 with value: 0.8204229930775999.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377143	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386189	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341298	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357592	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314119	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.33655	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292066	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320003	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273444	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305587	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256672	training's F1_MACRO: 0.70154	valid_1's binary_logloss: 0.294403	valid_1's F1_MACRO: 0.658751
[7]	training's 

[I 2021-03-08 12:36:30,489] Trial 21 finished with value: 0.7980331427791445 and parameters: {'n_estimators': 400, 'lambda_l1': 0.0009189393734438107, 'lambda_l2': 1.2753524031938233e-07, 'max_depth': 17, 'num_leaves': 133}. Best is trial 19 with value: 0.8204229930775999.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377307	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386153	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341566	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357896	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314122	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336521	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292112	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320501	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273581	training's F1_MACRO: 0.590719	valid_1's binary_logloss: 0.307167	valid_1's F1_MACRO: 0.571061
[6]	training's binary_logloss: 0.256806	training's F1_MACRO: 0.697307	valid_1's binary_logloss: 0.295378	valid_1's F1_MACRO: 0.653363
[7]	training'

[I 2021-03-08 12:36:34,812] Trial 22 finished with value: 0.8037845517954016 and parameters: {'n_estimators': 350, 'lambda_l1': 0.0002515895460434268, 'lambda_l2': 1.792704793652352e-07, 'max_depth': 14, 'num_leaves': 148}. Best is trial 19 with value: 0.8204229930775999.


You can set `force_col_wise=true` to remove the overhead.
[1]	training's binary_logloss: 0.378009	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386124	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.343293	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.358373	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.316831	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.337632	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.295321	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.321449	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.277577	training's F1_MACRO: 0.572362	valid_1's binary_logloss: 0.307348	valid_1's F1_MACRO: 0.559225
[6]	training's binary_logloss: 0.261489	training's F1_MACRO: 0.703121	valid_1's binary_logloss: 0.296484	valid_1's F1_MACRO: 0.646971
[7]	training's binary_logloss: 0.247674	training's F1_MACRO: 0.75834	valid_1'

[I 2021-03-08 12:36:38,295] Trial 23 finished with value: 0.8037845517954016 and parameters: {'n_estimators': 400, 'lambda_l1': 0.01599899366208743, 'lambda_l2': 1.2193861076081818e-08, 'max_depth': 17, 'num_leaves': 66}. Best is trial 19 with value: 0.8204229930775999.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.383826	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.389002	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.352834	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.360499	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.329129	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.339015	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.310216	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.322149	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.294222	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.308525	valid_1's F1_MACRO: 0.458219
[6]	training's binary_logloss: 0.279709	training's F1_MACRO: 0.634851	valid_1's binary_logloss: 0.29694	valid_1's F1_MACRO: 0.633139
[7]	training's

[I 2021-03-08 12:36:42,121] Trial 24 finished with value: 0.8138649520526757 and parameters: {'n_estimators': 400, 'lambda_l1': 1.7608305328348748, 'lambda_l2': 1.0884563765857768e-05, 'max_depth': 8, 'num_leaves': 236}. Best is trial 19 with value: 0.8204229930775999.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377752	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386229	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.342188	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357985	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314678	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.337114	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292377	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.321104	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.27393	training's F1_MACRO: 0.578347	valid_1's binary_logloss: 0.308221	valid_1's F1_MACRO: 0.543557
[6]	training's binary_logloss: 0.257088	training's F1_MACRO: 0.692559	valid_1's binary_logloss: 0.296476	valid_1's F1_MACRO: 0.637215
[7]	training's

[I 2021-03-08 12:36:45,378] Trial 25 finished with value: 0.7915823301729341 and parameters: {'n_estimators': 450, 'lambda_l1': 1.3294965151413686e-07, 'lambda_l2': 0.034582395074839886, 'max_depth': 14, 'num_leaves': 199}. Best is trial 19 with value: 0.8204229930775999.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377885	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.385764	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.342128	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357351	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314911	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336444	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.29299	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.31885	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.274714	training's F1_MACRO: 0.601866	valid_1's binary_logloss: 0.306167	valid_1's F1_MACRO: 0.571061
[6]	training's binary_logloss: 0.257809	training's F1_MACRO: 0.70349	valid_1's binary_logloss: 0.294546	valid_1's F1_MACRO: 0.664025
[7]	training's b

[I 2021-03-08 12:36:49,734] Trial 26 finished with value: 0.8102724132516879 and parameters: {'n_estimators': 350, 'lambda_l1': 1.9087038161653488e-06, 'lambda_l2': 0.00019385372904472887, 'max_depth': 11, 'num_leaves': 149}. Best is trial 19 with value: 0.8204229930775999.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377203	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386196	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.34143	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357624	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314328	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336602	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292281	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320061	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273737	training's F1_MACRO: 0.590719	valid_1's binary_logloss: 0.305665	valid_1's F1_MACRO: 0.562567
[6]	training's binary_logloss: 0.25694	training's F1_MACRO: 0.699797	valid_1's binary_logloss: 0.294281	valid_1's F1_MACRO: 0.656527
[7]	training's 

[I 2021-03-08 12:36:53,431] Trial 27 finished with value: 0.7978930316994833 and parameters: {'n_estimators': 400, 'lambda_l1': 8.714703304233093e-05, 'lambda_l2': 1.0974634546594264e-07, 'max_depth': 23, 'num_leaves': 105}. Best is trial 19 with value: 0.8204229930775999.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.386492	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.389639	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.357651	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.362509	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.335821	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.34156	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.31843	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.324744	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.303097	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.311167	valid_1's F1_MACRO: 0.458219
[6]	training's binary_logloss: 0.290765	training's F1_MACRO: 0.560582	valid_1's binary_logloss: 0.299784	valid_1's F1_MACRO: 0.554609
[7]	training's 

[I 2021-03-08 12:36:55,533] Trial 28 finished with value: 0.8025320075674249 and parameters: {'n_estimators': 450, 'lambda_l1': 0.0008639639778507427, 'lambda_l2': 0.000914225545209549, 'max_depth': 14, 'num_leaves': 9}. Best is trial 19 with value: 0.8204229930775999.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.37714	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386202	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341295	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357682	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314113	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336964	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.29206	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320347	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273412	training's F1_MACRO: 0.597253	valid_1's binary_logloss: 0.30582	valid_1's F1_MACRO: 0.559225
[6]	training's binary_logloss: 0.256582	training's F1_MACRO: 0.698571	valid_1's binary_logloss: 0.294659	valid_1's F1_MACRO: 0.646087
[7]	training's b

[I 2021-03-08 12:36:59,860] Trial 29 finished with value: 0.7977122616384362 and parameters: {'n_estimators': 350, 'lambda_l1': 4.133868202246413e-07, 'lambda_l2': 1.267163187708812e-06, 'max_depth': 17, 'num_leaves': 232}. Best is trial 19 with value: 0.8204229930775999.


You can set `force_col_wise=true` to remove the overhead.
[1]	training's binary_logloss: 0.377883	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.385762	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.342125	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357348	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314908	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336441	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292987	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.318847	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.274711	training's F1_MACRO: 0.601866	valid_1's binary_logloss: 0.306165	valid_1's F1_MACRO: 0.571061
[6]	training's binary_logloss: 0.257806	training's F1_MACRO: 0.70349	valid_1's binary_logloss: 0.294544	valid_1's F1_MACRO: 0.664025
[7]	training's binary_logloss: 0.243066	training's F1_MACRO: 0.757441	valid_1'

[I 2021-03-08 12:37:03,341] Trial 30 finished with value: 0.8102724132516879 and parameters: {'n_estimators': 400, 'lambda_l1': 1.2495981970706537e-05, 'lambda_l2': 5.057284670080416e-07, 'max_depth': 11, 'num_leaves': 199}. Best is trial 19 with value: 0.8204229930775999.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.389126	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.392252	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.360735	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.364959	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.339368	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.344701	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.321915	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.328559	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.308034	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.315082	valid_1's F1_MACRO: 0.458219
[6]	training's binary_logloss: 0.296144	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.303942	valid_1's F1_MACRO: 0.458219
[7]	training'

[I 2021-03-08 12:37:09,530] Trial 31 finished with value: 0.8122001569438748 and parameters: {'n_estimators': 400, 'lambda_l1': 8.455730054977042, 'lambda_l2': 8.016117816042623e-06, 'max_depth': 8, 'num_leaves': 237}. Best is trial 19 with value: 0.8204229930775999.


You can set `force_col_wise=true` to remove the overhead.
[1]	training's binary_logloss: 0.383469	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.388914	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.35265	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.360734	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.328145	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.33961	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.309177	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.322842	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.293204	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.309023	valid_1's F1_MACRO: 0.458219
[6]	training's binary_logloss: 0.278465	training's F1_MACRO: 0.636974	valid_1's binary_logloss: 0.297283	valid_1's F1_MACRO: 0.616829
[7]	training's binary_logloss: 0.265993	training's F1_MACRO: 0.71661	valid_1's 

[I 2021-03-08 12:37:14,484] Trial 32 finished with value: 0.8127531937550225 and parameters: {'n_estimators': 400, 'lambda_l1': 1.5716613128415478, 'lambda_l2': 3.4961596999169914e-05, 'max_depth': 8, 'num_leaves': 236}. Best is trial 19 with value: 0.8204229930775999.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.380258	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386929	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.346173	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.3597	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.320696	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.339581	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.299963	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.324298	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.282721	training's F1_MACRO: 0.574937	valid_1's binary_logloss: 0.311273	valid_1's F1_MACRO: 0.551174
[6]	training's binary_logloss: 0.267028	training's F1_MACRO: 0.683458	valid_1's binary_logloss: 0.299217	valid_1's F1_MACRO: 0.650674
[7]	training's 

[I 2021-03-08 12:37:18,706] Trial 33 finished with value: 0.798226217267668 and parameters: {'n_estimators': 400, 'lambda_l1': 0.4302093128584469, 'lambda_l2': 4.882404679782239e-06, 'max_depth': 8, 'num_leaves': 216}. Best is trial 19 with value: 0.8204229930775999.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377883	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.385762	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.342126	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357427	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314905	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336578	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292969	training's F1_MACRO: 0.459373	valid_1's binary_logloss: 0.319101	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.27469	training's F1_MACRO: 0.601866	valid_1's binary_logloss: 0.306292	valid_1's F1_MACRO: 0.574269
[6]	training's binary_logloss: 0.257785	training's F1_MACRO: 0.700058	valid_1's binary_logloss: 0.294666	valid_1's F1_MACRO: 0.660942
[7]	training's

[I 2021-03-08 12:37:23,743] Trial 34 finished with value: 0.8001653746770025 and parameters: {'n_estimators': 300, 'lambda_l1': 1.7744996848087621e-06, 'lambda_l2': 3.925595372407288e-07, 'max_depth': 11, 'num_leaves': 229}. Best is trial 19 with value: 0.8204229930775999.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377306	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386141	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341566	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357935	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314123	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336563	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292191	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320432	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273697	training's F1_MACRO: 0.587892	valid_1's binary_logloss: 0.30749	valid_1's F1_MACRO: 0.570399
[6]	training's binary_logloss: 0.256735	training's F1_MACRO: 0.696332	valid_1's binary_logloss: 0.29605	valid_1's F1_MACRO: 0.664954
[7]	training's 

[I 2021-03-08 12:37:29,444] Trial 35 finished with value: 0.7990971781933142 and parameters: {'n_estimators': 400, 'lambda_l1': 3.468356618286938e-08, 'lambda_l2': 1.0148014607254337e-08, 'max_depth': 14, 'num_leaves': 211}. Best is trial 19 with value: 0.8204229930775999.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.379365	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386818	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.345088	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.358287	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.31861	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.337207	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.297113	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.319902	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.279796	training's F1_MACRO: 0.573504	valid_1's binary_logloss: 0.306379	valid_1's F1_MACRO: 0.541872
[6]	training's binary_logloss: 0.263761	training's F1_MACRO: 0.691307	valid_1's binary_logloss: 0.294933	valid_1's F1_MACRO: 0.660592
[7]	training's

[I 2021-03-08 12:37:35,086] Trial 36 finished with value: 0.8023143873375257 and parameters: {'n_estimators': 450, 'lambda_l1': 4.438055679108835e-06, 'lambda_l2': 0.018670287175051734, 'max_depth': 8, 'num_leaves': 156}. Best is trial 19 with value: 0.8204229930775999.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377153	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386196	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341313	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357604	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314137	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336584	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292086	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320036	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273466	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305626	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256697	training's F1_MACRO: 0.70154	valid_1's binary_logloss: 0.29444	valid_1's F1_MACRO: 0.658751
[7]	training's 

[I 2021-03-08 12:37:40,146] Trial 37 finished with value: 0.803619203206487 and parameters: {'n_estimators': 350, 'lambda_l1': 0.003781965361968245, 'lambda_l2': 4.5044767465894034e-08, 'max_depth': 17, 'num_leaves': 184}. Best is trial 19 with value: 0.8204229930775999.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.37714	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386186	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341294	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357667	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314111	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336951	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292058	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320335	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.27341	training's F1_MACRO: 0.597253	valid_1's binary_logloss: 0.305808	valid_1's F1_MACRO: 0.559225
[6]	training's binary_logloss: 0.256624	training's F1_MACRO: 0.698571	valid_1's binary_logloss: 0.294676	valid_1's F1_MACRO: 0.646087
[7]	training's 

[I 2021-03-08 12:37:44,467] Trial 38 finished with value: 0.8033952726380711 and parameters: {'n_estimators': 400, 'lambda_l1': 3.652619502791155e-07, 'lambda_l2': 2.177596632652566e-06, 'max_depth': 20, 'num_leaves': 252}. Best is trial 19 with value: 0.8204229930775999.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.378053	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.385909	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.342606	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357678	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.315509	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336858	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.293523	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.319974	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.275154	training's F1_MACRO: 0.587892	valid_1's binary_logloss: 0.306867	valid_1's F1_MACRO: 0.563202
[6]	training's binary_logloss: 0.258273	training's F1_MACRO: 0.693567	valid_1's binary_logloss: 0.295447	valid_1's F1_MACRO: 0.669191
[7]	training'

[I 2021-03-08 12:37:50,580] Trial 39 finished with value: 0.8014491465246933 and parameters: {'n_estimators': 400, 'lambda_l1': 0.03803945538082402, 'lambda_l2': 0.0005212956482258459, 'max_depth': 11, 'num_leaves': 125}. Best is trial 19 with value: 0.8204229930775999.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.378145	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.387244	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.344121	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.359409	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.317861	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.338655	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.296844	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.32264	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.278877	training's F1_MACRO: 0.546212	valid_1's binary_logloss: 0.310315	valid_1's F1_MACRO: 0.551174
[6]	training's binary_logloss: 0.263643	training's F1_MACRO: 0.684484	valid_1's binary_logloss: 0.30028	valid_1's F1_MACRO: 0.658751
[7]	training's 

[I 2021-03-08 12:37:57,714] Trial 40 finished with value: 0.7944852126579516 and parameters: {'n_estimators': 450, 'lambda_l1': 0.43655420559784835, 'lambda_l2': 1.3338972327217739e-05, 'max_depth': 14, 'num_leaves': 217}. Best is trial 19 with value: 0.8204229930775999.


You can set `force_col_wise=true` to remove the overhead.
[1]	training's binary_logloss: 0.377141	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386214	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341295	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357614	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314116	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336568	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292062	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320013	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273439	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305597	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256574	training's F1_MACRO: 0.699797	valid_1's binary_logloss: 0.294177	valid_1's F1_MACRO: 0.656527
[7]	training's binary_logloss: 0.241933	training's F1_MACRO: 0.754337	valid_1

[I 2021-03-08 12:38:01,488] Trial 41 finished with value: 0.7986079809094524 and parameters: {'n_estimators': 400, 'lambda_l1': 9.926120040843689e-05, 'lambda_l2': 3.675313776814178e-05, 'max_depth': 23, 'num_leaves': 242}. Best is trial 19 with value: 0.8204229930775999.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377141	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386187	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341295	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.35759	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314115	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336547	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292061	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.319998	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273437	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305583	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256615	training's F1_MACRO: 0.699797	valid_1's binary_logloss: 0.294193	valid_1's F1_MACRO: 0.656527
[7]	training's

[I 2021-03-08 12:38:08,522] Trial 42 finished with value: 0.8212005983952129 and parameters: {'n_estimators': 400, 'lambda_l1': 8.379812902948931e-07, 'lambda_l2': 9.52501649951279e-05, 'max_depth': 20, 'num_leaves': 208}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377141	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386203	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341295	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357604	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314116	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.33656	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292062	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320009	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273439	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305594	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256573	training's F1_MACRO: 0.699797	valid_1's binary_logloss: 0.294175	valid_1's F1_MACRO: 0.656527
[7]	training's

[I 2021-03-08 12:38:12,356] Trial 43 finished with value: 0.8025320075674249 and parameters: {'n_estimators': 400, 'lambda_l1': 6.818478732964152e-07, 'lambda_l2': 7.792122582560476e-05, 'max_depth': 20, 'num_leaves': 226}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377258	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.38629	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341438	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357708	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314318	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.337029	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292265	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320119	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273618	training's F1_MACRO: 0.580271	valid_1's binary_logloss: 0.305806	valid_1's F1_MACRO: 0.559225
[6]	training's binary_logloss: 0.256783	training's F1_MACRO: 0.695815	valid_1's binary_logloss: 0.294392	valid_1's F1_MACRO: 0.650178
[7]	training's

[I 2021-03-08 12:38:17,269] Trial 44 finished with value: 0.8010252443676016 and parameters: {'n_estimators': 400, 'lambda_l1': 1.3225801944150969e-07, 'lambda_l2': 0.009936078281451011, 'max_depth': 20, 'num_leaves': 207}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377157	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386199	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341314	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357604	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314135	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336561	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292081	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320013	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273458	training's F1_MACRO: 0.587892	valid_1's binary_logloss: 0.305597	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256686	training's F1_MACRO: 0.70154	valid_1's binary_logloss: 0.294411	valid_1's F1_MACRO: 0.658751
[7]	training's

[I 2021-03-08 12:38:22,990] Trial 45 finished with value: 0.8086511846722455 and parameters: {'n_estimators': 350, 'lambda_l1': 8.580671901674502e-06, 'lambda_l2': 0.0014038956288724097, 'max_depth': 20, 'num_leaves': 178}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.379174	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.387987	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.344574	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.360457	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.317349	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.34095	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.295067	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.324995	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.27685	training's F1_MACRO: 0.563354	valid_1's binary_logloss: 0.312445	valid_1's F1_MACRO: 0.551769
[6]	training's binary_logloss: 0.259683	training's F1_MACRO: 0.682443	valid_1's binary_logloss: 0.300953	valid_1's F1_MACRO: 0.646087
[7]	training's 

[I 2021-03-08 12:38:27,163] Trial 46 finished with value: 0.7914405491417731 and parameters: {'n_estimators': 400, 'lambda_l1': 4.8874514317094556e-08, 'lambda_l2': 0.24017956059609433, 'max_depth': 23, 'num_leaves': 191}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.383918	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.389287	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.351793	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.361857	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.32666	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.341246	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.306154	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.323838	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.289128	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.309983	valid_1's F1_MACRO: 0.458219
[6]	training's binary_logloss: 0.273914	training's F1_MACRO: 0.6156	valid_1's binary_logloss: 0.29776	valid_1's F1_MACRO: 0.616022
[7]	training's bi

[I 2021-03-08 12:38:33,685] Trial 47 finished with value: 0.8174048921209207 and parameters: {'n_estimators': 450, 'lambda_l1': 1.6844985668267873e-08, 'lambda_l2': 1.2168850449121744, 'max_depth': 17, 'num_leaves': 222}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.385135	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.390018	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.353306	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.36243	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.328098	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.340987	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.308006	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.324319	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.290876	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.311045	valid_1's F1_MACRO: 0.458219
[6]	training's binary_logloss: 0.275676	training's F1_MACRO: 0.600336	valid_1's binary_logloss: 0.298634	valid_1's F1_MACRO: 0.600533
[7]	training's

[I 2021-03-08 12:38:39,127] Trial 48 finished with value: 0.803619203206487 and parameters: {'n_estimators': 500, 'lambda_l1': 1.0426945596077343e-08, 'lambda_l2': 1.55552419318833, 'max_depth': 17, 'num_leaves': 163}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.383155	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.388858	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.350304	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.360556	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.324902	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.339081	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.30306	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.321945	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.285368	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.307908	valid_1's F1_MACRO: 0.458219
[6]	training's binary_logloss: 0.269149	training's F1_MACRO: 0.632953	valid_1's binary_logloss: 0.296508	valid_1's F1_MACRO: 0.637356
[7]	training's

[I 2021-03-08 12:38:43,645] Trial 49 finished with value: 0.8033952726380711 and parameters: {'n_estimators': 450, 'lambda_l1': 1.8502106910400736e-08, 'lambda_l2': 0.8310147422416555, 'max_depth': 17, 'num_leaves': 140}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.378559	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.387216	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.343759	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.360236	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.316706	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.34038	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.295097	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.323594	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.276445	training's F1_MACRO: 0.557217	valid_1's binary_logloss: 0.310969	valid_1's F1_MACRO: 0.551174
[6]	training's binary_logloss: 0.260554	training's F1_MACRO: 0.676806	valid_1's binary_logloss: 0.30051	valid_1's F1_MACRO: 0.646087
[7]	training's 

[I 2021-03-08 12:38:47,657] Trial 50 finished with value: 0.7932600844674886 and parameters: {'n_estimators': 500, 'lambda_l1': 4.4022699659966316e-05, 'lambda_l2': 0.18139995483629448, 'max_depth': 20, 'num_leaves': 220}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.387951	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.39012	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.357692	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.363251	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.334057	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.341443	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.314545	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.324272	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.298432	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.310711	valid_1's F1_MACRO: 0.458219
[6]	training's binary_logloss: 0.283695	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.298671	valid_1's F1_MACRO: 0.458219
[7]	training's

[I 2021-03-08 12:38:53,394] Trial 51 finished with value: 0.8055699766817721 and parameters: {'n_estimators': 450, 'lambda_l1': 1.5331123621043337e-07, 'lambda_l2': 3.2957663773053456, 'max_depth': 17, 'num_leaves': 243}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377194	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386228	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341359	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357638	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314183	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336595	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292129	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320046	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273505	training's F1_MACRO: 0.585998	valid_1's binary_logloss: 0.305627	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256733	training's F1_MACRO: 0.70154	valid_1's binary_logloss: 0.294434	valid_1's F1_MACRO: 0.658751
[7]	training's

[I 2021-03-08 12:38:57,672] Trial 52 finished with value: 0.8118331870450938 and parameters: {'n_estimators': 400, 'lambda_l1': 1.4017020928455198e-06, 'lambda_l2': 0.004495466241508117, 'max_depth': 17, 'num_leaves': 203}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.37839	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386879	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.343283	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.358954	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.316082	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.33801	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.293878	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.321715	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.27532	training's F1_MACRO: 0.57253	valid_1's binary_logloss: 0.308694	valid_1's F1_MACRO: 0.542431
[6]	training's binary_logloss: 0.258755	training's F1_MACRO: 0.691052	valid_1's binary_logloss: 0.297192	valid_1's F1_MACRO: 0.655617
[7]	training's bi

[I 2021-03-08 12:39:04,570] Trial 53 finished with value: 0.8025320075674249 and parameters: {'n_estimators': 350, 'lambda_l1': 2.7554420311290504e-07, 'lambda_l2': 0.07498846614358642, 'max_depth': 14, 'num_leaves': 250}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377148	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386181	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341308	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357583	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314142	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336561	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292087	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320011	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273477	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305604	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256656	training's F1_MACRO: 0.699797	valid_1's binary_logloss: 0.294223	valid_1's F1_MACRO: 0.656527
[7]	training'

[I 2021-03-08 12:39:08,585] Trial 54 finished with value: 0.8061754385964912 and parameters: {'n_estimators': 450, 'lambda_l1': 5.6806642827107634e-08, 'lambda_l2': 0.00010313668327817212, 'max_depth': 20, 'num_leaves': 110}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377306	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386125	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341565	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357921	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314122	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336549	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.29219	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.32042	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273695	training's F1_MACRO: 0.587892	valid_1's binary_logloss: 0.307479	valid_1's F1_MACRO: 0.570399
[6]	training's binary_logloss: 0.256777	training's F1_MACRO: 0.696332	valid_1's binary_logloss: 0.296067	valid_1's F1_MACRO: 0.664954
[7]	training's 

[I 2021-03-08 12:39:13,037] Trial 55 finished with value: 0.798226217267668 and parameters: {'n_estimators': 400, 'lambda_l1': 3.856396010949237e-06, 'lambda_l2': 2.9689667215321936e-08, 'max_depth': 14, 'num_leaves': 256}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.379171	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386672	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.34492	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.358325	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.318576	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.337268	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.297373	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320724	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.279547	training's F1_MACRO: 0.562679	valid_1's binary_logloss: 0.307452	valid_1's F1_MACRO: 0.562567
[6]	training's binary_logloss: 0.263516	training's F1_MACRO: 0.695815	valid_1's binary_logloss: 0.29573	valid_1's F1_MACRO: 0.660592
[7]	training's 

[I 2021-03-08 12:39:16,636] Trial 56 finished with value: 0.8110913765101313 and parameters: {'n_estimators': 350, 'lambda_l1': 9.62754905830108e-07, 'lambda_l2': 0.00038427287826762536, 'max_depth': 8, 'num_leaves': 78}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.389782	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.391983	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.360692	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.364996	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.337709	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.344281	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.318859	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.326913	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.303369	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.31272	valid_1's F1_MACRO: 0.458219
[6]	training's binary_logloss: 0.288972	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.300499	valid_1's F1_MACRO: 0.458219
[7]	training's

[I 2021-03-08 12:39:21,621] Trial 57 finished with value: 0.8016593751380972 and parameters: {'n_estimators': 450, 'lambda_l1': 1.6390696463598433e-08, 'lambda_l2': 5.605821615735379, 'max_depth': 11, 'num_leaves': 223}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377141	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386187	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341295	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.35759	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314116	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336546	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292062	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.319998	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273439	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305581	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256618	training's F1_MACRO: 0.699797	valid_1's binary_logloss: 0.294192	valid_1's F1_MACRO: 0.656527
[7]	training's

[I 2021-03-08 12:39:27,038] Trial 58 finished with value: 0.8072608642556829 and parameters: {'n_estimators': 400, 'lambda_l1': 0.0003314729979408975, 'lambda_l2': 2.2719060404994207e-07, 'max_depth': 17, 'num_leaves': 189}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.382288	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.389104	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.3483	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.36161	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.322269	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.339212	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.301148	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.322412	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.283151	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.308684	valid_1's F1_MACRO: 0.458219
[6]	training's binary_logloss: 0.266822	training's F1_MACRO: 0.650368	valid_1's binary_logloss: 0.297167	valid_1's F1_MACRO: 0.633996
[7]	training's b

[I 2021-03-08 12:39:33,258] Trial 59 finished with value: 0.7962781854241677 and parameters: {'n_estimators': 400, 'lambda_l1': 2.2790640817526285e-05, 'lambda_l2': 0.6239647391279086, 'max_depth': 11, 'num_leaves': 208}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377141	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386198	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341294	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357599	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314114	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336555	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292059	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.32	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273436	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305585	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256614	training's F1_MACRO: 0.699797	valid_1's binary_logloss: 0.294193	valid_1's F1_MACRO: 0.656527
[7]	training's bi

[I 2021-03-08 12:39:37,783] Trial 60 finished with value: 0.8121855025159799 and parameters: {'n_estimators': 450, 'lambda_l1': 8.891323323867779e-08, 'lambda_l2': 1.4690088928258928e-05, 'max_depth': 17, 'num_leaves': 231}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377179	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386254	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341349	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357666	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314178	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336647	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292133	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.32011	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273516	training's F1_MACRO: 0.587892	valid_1's binary_logloss: 0.305696	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256705	training's F1_MACRO: 0.70154	valid_1's binary_logloss: 0.29448	valid_1's F1_MACRO: 0.658751
[7]	training's b

[I 2021-03-08 12:39:42,877] Trial 61 finished with value: 0.8102724132516879 and parameters: {'n_estimators': 400, 'lambda_l1': 0.00903888233896224, 'lambda_l2': 6.437069854068676e-05, 'max_depth': 20, 'num_leaves': 173}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377149	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386193	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341306	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357599	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.31413	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336558	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292078	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.32001	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273457	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305595	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256686	training's F1_MACRO: 0.70154	valid_1's binary_logloss: 0.294404	valid_1's F1_MACRO: 0.658751
[7]	training's b

[I 2021-03-08 12:39:47,540] Trial 62 finished with value: 0.7971603427172582 and parameters: {'n_estimators': 400, 'lambda_l1': 0.0025383873834461533, 'lambda_l2': 2.6631932857800922e-06, 'max_depth': 20, 'num_leaves': 199}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377143	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.3862	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341298	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357602	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314118	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336558	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292064	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320004	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273441	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305587	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256621	training's F1_MACRO: 0.699797	valid_1's binary_logloss: 0.294197	valid_1's F1_MACRO: 0.656527
[7]	training's 

[I 2021-03-08 12:39:52,402] Trial 63 finished with value: 0.803619203206487 and parameters: {'n_estimators': 400, 'lambda_l1': 0.0003007845257145316, 'lambda_l2': 0.00017586287221958816, 'max_depth': 23, 'num_leaves': 241}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.37714	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386198	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341294	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357599	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314114	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336555	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292059	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320001	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273436	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305585	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256614	training's F1_MACRO: 0.699797	valid_1's binary_logloss: 0.294194	valid_1's F1_MACRO: 0.656527
[7]	training's

[I 2021-03-08 12:39:57,481] Trial 64 finished with value: 0.8124693369778525 and parameters: {'n_estimators': 400, 'lambda_l1': 8.397105446728515e-06, 'lambda_l2': 7.003721267999506e-06, 'max_depth': 20, 'num_leaves': 214}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_col_wise=true` to remove the overhead.
[1]	training's binary_logloss: 0.37714	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386202	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341295	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357682	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314113	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336964	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.29206	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320347	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273412	training's F1_MACRO: 0.597253	valid_1's binary_logloss: 0.30582	valid_1's F1_MACRO: 0.559225
[6]	training's binary_logloss: 0.256582	training's F1_MACRO: 0.698571	valid_1's binary_logloss: 0.294659	valid_1's F1_MACRO: 0.646087
[7]	training's binary_logloss: 0.241872	training's F1_MACRO: 0.7534	valid_1's bi

[I 2021-03-08 12:40:02,431] Trial 65 finished with value: 0.7977122616384362 and parameters: {'n_estimators': 350, 'lambda_l1': 5.414235845580044e-07, 'lambda_l2': 1.0973974355838763e-06, 'max_depth': 17, 'num_leaves': 230}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377143	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386204	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341298	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357606	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.31412	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336563	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292067	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320015	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273445	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305598	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256629	training's F1_MACRO: 0.70154	valid_1's binary_logloss: 0.294386	valid_1's F1_MACRO: 0.658751
[7]	training's 

[I 2021-03-08 12:40:08,340] Trial 66 finished with value: 0.8027485808115311 and parameters: {'n_estimators': 400, 'lambda_l1': 0.0008771345301364326, 'lambda_l2': 1.4825140607488306e-08, 'max_depth': 20, 'num_leaves': 195}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.387458	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.390296	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.358609	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.363072	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.336682	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.342192	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.31919	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.32609	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.304686	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.312401	valid_1's F1_MACRO: 0.458219
[6]	training's binary_logloss: 0.292779	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.300892	valid_1's F1_MACRO: 0.458219
[7]	training's 

[I 2021-03-08 12:40:11,390] Trial 67 finished with value: 0.80317855407436 and parameters: {'n_estimators': 450, 'lambda_l1': 5.622870457318458, 'lambda_l2': 2.0708349444360593e-05, 'max_depth': 8, 'num_leaves': 221}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_col_wise=true` to remove the overhead.
[1]	training's binary_logloss: 0.377306	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386137	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341565	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357959	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314122	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336585	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.29219	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.32042	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273696	training's F1_MACRO: 0.587892	valid_1's binary_logloss: 0.307479	valid_1's F1_MACRO: 0.570399
[6]	training's binary_logloss: 0.256778	training's F1_MACRO: 0.696332	valid_1's binary_logloss: 0.296066	valid_1's F1_MACRO: 0.664954
[7]	training's binary_logloss: 0.242042	training's F1_MACRO: 0.749025	valid_1's

[I 2021-03-08 12:40:17,374] Trial 68 finished with value: 0.8029446101958749 and parameters: {'n_estimators': 400, 'lambda_l1': 2.760281285499115e-06, 'lambda_l2': 9.247185695683245e-08, 'max_depth': 14, 'num_leaves': 180}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.378392	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.387593	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.344102	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.360083	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.317636	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.338853	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.296048	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.32189	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.27818	training's F1_MACRO: 0.581485	valid_1's binary_logloss: 0.310096	valid_1's F1_MACRO: 0.574269
[6]	training's binary_logloss: 0.262528	training's F1_MACRO: 0.676806	valid_1's binary_logloss: 0.298879	valid_1's F1_MACRO: 0.650178
[7]	training's 

[I 2021-03-08 12:40:21,885] Trial 69 finished with value: 0.782539254060377 and parameters: {'n_estimators': 350, 'lambda_l1': 0.25015293426756563, 'lambda_l2': 0.08152666284384134, 'max_depth': 17, 'num_leaves': 115}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377148	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386208	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341303	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.35761	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314125	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336566	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292071	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320016	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273448	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305597	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256631	training's F1_MACRO: 0.70154	valid_1's binary_logloss: 0.294386	valid_1's F1_MACRO: 0.658751
[7]	training's 

[I 2021-03-08 12:40:26,385] Trial 70 finished with value: 0.8025320075674249 and parameters: {'n_estimators': 300, 'lambda_l1': 2.3280448698375408e-07, 'lambda_l2': 0.0006448351922340912, 'max_depth': 23, 'num_leaves': 248}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.385956	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.389265	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.35623	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.362394	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.333779	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.341607	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.315968	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.324861	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.300798	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.310871	valid_1's F1_MACRO: 0.458219
[6]	training's binary_logloss: 0.287174	training's F1_MACRO: 0.570722	valid_1's binary_logloss: 0.298892	valid_1's F1_MACRO: 0.559225
[7]	training's

[I 2021-03-08 12:40:31,248] Trial 71 finished with value: 0.7998854131369157 and parameters: {'n_estimators': 400, 'lambda_l1': 3.6152431420624294, 'lambda_l2': 5.2917920672940265e-05, 'max_depth': 8, 'num_leaves': 235}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.384387	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.388413	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.353602	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.36035	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.330474	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.339406	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.311734	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.322802	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.296254	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.30938	valid_1's F1_MACRO: 0.458219
[6]	training's binary_logloss: 0.281943	training's F1_MACRO: 0.571861	valid_1's binary_logloss: 0.296457	valid_1's F1_MACRO: 0.574269
[7]	training's 

[I 2021-03-08 12:40:36,013] Trial 72 finished with value: 0.8025320075674249 and parameters: {'n_estimators': 400, 'lambda_l1': 2.103406789349203, 'lambda_l2': 0.0001869418441382629, 'max_depth': 8, 'num_leaves': 46}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.381954	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.387866	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.349252	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.360244	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.325059	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.339187	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.304898	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.322915	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.288397	training's F1_MACRO: 0.522174	valid_1's binary_logloss: 0.309416	valid_1's F1_MACRO: 0.504867
[6]	training's binary_logloss: 0.27334	training's F1_MACRO: 0.648554	valid_1's binary_logloss: 0.297769	valid_1's F1_MACRO: 0.646397
[7]	training's

[I 2021-03-08 12:40:43,607] Trial 73 finished with value: 0.7955565866808079 and parameters: {'n_estimators': 400, 'lambda_l1': 0.9035275252246358, 'lambda_l2': 3.187978032119393e-05, 'max_depth': 8, 'num_leaves': 256}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.378514	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386196	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.343331	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.35808	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.316459	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.33732	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.295071	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320892	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.277026	training's F1_MACRO: 0.587711	valid_1's binary_logloss: 0.308231	valid_1's F1_MACRO: 0.559225
[6]	training's binary_logloss: 0.26103	training's F1_MACRO: 0.68701	valid_1's binary_logloss: 0.297084	valid_1's F1_MACRO: 0.657838
[7]	training's bi

[I 2021-03-08 12:40:50,657] Trial 74 finished with value: 0.7962781854241677 and parameters: {'n_estimators': 400, 'lambda_l1': 0.1373322176120909, 'lambda_l2': 1.0019285269575301e-05, 'max_depth': 11, 'num_leaves': 237}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.379226	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386708	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.345014	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.358196	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.318523	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.337163	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.297485	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.32074	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.279572	training's F1_MACRO: 0.564665	valid_1's binary_logloss: 0.308181	valid_1's F1_MACRO: 0.546523
[6]	training's binary_logloss: 0.262982	training's F1_MACRO: 0.686754	valid_1's binary_logloss: 0.296498	valid_1's F1_MACRO: 0.666828
[7]	training's

[I 2021-03-08 12:40:54,585] Trial 75 finished with value: 0.793418100224383 and parameters: {'n_estimators': 400, 'lambda_l1': 0.022177359859249096, 'lambda_l2': 4.758611288109284e-06, 'max_depth': 8, 'num_leaves': 210}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.382715	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.388726	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.350953	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.360605	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.326016	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.339806	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.306484	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.32301	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.289895	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.309859	valid_1's F1_MACRO: 0.458219
[6]	training's binary_logloss: 0.275093	training's F1_MACRO: 0.650506	valid_1's binary_logloss: 0.298124	valid_1's F1_MACRO: 0.647291
[7]	training's

[I 2021-03-08 12:40:57,171] Trial 76 finished with value: 0.8077621635953864 and parameters: {'n_estimators': 400, 'lambda_l1': 1.226889233925697, 'lambda_l2': 0.0003065768097145052, 'max_depth': 8, 'num_leaves': 226}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377967	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.385764	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.342343	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357379	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.315311	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336448	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.293049	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320154	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.274813	training's F1_MACRO: 0.592595	valid_1's binary_logloss: 0.306233	valid_1's F1_MACRO: 0.557986
[6]	training's binary_logloss: 0.258107	training's F1_MACRO: 0.694575	valid_1's binary_logloss: 0.294413	valid_1's F1_MACRO: 0.65427
[7]	training's

[I 2021-03-08 12:40:59,514] Trial 77 finished with value: 0.8055699766817721 and parameters: {'n_estimators': 400, 'lambda_l1': 9.447996066270856e-05, 'lambda_l2': 0.00011143315805722172, 'max_depth': 11, 'num_leaves': 92}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377306	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386153	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341565	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357895	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314121	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.33652	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292111	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320498	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273579	training's F1_MACRO: 0.590719	valid_1's binary_logloss: 0.307165	valid_1's F1_MACRO: 0.571061
[6]	training's binary_logloss: 0.256803	training's F1_MACRO: 0.697307	valid_1's binary_logloss: 0.295374	valid_1's F1_MACRO: 0.653363
[7]	training's

[I 2021-03-08 12:41:01,492] Trial 78 finished with value: 0.8033952726380711 and parameters: {'n_estimators': 400, 'lambda_l1': 9.515005492337354e-07, 'lambda_l2': 4.680003545718029e-05, 'max_depth': 14, 'num_leaves': 215}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377141	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386198	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341294	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357599	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314114	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336555	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.29206	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.32	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273436	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305585	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256614	training's F1_MACRO: 0.699797	valid_1's binary_logloss: 0.294193	valid_1's F1_MACRO: 0.656527
[7]	training's bin

[I 2021-03-08 12:41:04,822] Trial 79 finished with value: 0.8075117680048554 and parameters: {'n_estimators': 450, 'lambda_l1': 3.0637633980042496e-08, 'lambda_l2': 2.1806753705771922e-05, 'max_depth': 20, 'num_leaves': 205}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377917	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.385778	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.342168	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357371	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314955	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336467	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.293033	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.318877	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.274758	training's F1_MACRO: 0.600947	valid_1's binary_logloss: 0.306193	valid_1's F1_MACRO: 0.571061
[6]	training's binary_logloss: 0.257873	training's F1_MACRO: 0.702754	valid_1's binary_logloss: 0.294389	valid_1's F1_MACRO: 0.664025
[7]	training'

[I 2021-03-08 12:41:06,606] Trial 80 finished with value: 0.8064199607513316 and parameters: {'n_estimators': 400, 'lambda_l1': 2.6549366461740686e-05, 'lambda_l2': 0.0030478812442399344, 'max_depth': 11, 'num_leaves': 186}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_col_wise=true` to remove the overhead.
[1]	training's binary_logloss: 0.37714	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386202	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341294	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357603	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314115	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336559	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292061	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320009	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273438	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305593	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256571	training's F1_MACRO: 0.699797	valid_1's binary_logloss: 0.294173	valid_1's F1_MACRO: 0.656527
[7]	training's binary_logloss: 0.24193	training's F1_MACRO: 0.754337	valid_1's

[I 2021-03-08 12:41:12,346] Trial 81 finished with value: 0.8151905344757242 and parameters: {'n_estimators': 400, 'lambda_l1': 7.551790244674792e-06, 'lambda_l2': 9.367563317331578e-06, 'max_depth': 20, 'num_leaves': 213}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_col_wise=true` to remove the overhead.
[1]	training's binary_logloss: 0.37714	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386202	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341294	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357571	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314115	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336529	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292061	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320012	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273437	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305596	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256571	training's F1_MACRO: 0.699797	valid_1's binary_logloss: 0.294176	valid_1's F1_MACRO: 0.656527
[7]	training's binary_logloss: 0.241929	training's F1_MACRO: 0.754337	valid_1'

[I 2021-03-08 12:41:14,882] Trial 82 finished with value: 0.8151905344757242 and parameters: {'n_estimators': 400, 'lambda_l1': 7.559034723737904e-06, 'lambda_l2': 1.6412674932614022e-06, 'max_depth': 20, 'num_leaves': 242}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.37714	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386186	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341294	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.35764	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314112	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336926	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292058	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320331	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.27341	training's F1_MACRO: 0.597253	valid_1's binary_logloss: 0.305805	valid_1's F1_MACRO: 0.559225
[6]	training's binary_logloss: 0.256624	training's F1_MACRO: 0.698571	valid_1's binary_logloss: 0.294674	valid_1's F1_MACRO: 0.646087
[7]	training's b

[I 2021-03-08 12:41:19,006] Trial 83 finished with value: 0.7941553107575139 and parameters: {'n_estimators': 400, 'lambda_l1': 2.5016745233536207e-06, 'lambda_l2': 1.8310074938277586e-06, 'max_depth': 20, 'num_leaves': 223}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.37714	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386202	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341294	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357603	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314115	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336559	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292061	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320009	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273437	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305593	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256571	training's F1_MACRO: 0.699797	valid_1's binary_logloss: 0.294173	valid_1's F1_MACRO: 0.656527
[7]	training's

[I 2021-03-08 12:41:21,356] Trial 84 finished with value: 0.8162955112436978 and parameters: {'n_estimators': 400, 'lambda_l1': 7.63362169043262e-06, 'lambda_l2': 4.278524102732763e-06, 'max_depth': 20, 'num_leaves': 245}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.37714	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386202	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341294	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357603	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314115	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336559	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292061	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320009	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273437	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305593	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256571	training's F1_MACRO: 0.699797	valid_1's binary_logloss: 0.294173	valid_1's F1_MACRO: 0.656527
[7]	training's

[I 2021-03-08 12:41:23,538] Trial 85 finished with value: 0.8121855025159799 and parameters: {'n_estimators': 400, 'lambda_l1': 1.0727879929744043e-05, 'lambda_l2': 3.857068292364813e-06, 'max_depth': 20, 'num_leaves': 244}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.37714	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386186	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341293	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357561	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314114	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.33652	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292059	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.319999	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273435	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305584	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256613	training's F1_MACRO: 0.699797	valid_1's binary_logloss: 0.294193	valid_1's F1_MACRO: 0.656527
[7]	training's 

[I 2021-03-08 12:41:25,266] Trial 86 finished with value: 0.8119016733687897 and parameters: {'n_estimators': 400, 'lambda_l1': 6.348136659712369e-06, 'lambda_l2': 5.801358410731363e-07, 'max_depth': 20, 'num_leaves': 250}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377141	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386186	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341294	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357588	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314114	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336545	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292059	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.319995	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273436	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.30558	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256614	training's F1_MACRO: 0.699797	valid_1's binary_logloss: 0.29419	valid_1's F1_MACRO: 0.656527
[7]	training's 

[I 2021-03-08 12:41:27,330] Trial 87 finished with value: 0.7964560693387301 and parameters: {'n_estimators': 400, 'lambda_l1': 1.8620471744579813e-05, 'lambda_l2': 7.376366179426631e-06, 'max_depth': 20, 'num_leaves': 238}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377141	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386186	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341294	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.35759	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314114	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336546	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.29206	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.319997	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273436	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305582	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256614	training's F1_MACRO: 0.699797	valid_1's binary_logloss: 0.294192	valid_1's F1_MACRO: 0.656527
[7]	training's 

[I 2021-03-08 12:41:30,158] Trial 88 finished with value: 0.8143867911642417 and parameters: {'n_estimators': 400, 'lambda_l1': 5.5279878758198435e-05, 'lambda_l2': 9.354912072748612e-07, 'max_depth': 23, 'num_leaves': 232}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377141	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386202	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341294	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357603	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314115	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336559	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292061	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320009	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273438	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305593	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256572	training's F1_MACRO: 0.699797	valid_1's binary_logloss: 0.294174	valid_1's F1_MACRO: 0.656527
[7]	training'

[I 2021-03-08 12:41:31,668] Trial 89 finished with value: 0.7987966345806293 and parameters: {'n_estimators': 350, 'lambda_l1': 4.5349296480389503e-05, 'lambda_l2': 2.612107830875909e-07, 'max_depth': 23, 'num_leaves': 229}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377141	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386202	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341295	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357604	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314116	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336559	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292062	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320009	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273439	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305593	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256574	training's F1_MACRO: 0.699797	valid_1's binary_logloss: 0.294174	valid_1's F1_MACRO: 0.656527
[7]	training'

[I 2021-03-08 12:41:33,499] Trial 90 finished with value: 0.7984178357846123 and parameters: {'n_estimators': 400, 'lambda_l1': 0.00017406137834660433, 'lambda_l2': 5.24564757376984e-08, 'max_depth': 23, 'num_leaves': 256}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.37714	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386186	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341294	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.35764	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314112	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336925	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292058	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320338	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.27341	training's F1_MACRO: 0.597253	valid_1's binary_logloss: 0.305811	valid_1's F1_MACRO: 0.559225
[6]	training's binary_logloss: 0.256624	training's F1_MACRO: 0.698571	valid_1's binary_logloss: 0.294679	valid_1's F1_MACRO: 0.646087
[7]	training's b

[I 2021-03-08 12:41:35,627] Trial 91 finished with value: 0.7941553107575139 and parameters: {'n_estimators': 400, 'lambda_l1': 4.877313516748259e-06, 'lambda_l2': 7.753023043799042e-07, 'max_depth': 17, 'num_leaves': 247}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.37714	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386186	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341294	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357671	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314111	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336954	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292058	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320334	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.27341	training's F1_MACRO: 0.597253	valid_1's binary_logloss: 0.305808	valid_1's F1_MACRO: 0.559225
[6]	training's binary_logloss: 0.256625	training's F1_MACRO: 0.698571	valid_1's binary_logloss: 0.294676	valid_1's F1_MACRO: 0.646087
[7]	training's 

[I 2021-03-08 12:41:37,726] Trial 92 finished with value: 0.7953865250445313 and parameters: {'n_estimators': 400, 'lambda_l1': 1.3347672649135726e-06, 'lambda_l2': 1.5592562129538131e-06, 'max_depth': 23, 'num_leaves': 219}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377141	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386202	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341294	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357603	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314115	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336559	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292061	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320009	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273438	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305593	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256572	training's F1_MACRO: 0.699797	valid_1's binary_logloss: 0.294174	valid_1's F1_MACRO: 0.656527
[7]	training'

[I 2021-03-08 12:41:40,302] Trial 93 finished with value: 0.8058067423493368 and parameters: {'n_estimators': 400, 'lambda_l1': 6.094850290529186e-05, 'lambda_l2': 3.491314642348565e-06, 'max_depth': 20, 'num_leaves': 234}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.37714	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386186	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341294	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357588	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314114	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336545	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292059	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.319996	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273435	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305581	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256614	training's F1_MACRO: 0.699797	valid_1's binary_logloss: 0.29419	valid_1's F1_MACRO: 0.656527
[7]	training's 

[I 2021-03-08 12:41:42,226] Trial 94 finished with value: 0.8113686902075627 and parameters: {'n_estimators': 400, 'lambda_l1': 1.7015580593544035e-05, 'lambda_l2': 3.695798650247408e-07, 'max_depth': 17, 'num_leaves': 200}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.37714	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386198	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341294	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357678	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314111	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336961	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292058	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320339	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.27341	training's F1_MACRO: 0.597253	valid_1's binary_logloss: 0.305812	valid_1's F1_MACRO: 0.559225
[6]	training's binary_logloss: 0.256625	training's F1_MACRO: 0.698571	valid_1's binary_logloss: 0.29468	valid_1's F1_MACRO: 0.646087
[7]	training's b

[I 2021-03-08 12:41:45,778] Trial 95 finished with value: 0.807009447544516 and parameters: {'n_estimators': 400, 'lambda_l1': 4.990405356038471e-07, 'lambda_l2': 1.03996140137841e-06, 'max_depth': 20, 'num_leaves': 241}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_col_wise=true` to remove the overhead.
[1]	training's binary_logloss: 0.377142	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386215	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341296	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357616	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314118	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336571	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292065	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320018	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273443	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305599	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256578	training's F1_MACRO: 0.699797	valid_1's binary_logloss: 0.294181	valid_1's F1_MACRO: 0.656527
[7]	training's binary_logloss: 0.241937	training's F1_MACRO: 0.754337	valid_1

[I 2021-03-08 12:41:48,263] Trial 96 finished with value: 0.815797857271201 and parameters: {'n_estimators': 500, 'lambda_l1': 0.0005028959632686787, 'lambda_l2': 1.3566565493269724e-05, 'max_depth': 17, 'num_leaves': 225}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377143	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386204	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341297	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357606	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314119	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336562	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292066	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320014	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273444	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305597	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256578	training's F1_MACRO: 0.699797	valid_1's binary_logloss: 0.294179	valid_1's F1_MACRO: 0.656527
[7]	training'

[I 2021-03-08 12:41:50,544] Trial 97 finished with value: 0.8072608642556829 and parameters: {'n_estimators': 500, 'lambda_l1': 0.0006532204673800179, 'lambda_l2': 6.188664853894557e-06, 'max_depth': 17, 'num_leaves': 214}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377141	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386202	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341295	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357604	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314116	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336559	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292062	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320009	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.27344	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305591	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256574	training's F1_MACRO: 0.699797	valid_1's binary_logloss: 0.294174	valid_1's F1_MACRO: 0.656527
[7]	training's

[I 2021-03-08 12:41:52,577] Trial 98 finished with value: 0.803619203206487 and parameters: {'n_estimators': 500, 'lambda_l1': 0.00021474342185871082, 'lambda_l2': 1.7176444859076257e-08, 'max_depth': 17, 'num_leaves': 195}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377141	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386186	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341294	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.35759	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314114	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336546	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.29206	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.319997	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273436	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305582	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256615	training's F1_MACRO: 0.699797	valid_1's binary_logloss: 0.294192	valid_1's F1_MACRO: 0.656527
[7]	training's 

[I 2021-03-08 12:41:54,843] Trial 99 finished with value: 0.8159857523098872 and parameters: {'n_estimators': 450, 'lambda_l1': 6.530135294657251e-05, 'lambda_l2': 1.541190261000996e-05, 'max_depth': 17, 'num_leaves': 223}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377141	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386187	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341294	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357589	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314115	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336545	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292061	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.319997	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273437	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305582	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256616	training's F1_MACRO: 0.699797	valid_1's binary_logloss: 0.294191	valid_1's F1_MACRO: 0.656527
[7]	training'

[I 2021-03-08 12:41:57,347] Trial 100 finished with value: 0.7975298761741301 and parameters: {'n_estimators': 500, 'lambda_l1': 0.00012761244980912765, 'lambda_l2': 1.4452060250559272e-05, 'max_depth': 17, 'num_leaves': 225}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.385794	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.389797	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.354082	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.362017	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.329317	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.340084	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.309094	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.323044	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.29217	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.30914	valid_1's F1_MACRO: 0.458219
[6]	training's binary_logloss: 0.276767	training's F1_MACRO: 0.574599	valid_1's binary_logloss: 0.297799	valid_1's F1_MACRO: 0.574945
[7]	training's 

[I 2021-03-08 12:42:00,648] Trial 101 finished with value: 0.7914405491417731 and parameters: {'n_estimators': 450, 'lambda_l1': 0.0004583421558800282, 'lambda_l2': 1.8608761339012245, 'max_depth': 17, 'num_leaves': 205}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.37714	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386214	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341294	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357613	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314115	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336568	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292061	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320012	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273438	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305596	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256572	training's F1_MACRO: 0.699797	valid_1's binary_logloss: 0.294177	valid_1's F1_MACRO: 0.656527
[7]	training's

[I 2021-03-08 12:42:03,075] Trial 102 finished with value: 0.8031704066367469 and parameters: {'n_estimators': 450, 'lambda_l1': 3.454979067242396e-05, 'lambda_l2': 2.256559904439981e-06, 'max_depth': 17, 'num_leaves': 218}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377148	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386204	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341305	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357608	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314128	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336566	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292076	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320013	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273455	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305599	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256684	training's F1_MACRO: 0.70154	valid_1's binary_logloss: 0.29441	valid_1's F1_MACRO: 0.658751
[7]	training's 

[I 2021-03-08 12:42:05,262] Trial 103 finished with value: 0.8105430787449364 and parameters: {'n_estimators': 500, 'lambda_l1': 0.0022206145573053235, 'lambda_l2': 2.430605066789022e-05, 'max_depth': 17, 'num_leaves': 229}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377141	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386202	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341294	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357604	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314115	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336559	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292061	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.32001	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273439	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305593	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256572	training's F1_MACRO: 0.699797	valid_1's binary_logloss: 0.294175	valid_1's F1_MACRO: 0.656527
[7]	training's

[I 2021-03-08 12:42:08,046] Trial 104 finished with value: 0.8121855025159799 and parameters: {'n_estimators': 450, 'lambda_l1': 6.622904537963602e-05, 'lambda_l2': 1.5171578278633913e-05, 'max_depth': 20, 'num_leaves': 210}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.37714	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386186	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341294	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357671	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314111	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336954	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292058	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320334	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.27341	training's F1_MACRO: 0.597253	valid_1's binary_logloss: 0.305808	valid_1's F1_MACRO: 0.559225
[6]	training's binary_logloss: 0.256625	training's F1_MACRO: 0.698571	valid_1's binary_logloss: 0.294675	valid_1's F1_MACRO: 0.646087
[7]	training's 

[I 2021-03-08 12:42:10,687] Trial 105 finished with value: 0.8050942773517227 and parameters: {'n_estimators': 450, 'lambda_l1': 3.3469057489530135e-06, 'lambda_l2': 7.247231662007466e-08, 'max_depth': 20, 'num_leaves': 139}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377141	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386214	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341295	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357614	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314116	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336569	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292062	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320014	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273439	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305598	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256574	training's F1_MACRO: 0.699797	valid_1's binary_logloss: 0.294179	valid_1's F1_MACRO: 0.656527
[7]	training'

[I 2021-03-08 12:42:12,820] Trial 106 finished with value: 0.8091804705562355 and parameters: {'n_estimators': 400, 'lambda_l1': 0.00014340409922504693, 'lambda_l2': 1.0586003314757096e-05, 'max_depth': 17, 'num_leaves': 245}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377321	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386137	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341587	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357888	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314146	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336539	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292141	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320525	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273613	training's F1_MACRO: 0.590719	valid_1's binary_logloss: 0.307199	valid_1's F1_MACRO: 0.571061
[6]	training's binary_logloss: 0.256885	training's F1_MACRO: 0.697307	valid_1's binary_logloss: 0.295436	valid_1's F1_MACRO: 0.653363
[7]	training'

[I 2021-03-08 12:42:14,710] Trial 107 finished with value: 0.8102724132516879 and parameters: {'n_estimators': 400, 'lambda_l1': 0.004586493402890713, 'lambda_l2': 1.8024681924937525e-07, 'max_depth': 14, 'num_leaves': 233}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_col_wise=true` to remove the overhead.
[1]	training's binary_logloss: 0.377146	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386218	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341302	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.35762	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314126	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336576	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292073	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320024	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273452	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305607	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256637	training's F1_MACRO: 0.70154	valid_1's binary_logloss: 0.294392	valid_1's F1_MACRO: 0.658751
[7]	training's binary_logloss: 0.241942	training's F1_MACRO: 0.758215	valid_1's

[I 2021-03-08 12:42:17,224] Trial 108 finished with value: 0.7962781854241677 and parameters: {'n_estimators': 400, 'lambda_l1': 0.0016753912848988797, 'lambda_l2': 2.6359874649929857e-06, 'max_depth': 17, 'num_leaves': 161}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377142	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386203	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341296	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357605	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314118	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336561	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292065	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320013	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273443	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305595	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256577	training's F1_MACRO: 0.699797	valid_1's binary_logloss: 0.294178	valid_1's F1_MACRO: 0.656527
[7]	training'

[I 2021-03-08 12:42:19,180] Trial 109 finished with value: 0.8116459149104668 and parameters: {'n_estimators': 500, 'lambda_l1': 0.0005246310215840022, 'lambda_l2': 2.575800286461542e-08, 'max_depth': 23, 'num_leaves': 224}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.380781	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.38972	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.346774	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.361323	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.319785	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.340354	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.298194	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.32412	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.280066	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.310768	valid_1's F1_MACRO: 0.458219
[6]	training's binary_logloss: 0.264612	training's F1_MACRO: 0.668447	valid_1's binary_logloss: 0.299868	valid_1's F1_MACRO: 0.640691
[7]	training's 

[I 2021-03-08 12:42:21,646] Trial 110 finished with value: 0.7885173644401833 and parameters: {'n_estimators': 400, 'lambda_l1': 1.797217300985832e-06, 'lambda_l2': 0.43972989177596306, 'max_depth': 20, 'num_leaves': 254}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_col_wise=true` to remove the overhead.
[1]	training's binary_logloss: 0.37714	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386186	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341294	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357588	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314114	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336545	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292059	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.319996	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273435	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305581	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256614	training's F1_MACRO: 0.699797	valid_1's binary_logloss: 0.29419	valid_1's F1_MACRO: 0.656527
[7]	training's binary_logloss: 0.241987	training's F1_MACRO: 0.754337	valid_1's

[I 2021-03-08 12:42:24,302] Trial 111 finished with value: 0.807009447544516 and parameters: {'n_estimators': 400, 'lambda_l1': 6.468898686137136e-06, 'lambda_l2': 4.7418754250325315e-06, 'max_depth': 17, 'num_leaves': 220}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_col_wise=true` to remove the overhead.
[1]	training's binary_logloss: 0.377306	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386153	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341565	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357863	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.31412	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336491	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.29211	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320502	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273578	training's F1_MACRO: 0.590719	valid_1's binary_logloss: 0.307169	valid_1's F1_MACRO: 0.571061
[6]	training's binary_logloss: 0.256802	training's F1_MACRO: 0.697307	valid_1's binary_logloss: 0.295378	valid_1's F1_MACRO: 0.653363
[7]	training's binary_logloss: 0.241868	training's F1_MACRO: 0.75071	valid_1's 

[I 2021-03-08 12:42:26,180] Trial 112 finished with value: 0.8083505892508838 and parameters: {'n_estimators': 400, 'lambda_l1': 2.8337640667671826e-07, 'lambda_l2': 8.805740536528496e-06, 'max_depth': 14, 'num_leaves': 239}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.390985	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.393351	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.363881	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.366688	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.34397	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.347975	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.328377	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.332774	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.315885	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.32045	valid_1's F1_MACRO: 0.458219
[6]	training's binary_logloss: 0.305554	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.309977	valid_1's F1_MACRO: 0.458219
[7]	training's 

[I 2021-03-08 12:42:27,279] Trial 113 finished with value: 0.796806727185176 and parameters: {'n_estimators': 400, 'lambda_l1': 7.439383227080413e-07, 'lambda_l2': 1.8924874850274134e-05, 'max_depth': 20, 'num_leaves': 3}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377141	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386186	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341294	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357589	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314114	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336545	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.29206	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.319996	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273436	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305581	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256615	training's F1_MACRO: 0.699797	valid_1's binary_logloss: 0.294191	valid_1's F1_MACRO: 0.656527
[7]	training's

[I 2021-03-08 12:42:29,951] Trial 114 finished with value: 0.8110913765101313 and parameters: {'n_estimators': 400, 'lambda_l1': 1.3957594102106881e-05, 'lambda_l2': 3.642101128728046e-05, 'max_depth': 17, 'num_leaves': 232}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377141	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386215	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341295	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357615	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314116	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.33657	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292062	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320014	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273439	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305597	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256574	training's F1_MACRO: 0.699797	valid_1's binary_logloss: 0.294178	valid_1's F1_MACRO: 0.656527
[7]	training's

[I 2021-03-08 12:42:32,591] Trial 115 finished with value: 0.8132839622476928 and parameters: {'n_estimators': 400, 'lambda_l1': 2.994037467728163e-05, 'lambda_l2': 7.25570686671371e-05, 'max_depth': 20, 'num_leaves': 212}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.377311	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.38613	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341573	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357876	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314129	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336504	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.29212	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320492	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273589	training's F1_MACRO: 0.590719	valid_1's binary_logloss: 0.30716	valid_1's F1_MACRO: 0.571061
[6]	training's binary_logloss: 0.256859	training's F1_MACRO: 0.697307	valid_1's binary_logloss: 0.295398	valid_1's F1_MACRO: 0.653363
[7]	training's b

[I 2021-03-08 12:42:35,124] Trial 116 finished with value: 0.8116178329719006 and parameters: {'n_estimators': 400, 'lambda_l1': 0.0013219856570511352, 'lambda_l2': 0.00011776697663845844, 'max_depth': 14, 'num_leaves': 227}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.37714	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386186	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341294	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357667	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314111	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.336951	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292058	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320335	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.27341	training's F1_MACRO: 0.597253	valid_1's binary_logloss: 0.305808	valid_1's F1_MACRO: 0.559225
[6]	training's binary_logloss: 0.256624	training's F1_MACRO: 0.698571	valid_1's binary_logloss: 0.294676	valid_1's F1_MACRO: 0.646087
[7]	training's 

[I 2021-03-08 12:42:37,576] Trial 117 finished with value: 0.8033952726380711 and parameters: {'n_estimators': 400, 'lambda_l1': 1.9979166611300214e-07, 'lambda_l2': 1.4539706328759724e-06, 'max_depth': 17, 'num_leaves': 250}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.383642	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.389102	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.350934	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.361025	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.325806	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.340337	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.304353	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.324055	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.286642	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.310285	valid_1's F1_MACRO: 0.458219
[6]	training's binary_logloss: 0.271172	training's F1_MACRO: 0.650188	valid_1's binary_logloss: 0.298641	valid_1's F1_MACRO: 0.637356
[7]	training'

[I 2021-03-08 12:42:40,313] Trial 118 finished with value: 0.7973458964115503 and parameters: {'n_estimators': 450, 'lambda_l1': 7.247105025012235e-06, 'lambda_l2': 0.9451192336246578, 'max_depth': 20, 'num_leaves': 239}. Best is trial 42 with value: 0.8212005983952129.


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	training's binary_logloss: 0.37714	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.386198	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	training's binary_logloss: 0.341293	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.357572	valid_1's F1_MACRO: 0.458219
[3]	training's binary_logloss: 0.314114	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.33653	valid_1's F1_MACRO: 0.458219
[4]	training's binary_logloss: 0.292059	training's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.320004	valid_1's F1_MACRO: 0.458219
[5]	training's binary_logloss: 0.273435	training's F1_MACRO: 0.588836	valid_1's binary_logloss: 0.305589	valid_1's F1_MACRO: 0.558604
[6]	training's binary_logloss: 0.256614	training's F1_MACRO: 0.699797	valid_1's binary_logloss: 0.294197	valid_1's F1_MACRO: 0.656527
[7]	training's 

[I 2021-03-08 12:42:42,643] Trial 119 finished with value: 0.8140899260893355 and parameters: {'n_estimators': 400, 'lambda_l1': 9.730822454156799e-08, 'lambda_l2': 5.012064810607244e-06, 'max_depth': 17, 'num_leaves': 244}. Best is trial 42 with value: 0.8212005983952129.


Number of finished trials: 120
Best trial:
  Value: 0.8212005983952129
  Params: 
    n_estimators: 400
    lambda_l1: 8.379812902948931e-07
    lambda_l2: 9.52501649951279e-05
    max_depth: 20
    num_leaves: 208


In [94]:
trial.params

{'n_estimators': 400,
 'lambda_l1': 0.0016108530283158262,
 'lambda_l2': 8.609100631927998,
 'max_depth': 17,
 'num_leaves': 23}

In [33]:
trial.params

{'n_estimators': 400,
 'lambda_l1': 8.379812902948931e-07,
 'lambda_l2': 9.52501649951279e-05,
 'max_depth': 20,
 'num_leaves': 208}

In [87]:
# trial.distributions

In [29]:
# optuna.visualization.plot_optimization_history(study)

In [34]:
list(map(lambda t: t.values, study.get_trials()))

[[0.807009447544516],
 [0.8003705845248108],
 [0.81677257483596],
 [0.8050942773517227],
 [0.8097304744682683],
 [0.807009447544516],
 [0.8113686902075627],
 [0.8197518825622048],
 [0.81299365072143],
 [0.7978930316994833],
 [0.8077621635953864],
 [0.8086079457961195],
 [0.7986079809094524],
 [0.788271832071769],
 [0.8046156880230484],
 [0.8042493152596779],
 [0.8100015491329731],
 [0.7957248274749901],
 [0.8105430787449364],
 [0.8204229930775999],
 [0.8025320075674249],
 [0.7980331427791445],
 [0.8037845517954016],
 [0.8037845517954016],
 [0.8138649520526757],
 [0.7915823301729341],
 [0.8102724132516879],
 [0.7978930316994833],
 [0.8025320075674249],
 [0.7977122616384362],
 [0.8102724132516879],
 [0.8122001569438748],
 [0.8127531937550225],
 [0.798226217267668],
 [0.8001653746770025],
 [0.7990971781933142],
 [0.8023143873375257],
 [0.803619203206487],
 [0.8033952726380711],
 [0.8014491465246933],
 [0.7944852126579516],
 [0.7986079809094524],
 [0.8212005983952129],
 [0.8025320075674249

In [35]:
study.get_trials()[18]

FrozenTrial(number=18, values=[0.8105430787449364], datetime_start=datetime.datetime(2021, 3, 8, 12, 36, 12, 46760), datetime_complete=datetime.datetime(2021, 3, 8, 12, 36, 16, 727691), params={'n_estimators': 400, 'lambda_l1': 1.278535014544274e-05, 'lambda_l2': 9.693557882425107, 'max_depth': 11, 'num_leaves': 193}, distributions={'n_estimators': IntUniformDistribution(high=500, low=300, step=50), 'lambda_l1': LogUniformDistribution(high=10.0, low=1e-08), 'lambda_l2': LogUniformDistribution(high=10.0, low=1e-08), 'max_depth': IntUniformDistribution(high=23, low=8, step=3), 'num_leaves': IntUniformDistribution(high=256, low=2, step=1)}, user_attrs={}, system_attrs={}, intermediate_values={}, trial_id=18, state=TrialState.COMPLETE, value=None)

In [36]:
fit_params = {
    "eval_set":[(X_train, y_train), (X_val, y_val)], 
    "early_stopping_rounds":15,
    "eval_metric":[lambda y_true, y_pred: ("F1_MACRO", metric(y_true, np.round(y_pred)), True)],
    "feature_name":X_train.columns.tolist(),
    "categorical_feature":["Month", "TrafficType", "Browser", "SpecialDay", "OperatingSystems", "Region", "VisitorType", "Weekend"]
}
    
gbm = lgb.LGBMClassifier(**trial.params, verbose=0)
    
gbm.fit(X, y, **fit_params)

New categorical_feature is ['Browser', 'Month', 'OperatingSystems', 'Region', 'SpecialDay', 'TrafficType', 'VisitorType', 'Weekend']
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.




[1]	valid_0's binary_logloss: 0.377293	valid_0's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.37694	valid_1's F1_MACRO: 0.458219
Training until validation scores don't improve for 15 rounds
[2]	valid_0's binary_logloss: 0.341832	valid_0's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.340227	valid_1's F1_MACRO: 0.458219
[3]	valid_0's binary_logloss: 0.314632	valid_0's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.313069	valid_1's F1_MACRO: 0.458219
[4]	valid_0's binary_logloss: 0.29219	valid_0's F1_MACRO: 0.458158	valid_1's binary_logloss: 0.290113	valid_1's F1_MACRO: 0.458219
[5]	valid_0's binary_logloss: 0.272547	valid_0's F1_MACRO: 0.591658	valid_1's binary_logloss: 0.270889	valid_1's F1_MACRO: 0.605727
[6]	valid_0's binary_logloss: 0.255767	valid_0's F1_MACRO: 0.691551	valid_1's binary_logloss: 0.253714	valid_1's F1_MACRO: 0.695097
[7]	valid_0's binary_logloss: 0.241082	valid_0's F1_MACRO: 0.745905	valid_1's binary_logloss: 0.23945	valid_1's F1_MACRO: 0.750263
[8]	valid_0's bina

LGBMClassifier(lambda_l1=8.379812902948931e-07, lambda_l2=9.52501649951279e-05,
               max_depth=20, n_estimators=400, num_leaves=208, verbose=0)

In [37]:
metric(y, gbm.predict(X))

0.9993347953807932

In [38]:
ids = test.id
test.drop(columns=["id"], inplace=True)

In [39]:
result = gbm.predict(test)

In [40]:
from datetime import datetime
get_date = lambda : datetime.now().strftime("%Y%m%d_%H%M%S")

In [41]:
pd.DataFrame({"id":ids, "revenue":result}).to_csv(f'../data/results/{get_date()}_lgb_opt.csv', index=False)

In [42]:
gbm._Booster.save_model(f'../data/results/{get_date()}_lgb_opt_model.txt')

<lightgbm.basic.Booster at 0x7f72b6852a90>