# LightGBM Hyperparameter Sweep 20210922
Integrating some enhancements introduced in the XGBoost version, and implementing the frequent-serialization approach.

# Setup

In [1]:
# two manual flags (ex-config)
colab = False
gpu_available = False

In [2]:
# basic imports
from pathlib import Path
import os
import math
from datetime import datetime
import random
import multiprocessing
import pickle

In [3]:
%matplotlib inline
%config Completer.use_jedi = False
os.environ['WANDB_NOTEBOOK_NAME'] = f"sweep_lightgbm_{datetime.now().strftime('%Y%m%d')}.ipynb"

In [4]:
# handle Google Colab-specific library installation/updating
if colab:
    # much of the below inspired by or cribbed from the May 2021 Kaggle Tabular Playground winner, at 
    # https://colab.research.google.com/gist/academicsuspect/0aac7bd6e506f5f70295bfc9a3dc2250/tabular-may-baseline.ipynb?authuser=1#scrollTo=LJoVKJb5wN0L
    
    # Kaggle API for downloading the datasets
    !pip install --upgrade -q kaggle

    # weights and biases
    !pip install -qqqU wandb
    
    # Optuna for parameter search
    !pip install -q optuna

    # !pip install --upgrade xgboost

    # upgrade sklearn
    !pip install --upgrade scikit-learn

    # !pip install category_encoders
    # !pip install catboost
    !pip install --upgrade -q lightgbm

    # lighgbm gpu compatible
    # !git clone --recursive https://github.com/Microsoft/LightGBM
    # ! cd LightGBM && rm -rf build && mkdir build && cd build && cmake -DUSE_GPU=1 ../../LightGBM && make -j4 && cd ../python-package && python3 setup.py install --precompile --gpu;
    
    # # this part is from https://github.com/rapidsai/gputreeshap/issues/24
    # !pip install cmake --upgrade
    # # !pip install sklearn --upgrade
    # !git clone --recursive https://github.com/dmlc/xgboost
    # %cd /content/xgboost
    # !mkdir build
    # %cd build
    # !cmake .. -DUSE_CUDA=ON
    # !make -j4
    # %cd /content/xgboost/python-package
    # !python setup.py install --use-cuda --use-nccl
    # !/opt/bin/nvidia-smi
    # !pip install shap
    

Now, non-stdlib imports

In [5]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
from tqdm.notebook import tqdm

# general ML tooling
from sklearn.model_selection import train_test_split, StratifiedKFold, KFold
from sklearn.metrics import log_loss, roc_auc_score
import wandb
from optuna.integration.wandb import WeightsAndBiasesCallback
# from wandb.xgboost import wandb_callback
# from wandb.lightgbm import wandb_callback
# from sklearn.impute import KNNImputer, StandardImputer
# import timm

import seaborn as sns

# from catboost import CatBoostClassifier
# from xgboost import XGBClassifier
from lightgbm import LGBMClassifier
# from sklearn.ensemble import RandomForestRegressor
from sklearn.preprocessing import MaxAbsScaler, StandardScaler, MinMaxScaler, RobustScaler, PolynomialFeatures
# from sklearn.feature_selection import SelectKBest, f_regression
from joblib import dump, load
# feature engineering tools
# from sklearn.feature_selection import mutual_info_regression
# import featuretools as ft


from optuna.samplers import TPESampler
import optuna
# import catboost
from sklearn.utils import resample
import sklearn.metrics

Now, datapath setup

In [6]:
# # This is the code for reading the train.csv and converting it to a .feather file
# df = pd.read_csv(datapath/'train.csv', index_col='id', low_memory=False)
# df.index.name = None
# df.to_feather(path='./dataset_df.feather')

In [7]:
if colab:
    # mount Google Drive
    from google.colab import drive
    drive.mount('/content/drive')
    
    # handling datapath
    datapath = Path('/content/drive/MyDrive/kaggle/tabular_playgrounds/sep2021/')
    
else:
    # if on local machine
    datapath = Path('/media/sf/easystore/kaggle_data/tabular_playgrounds/sep2021/')    
    


In [8]:

# n_trials = int(1000)
SEED = 42

In [9]:
# Function to seed everything
def seed_everything(seed):
    random.seed(seed)
    np.random.seed(seed)
    os.environ['PYTHONHASHSEED'] = str(seed)
seed_everything(SEED)

## Ex-Model Config

In [10]:
# meta-config for preprocessing and cross-validation, but NOT for model parameters
# in the sweep version, this includes both ex-model parameters and defaults for model parameters
exmodel_config = {
    # model config
    "library": 'lightgbm',
#     "model": XGBClassifier,
#     "n_estimators": 100, 
#     "max_depth": 3,
#     "learning_rate": 0.1,
#     "test_size": 0.2,
#     "reg_lambda": None, 
    "scaler": "sklearn.preprocessing.StandardScaler()", # TODO: experiment with others (but imputation may be slow)
    "scale_b4_impute": False,
    "imputer": "sklearn.impute.SimpleImputer(strategy='median', add_indicator=True)",
    "knn_imputer_n_neighbors": None, # None if a different imputer is used
#     "feature_selector": SelectKBest,
#     "k_best": 80,
#     "feature_selection_scoring": f_regression,
    'random_state': SEED,
    'optuna': True,
    'optuna_trials': 100,
#     'subsample': 1,
#     'cross_val_strategy': None, # None for holdout, or the relevant sklearn class
#     'kfolds': 1, # if 1, that means just doing holdout
#     'test_size': 0.2,
    # these are XGBoost default (my choice) params 
#     "tree_method": "auto", # set to 'gpu_hist' to try GPU if available
#     "booster": 'gbtree', # dart may be marginally better, but will opt for this quicker approach as a default
#     "n_estimators": 200, 
#     "max_depth": 3,
#     "learning_rate": 0.1,
#     "n_jobs": -1,
#     "verbosity": 1,
#     "subsample": 1,
#     'features_created': False,
#     'feature_creator': None,
}

wandb_kwargs = {
    # wandb config
    'name': f"{os.environ['WANDB_NOTEBOOK_NAME'][:-6]}_{datetime.now().strftime('%H%M%S')}", # just removes the .ipynb extension, leaving the notebook filename's stem
    'project': '202109_Kaggle_tabular_playground',
    'tags': ['sweep'],
    'notes': "Integrating some enhancements introduced in the XGBoost version, and implementing the frequent-serialization approach.",
    'config': exmodel_config,
}

## Data Setup

**TODO** Write some conditional logic here to automate it -- possibly as part of a sklearn.*pipeline

In [11]:
X_source = 'X_NaNcounts_SummaryStats_imputed-Median-wIndicators-StandardScaled.feather'
X_train = pd.read_feather(datapath/X_source) 
y_train = load(datapath/'y.joblib')    
# X.index.name = 'id'
# y.index.name = 'id'
X = np.array(X_train)
y = np.array(y_train)

del X_train, y_train

In [12]:
exmodel_config['feature_count'] = X.shape[1]
exmodel_config['feature_generator'] = "Summary statistics"
exmodel_config['X_source'] = X_source

# Experiment setup

In [13]:
# wandb_kwargs = {
#     # wandb config:
#     'name': f"{os.environ['WANDB_NOTEBOOK_NAME'][:-6]}_{datetime.now().strftime('%H%M%S')}", # just removes the .ipynb extension, leaving the notebook filename's stem
#     'project': '202109_Kaggle_tabular_playground',
#     'tags': ['sweep'],
#     'notes': "Sweep for CatBoost using Optuna",
#     'config': exmodel_config,
# }

In [14]:
# originally from https://www.kaggle.com/satorushibata/optimize-catboost-hyperparameter-with-optuna-gpu
def objective(trial):
    # split the (original Kaggle training) data into partitions
    # if study.best_trial:
    #     print("Dumping best params, which are:")
    #     print(str(study.best_trial.params))
    #     dump(study.best_trial.params, filename=datapath/'optuna_catboost_best_20210920.joblib')
       
    # else:
    #     print("No best study yet")
    X_train, X_valid, y_train, y_valid = train_test_split(X, y, test_size=0.33, random_state=int(SEED), shuffle=True)
    # create wrappers for the training and validation partitions
    # train_pool = catboost.Pool(X_train, y_train)
    # valid_pool = catboost.Pool(X_valid, y_valid)
    
    # experimental parameters
    params = {
        'n_estimators': trial.suggest_int('n_estimators', 900, 4500),
        'max_depth' : trial.suggest_int('depth', 3, 12),                                       
        'learning_rate' : trial.suggest_loguniform('learning_rate', 0.001, 0.4),               
        'reg_alpha': trial.suggest_loguniform('reg_alpha', 0.001, 30),
        'reg_lambda': trial.suggest_loguniform('reg_lambda', 0.001, 30),
        'subsample': trial.suggest_uniform('subsample', 0.5, 1), # aka bagging_fraction
        'boosting_type': trial.suggest_categorical('boosting_type', ['gbdt', 'dart', 'goss']),
        'min_child_samples': trial.suggest_int('min_child_samples', 4, 75),
        'num_leaves': trial.suggest_int('num_leaves', 50, 250),
        'colsample_bytree': trial.suggest_uniform('colsample_bytree', 0.5, 1), # aka feature_fraction
    }  

    # instantiate the model, with some parameters locked in, and experimnental ones passed via splat 
    model = LGBMClassifier(
        objective='binary',
        random_state=SEED,
        n_jobs=-1,
        eval_metric='auc',
        device_type='cpu',
#         max_bin=63,
        **params
    )       

    model.fit(X_train, y_train)
    # generate predictions
    preds = model.predict_proba(X_valid)[:,1]
    # rounds to the nearest integer, and the nearest even in case of _.5s

    # Evaluation
    valid_auc = roc_auc_score(y_valid, preds)
    print('ROC AUC Score of XGBoost =', valid_auc)
    wandb.log({'valid_auc': valid_auc,
              })

    return valid_auc

In [15]:
wandbc = WeightsAndBiasesCallback(wandb_kwargs=wandb_kwargs)

  wandbc = WeightsAndBiasesCallback(wandb_kwargs=wandb_kwargs)
[34m[1mwandb[0m: Currently logged in as: [33mhushifang[0m (use `wandb login --relogin` to force relogin)


In [16]:
study = optuna.create_study(direction = "maximize", 
                            sampler = TPESampler(seed=int(SEED)), 
                            study_name='lightgbm_20210922')

# study = load(datapath/f'optuna_lightgbm_study_5trials_20210922.joblib')


[32m[I 2021-09-23 05:37:41,320][0m A new study created in memory with name: lightgbm_20210922[0m


In [17]:

for x in range(1,21):
    study.optimize(objective, n_trials = 5, callbacks = [wandbc]) #n_jobs = multiprocessing.cpu_count())
    print(f"{x*5} trials complete")
    dump(study, filename=datapath/f'optuna_lightgbm_study_{x*5}trials_20210922.joblib')
    dump(study.best_trial.params, filename=datapath/f'optuna_lightgbm_study_best-thru-{x*5}trials_20210922.joblib')



[32m[I 2021-09-23 05:49:06,766][0m Trial 0 finished with value: 0.8109411190089265 and parameters: {'n_estimators': 2248, 'depth': 12, 'learning_rate': 0.0802956743641955, 'reg_alpha': 0.4789240251631179, 'reg_lambda': 0.004994757081068292, 'subsample': 0.5779972601681014, 'boosting_type': 'dart', 'min_child_samples': 54, 'num_leaves': 54, 'colsample_bytree': 0.9849549260809971}. Best is trial 0 with value: 0.8109411190089265.[0m


ROC AUC Score of XGBoost = 0.8109411190089265


[32m[I 2021-09-23 05:51:26,485][0m Trial 1 finished with value: 0.8132354513292246 and parameters: {'n_estimators': 3897, 'depth': 5, 'learning_rate': 0.002972483637079397, 'reg_alpha': 0.0066240595682091315, 'reg_lambda': 0.023021277110080198, 'subsample': 0.762378215816119, 'boosting_type': 'goss', 'min_child_samples': 14, 'num_leaves': 108, 'colsample_bytree': 0.6831809216468459}. Best is trial 1 with value: 0.8132354513292246.[0m


ROC AUC Score of XGBoost = 0.8132354513292246


[32m[I 2021-09-23 06:00:33,535][0m Trial 2 finished with value: 0.8130550071111211 and parameters: {'n_estimators': 2542, 'depth': 10, 'learning_rate': 0.003307982168695265, 'reg_alpha': 0.20058106556780586, 'reg_lambda': 0.4490677404109781, 'subsample': 0.5232252063599989, 'boosting_type': 'gbdt', 'min_child_samples': 72, 'num_leaves': 244, 'colsample_bytree': 0.9041986740582306}. Best is trial 1 with value: 0.8132354513292246.[0m


ROC AUC Score of XGBoost = 0.8130550071111211


[32m[I 2021-09-23 06:05:26,893][0m Trial 3 finished with value: 0.8123773749812568 and parameters: {'n_estimators': 1996, 'depth': 3, 'learning_rate': 0.06031361827702156, 'reg_alpha': 0.09345791438428568, 'reg_lambda': 0.0035186816415472676, 'subsample': 0.7475884550556351, 'boosting_type': 'dart', 'min_child_samples': 51, 'num_leaves': 112, 'colsample_bytree': 0.7600340105889054}. Best is trial 1 with value: 0.8132354513292246.[0m


ROC AUC Score of XGBoost = 0.8123773749812568


[32m[I 2021-09-23 06:12:33,315][0m Trial 4 finished with value: 0.8103583447917344 and parameters: {'n_estimators': 2868, 'depth': 4, 'learning_rate': 0.3333629787709382, 'reg_alpha': 2.953681335681259, 'reg_lambda': 16.078690668199, 'subsample': 0.9474136752138245, 'boosting_type': 'dart', 'min_child_samples': 18, 'num_leaves': 59, 'colsample_bytree': 0.6626651653816322}. Best is trial 1 with value: 0.8132354513292246.[0m


ROC AUC Score of XGBoost = 0.8103583447917344
5 trials complete


[32m[I 2021-09-23 06:20:34,139][0m Trial 5 finished with value: 0.8126073824703403 and parameters: {'n_estimators': 2299, 'depth': 5, 'learning_rate': 0.14335891845548843, 'reg_alpha': 0.039557414824905594, 'reg_lambda': 0.018104138546410155, 'subsample': 0.7713480415791243, 'boosting_type': 'dart', 'min_child_samples': 75, 'num_leaves': 205, 'colsample_bytree': 0.5993578407670862}. Best is trial 1 with value: 0.8132354513292246.[0m


ROC AUC Score of XGBoost = 0.8126073824703403


[32m[I 2021-09-23 06:21:39,916][0m Trial 6 finished with value: 0.8044614976683523 and parameters: {'n_estimators': 919, 'depth': 11, 'learning_rate': 0.06906932535689181, 'reg_alpha': 1.8359188752396374, 'reg_lambda': 2.838382119353614, 'subsample': 0.5370223258670452, 'boosting_type': 'goss', 'min_child_samples': 48, 'num_leaves': 116, 'colsample_bytree': 0.5317791751430119}. Best is trial 1 with value: 0.8132354513292246.[0m


ROC AUC Score of XGBoost = 0.8044614976683523


[32m[I 2021-09-23 06:23:00,972][0m Trial 7 finished with value: 0.8043960772297594 and parameters: {'n_estimators': 2019, 'depth': 6, 'learning_rate': 0.07915512627905745, 'reg_alpha': 0.715191107817528, 'reg_lambda': 9.37905380401463, 'subsample': 0.7361074625809747, 'boosting_type': 'goss', 'min_child_samples': 44, 'num_leaves': 204, 'colsample_bytree': 0.7468977981821954}. Best is trial 1 with value: 0.8132354513292246.[0m


ROC AUC Score of XGBoost = 0.8043960772297594


[32m[I 2021-09-23 06:26:38,121][0m Trial 8 finished with value: 0.8104377949525725 and parameters: {'n_estimators': 2782, 'depth': 7, 'learning_rate': 0.0011645069711410827, 'reg_alpha': 0.0030411861290916427, 'reg_lambda': 0.0013826500550053445, 'subsample': 0.8182052056318903, 'boosting_type': 'goss', 'min_child_samples': 21, 'num_leaves': 132, 'colsample_bytree': 0.8777755692715243}. Best is trial 1 with value: 0.8132354513292246.[0m


ROC AUC Score of XGBoost = 0.8104377949525725


[32m[I 2021-09-23 06:29:36,875][0m Trial 9 finished with value: 0.8043104238542168 and parameters: {'n_estimators': 1723, 'depth': 3, 'learning_rate': 0.005674801345779974, 'reg_alpha': 0.005269959187361842, 'reg_lambda': 14.533463349735559, 'subsample': 0.9040601897822085, 'boosting_type': 'dart', 'min_child_samples': 17, 'num_leaves': 229, 'colsample_bytree': 0.7696711209578253}. Best is trial 1 with value: 0.8132354513292246.[0m


ROC AUC Score of XGBoost = 0.8043104238542168
10 trials complete


[32m[I 2021-09-23 06:37:57,448][0m Trial 10 finished with value: 0.8152310287561186 and parameters: {'n_estimators': 4296, 'depth': 9, 'learning_rate': 0.013146994020643898, 'reg_alpha': 14.927150287453346, 'reg_lambda': 0.060027906631665434, 'subsample': 0.650282411524673, 'boosting_type': 'gbdt', 'min_child_samples': 4, 'num_leaves': 164, 'colsample_bytree': 0.5061555847824689}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.8152310287561186


[32m[I 2021-09-23 06:48:37,499][0m Trial 11 finished with value: 0.8147020969270298 and parameters: {'n_estimators': 4380, 'depth': 9, 'learning_rate': 0.013670896348907332, 'reg_alpha': 9.7063443785187, 'reg_lambda': 0.05768852026747195, 'subsample': 0.659143125062404, 'boosting_type': 'gbdt', 'min_child_samples': 4, 'num_leaves': 165, 'colsample_bytree': 0.5024954066104743}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.8147020969270298


[32m[I 2021-09-23 06:59:56,835][0m Trial 12 finished with value: 0.8145904386220185 and parameters: {'n_estimators': 4394, 'depth': 9, 'learning_rate': 0.016580556306530374, 'reg_alpha': 16.60428022989559, 'reg_lambda': 0.14834757978345897, 'subsample': 0.6394987085406625, 'boosting_type': 'gbdt', 'min_child_samples': 5, 'num_leaves': 168, 'colsample_bytree': 0.5014758171629863}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.8145904386220185


[32m[I 2021-09-23 07:08:00,025][0m Trial 13 finished with value: 0.8150837572828855 and parameters: {'n_estimators': 3631, 'depth': 8, 'learning_rate': 0.016475802815567774, 'reg_alpha': 29.294526487900082, 'reg_lambda': 0.1260044241770458, 'subsample': 0.6550186135528008, 'boosting_type': 'gbdt', 'min_child_samples': 4, 'num_leaves': 167, 'colsample_bytree': 0.5647970910674268}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.8150837572828855


[32m[I 2021-09-23 07:15:11,779][0m Trial 14 finished with value: 0.8136765937268259 and parameters: {'n_estimators': 3597, 'depth': 8, 'learning_rate': 0.028446408092945765, 'reg_alpha': 28.43385875316184, 'reg_lambda': 0.9639028133940841, 'subsample': 0.6531935324498377, 'boosting_type': 'gbdt', 'min_child_samples': 30, 'num_leaves': 186, 'colsample_bytree': 0.5905972980483933}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.8136765937268259
15 trials complete


[32m[I 2021-09-23 07:21:36,697][0m Trial 15 finished with value: 0.814993070286495 and parameters: {'n_estimators': 3466, 'depth': 8, 'learning_rate': 0.010119976084128488, 'reg_alpha': 5.162661397711135, 'reg_lambda': 0.1601045105396843, 'subsample': 0.610558729370589, 'boosting_type': 'gbdt', 'min_child_samples': 29, 'num_leaves': 146, 'colsample_bytree': 0.5861438988850267}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.814993070286495


[32m[I 2021-09-23 07:27:34,393][0m Trial 16 finished with value: 0.8139733282307049 and parameters: {'n_estimators': 3266, 'depth': 10, 'learning_rate': 0.032219069785396424, 'reg_alpha': 27.080546923262805, 'reg_lambda': 0.631703656793269, 'subsample': 0.7152260414518053, 'boosting_type': 'gbdt', 'min_child_samples': 33, 'num_leaves': 91, 'colsample_bytree': 0.6601698676289585}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.8139733282307049


[32m[I 2021-09-23 07:34:41,644][0m Trial 17 finished with value: 0.814784956755386 and parameters: {'n_estimators': 4030, 'depth': 7, 'learning_rate': 0.005808401416914259, 'reg_alpha': 1.3660854168362042, 'reg_lambda': 0.03984202321271438, 'subsample': 0.8363798754988963, 'boosting_type': 'gbdt', 'min_child_samples': 9, 'num_leaves': 181, 'colsample_bytree': 0.5607128538634181}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.814784956755386


[32m[I 2021-09-23 07:42:19,273][0m Trial 18 finished with value: 0.8126163076987853 and parameters: {'n_estimators': 3876, 'depth': 9, 'learning_rate': 0.030628330142560105, 'reg_alpha': 5.9993864159650645, 'reg_lambda': 0.009488630156757523, 'subsample': 0.6897497590842712, 'boosting_type': 'gbdt', 'min_child_samples': 62, 'num_leaves': 145, 'colsample_bytree': 0.6285849284333573}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.8126163076987853


[32m[I 2021-09-23 07:49:06,741][0m Trial 19 finished with value: 0.8144734211529314 and parameters: {'n_estimators': 3156, 'depth': 12, 'learning_rate': 0.007650049377416364, 'reg_alpha': 0.026614930787972578, 'reg_lambda': 0.10405086732081568, 'subsample': 0.5837072778789432, 'boosting_type': 'gbdt', 'min_child_samples': 24, 'num_leaves': 201, 'colsample_bytree': 0.7126823088369375}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.8144734211529314
20 trials complete


[32m[I 2021-09-23 07:53:29,020][0m Trial 20 finished with value: 0.8110116138388287 and parameters: {'n_estimators': 4228, 'depth': 6, 'learning_rate': 0.0017589068586290903, 'reg_alpha': 9.830490064255892, 'reg_lambda': 2.2287583374364384, 'subsample': 0.8362173013322499, 'boosting_type': 'gbdt', 'min_child_samples': 37, 'num_leaves': 82, 'colsample_bytree': 0.5554186356630381}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.8110116138388287


[32m[I 2021-09-23 08:00:39,496][0m Trial 21 finished with value: 0.8150128553087874 and parameters: {'n_estimators': 3543, 'depth': 8, 'learning_rate': 0.010244962359992175, 'reg_alpha': 4.867818061585001, 'reg_lambda': 0.2708366569898743, 'subsample': 0.6044050108505046, 'boosting_type': 'gbdt', 'min_child_samples': 12, 'num_leaves': 146, 'colsample_bytree': 0.6117849689803644}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.8150128553087874


[32m[I 2021-09-23 08:06:47,821][0m Trial 22 finished with value: 0.8141077485822792 and parameters: {'n_estimators': 3413, 'depth': 8, 'learning_rate': 0.01914105425750848, 'reg_alpha': 4.327784861498706, 'reg_lambda': 0.3059095471227339, 'subsample': 0.5719017394423589, 'boosting_type': 'gbdt', 'min_child_samples': 11, 'num_leaves': 156, 'colsample_bytree': 0.6243669366184729}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.8141077485822792


[32m[I 2021-09-23 08:15:10,785][0m Trial 23 finished with value: 0.8151323078372185 and parameters: {'n_estimators': 3725, 'depth': 10, 'learning_rate': 0.011764553202969125, 'reg_alpha': 14.304749530372794, 'reg_lambda': 0.07404435526330139, 'subsample': 0.6904823969499871, 'boosting_type': 'gbdt', 'min_child_samples': 9, 'num_leaves': 128, 'colsample_bytree': 0.5473088831250538}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.8151323078372185


[32m[I 2021-09-23 08:24:19,982][0m Trial 24 finished with value: 0.814751120434728 and parameters: {'n_estimators': 3809, 'depth': 10, 'learning_rate': 0.004463186879923906, 'reg_alpha': 11.470943473345589, 'reg_lambda': 0.06767773989441055, 'subsample': 0.6920028757573445, 'boosting_type': 'gbdt', 'min_child_samples': 4, 'num_leaves': 128, 'colsample_bytree': 0.5393966042477416}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.814751120434728
25 trials complete


[32m[I 2021-09-23 08:39:58,250][0m Trial 25 finished with value: 0.81263141874894 and parameters: {'n_estimators': 4130, 'depth': 11, 'learning_rate': 0.024266426653377665, 'reg_alpha': 28.694349064041038, 'reg_lambda': 0.025173738232261125, 'subsample': 0.690159198305991, 'boosting_type': 'gbdt', 'min_child_samples': 23, 'num_leaves': 180, 'colsample_bytree': 0.821459231082915}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.81263141874894


[32m[I 2021-09-23 08:44:23,830][0m Trial 26 finished with value: 0.8101901532481627 and parameters: {'n_estimators': 3069, 'depth': 11, 'learning_rate': 0.04671729032555551, 'reg_alpha': 0.001164601239126006, 'reg_lambda': 0.011375216839085907, 'subsample': 0.7995197872145816, 'boosting_type': 'gbdt', 'min_child_samples': 10, 'num_leaves': 130, 'colsample_bytree': 0.5042037411144846}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.8101901532481627


[32m[I 2021-09-23 08:49:09,652][0m Trial 27 finished with value: 0.8148212852980968 and parameters: {'n_estimators': 3718, 'depth': 9, 'learning_rate': 0.010073378516546907, 'reg_alpha': 1.1407411965526941, 'reg_lambda': 0.08632574656645059, 'subsample': 0.6384155081474046, 'boosting_type': 'gbdt', 'min_child_samples': 17, 'num_leaves': 96, 'colsample_bytree': 0.5630155955687722}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.8148212852980968


[32m[I 2021-09-23 08:58:51,311][0m Trial 28 finished with value: 0.8143546769136955 and parameters: {'n_estimators': 4354, 'depth': 10, 'learning_rate': 0.014368014620575466, 'reg_alpha': 0.3831123847669165, 'reg_lambda': 1.2092205163840761, 'subsample': 0.546651296060422, 'boosting_type': 'gbdt', 'min_child_samples': 8, 'num_leaves': 164, 'colsample_bytree': 0.540671715933468}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.8143546769136955


[32m[I 2021-09-23 09:06:34,055][0m Trial 29 finished with value: 0.8019464078100311 and parameters: {'n_estimators': 3952, 'depth': 12, 'learning_rate': 0.04319810397035442, 'reg_alpha': 14.003943390439431, 'reg_lambda': 0.004969683439285412, 'subsample': 0.5056261752363385, 'boosting_type': 'goss', 'min_child_samples': 25, 'num_leaves': 224, 'colsample_bytree': 0.9698707456902115}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.8019464078100311
30 trials complete


[32m[I 2021-09-23 09:30:42,563][0m Trial 30 finished with value: 0.8075879758427639 and parameters: {'n_estimators': 4134, 'depth': 7, 'learning_rate': 0.11457467947739161, 'reg_alpha': 2.480197924333022, 'reg_lambda': 0.03848121078456201, 'subsample': 0.6132916558551728, 'boosting_type': 'dart', 'min_child_samples': 15, 'num_leaves': 191, 'colsample_bytree': 0.6431157564921246}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.8075879758427639


[32m[I 2021-09-23 09:37:28,958][0m Trial 31 finished with value: 0.8149761920359844 and parameters: {'n_estimators': 3564, 'depth': 8, 'learning_rate': 0.008721779762572837, 'reg_alpha': 6.948752038823637, 'reg_lambda': 0.35073805264014213, 'subsample': 0.5929629510980321, 'boosting_type': 'gbdt', 'min_child_samples': 12, 'num_leaves': 151, 'colsample_bytree': 0.5956297959432378}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.8149761920359844


[32m[I 2021-09-23 09:45:27,586][0m Trial 32 finished with value: 0.8150567890937215 and parameters: {'n_estimators': 3294, 'depth': 9, 'learning_rate': 0.012514854209140152, 'reg_alpha': 15.662032211243902, 'reg_lambda': 0.23628397737956083, 'subsample': 0.6692668695781789, 'boosting_type': 'gbdt', 'min_child_samples': 8, 'num_leaves': 136, 'colsample_bytree': 0.7009106099270098}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.8150567890937215


[32m[I 2021-09-23 09:52:34,981][0m Trial 33 finished with value: 0.8135388091016496 and parameters: {'n_estimators': 3026, 'depth': 9, 'learning_rate': 0.0033040409566659004, 'reg_alpha': 16.729548842527024, 'reg_lambda': 0.16622230266349114, 'subsample': 0.6701193999586511, 'boosting_type': 'gbdt', 'min_child_samples': 7, 'num_leaves': 135, 'colsample_bytree': 0.7241772540708304}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.8135388091016496


[32m[I 2021-09-23 09:59:39,975][0m Trial 34 finished with value: 0.814955189584095 and parameters: {'n_estimators': 3279, 'depth': 10, 'learning_rate': 0.013757253153723533, 'reg_alpha': 15.65427358612387, 'reg_lambda': 0.029611248575007233, 'subsample': 0.7207711701214681, 'boosting_type': 'gbdt', 'min_child_samples': 4, 'num_leaves': 113, 'colsample_bytree': 0.6946726425474131}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.814955189584095
35 trials complete


[32m[I 2021-09-23 10:11:01,982][0m Trial 35 finished with value: 0.8145071376240444 and parameters: {'n_estimators': 3655, 'depth': 11, 'learning_rate': 0.006554998717101214, 'reg_alpha': 3.153956009833402, 'reg_lambda': 0.5413536818623761, 'subsample': 0.771271610605371, 'boosting_type': 'gbdt', 'min_child_samples': 57, 'num_leaves': 175, 'colsample_bytree': 0.8369248285788846}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.8145071376240444


[32m[I 2021-09-23 10:34:15,771][0m Trial 36 finished with value: 0.8084516471309667 and parameters: {'n_estimators': 4490, 'depth': 9, 'learning_rate': 0.002190497117581839, 'reg_alpha': 0.2327352822464566, 'reg_lambda': 0.01302918483074436, 'subsample': 0.7115054012333606, 'boosting_type': 'dart', 'min_child_samples': 19, 'num_leaves': 72, 'colsample_bytree': 0.5745438338278541}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.8084516471309667


[32m[I 2021-09-23 10:36:18,533][0m Trial 37 finished with value: 0.8113365525753758 and parameters: {'n_estimators': 2432, 'depth': 10, 'learning_rate': 0.01824080099775213, 'reg_alpha': 0.0537691175534489, 'reg_lambda': 0.09649492219733706, 'subsample': 0.6323133362270668, 'boosting_type': 'goss', 'min_child_samples': 13, 'num_leaves': 118, 'colsample_bytree': 0.532627010086967}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.8113365525753758


[32m[I 2021-09-23 10:40:31,099][0m Trial 38 finished with value: 0.8136140132100682 and parameters: {'n_estimators': 3854, 'depth': 6, 'learning_rate': 0.004219416907479407, 'reg_alpha': 9.062039128685567, 'reg_lambda': 0.05629601653446601, 'subsample': 0.5582403948266071, 'boosting_type': 'gbdt', 'min_child_samples': 8, 'num_leaves': 160, 'colsample_bytree': 0.68171920922992}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.8136140132100682


[32m[I 2021-09-23 10:56:50,877][0m Trial 39 finished with value: 0.8134037304182056 and parameters: {'n_estimators': 2921, 'depth': 7, 'learning_rate': 0.041557085530606, 'reg_alpha': 22.10156317813697, 'reg_lambda': 0.22984812170341015, 'subsample': 0.7484585501752069, 'boosting_type': 'dart', 'min_child_samples': 15, 'num_leaves': 102, 'colsample_bytree': 0.6525095024077675}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.8134037304182056
40 trials complete


[32m[I 2021-09-23 10:58:41,157][0m Trial 40 finished with value: 0.8118220374232437 and parameters: {'n_estimators': 982, 'depth': 11, 'learning_rate': 0.02291995645107263, 'reg_alpha': 1.017426549040932, 'reg_lambda': 1.7377991221837494, 'subsample': 0.6765297033649901, 'boosting_type': 'goss', 'min_child_samples': 67, 'num_leaves': 136, 'colsample_bytree': 0.5190399146434892}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.8118220374232437


[32m[I 2021-09-23 11:05:06,848][0m Trial 41 finished with value: 0.8146212573681091 and parameters: {'n_estimators': 2588, 'depth': 8, 'learning_rate': 0.011781110207541422, 'reg_alpha': 3.380352203422758, 'reg_lambda': 0.297436715803267, 'subsample': 0.6218409976490955, 'boosting_type': 'gbdt', 'min_child_samples': 13, 'num_leaves': 144, 'colsample_bytree': 0.7879047803352189}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.8146212573681091


[32m[I 2021-09-23 11:12:52,167][0m Trial 42 finished with value: 0.8150089987874044 and parameters: {'n_estimators': 3266, 'depth': 9, 'learning_rate': 0.008880753021800433, 'reg_alpha': 6.429006443572501, 'reg_lambda': 0.6408484158388579, 'subsample': 0.6047330053577136, 'boosting_type': 'gbdt', 'min_child_samples': 8, 'num_leaves': 125, 'colsample_bytree': 0.6164600751716469}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.8150089987874044


[32m[I 2021-09-23 11:18:37,949][0m Trial 43 finished with value: 0.8146531498364264 and parameters: {'n_estimators': 3445, 'depth': 8, 'learning_rate': 0.011581519592132114, 'reg_alpha': 1.8798367440312813, 'reg_lambda': 0.11549607943576999, 'subsample': 0.999007865737431, 'boosting_type': 'gbdt', 'min_child_samples': 20, 'num_leaves': 173, 'colsample_bytree': 0.6061690867141181}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.8146531498364264


[32m[I 2021-09-23 11:25:55,138][0m Trial 44 finished with value: 0.8139976786239942 and parameters: {'n_estimators': 3620, 'depth': 7, 'learning_rate': 0.004813666194634082, 'reg_alpha': 17.386781035900846, 'reg_lambda': 0.21351345458168183, 'subsample': 0.6527034513502582, 'boosting_type': 'gbdt', 'min_child_samples': 11, 'num_leaves': 156, 'colsample_bytree': 0.5702154875812782}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.8139976786239942
45 trials complete


[32m[I 2021-09-23 11:35:36,141][0m Trial 45 finished with value: 0.8141063396095715 and parameters: {'n_estimators': 4011, 'depth': 9, 'learning_rate': 0.017316360492641326, 'reg_alpha': 10.288085787583196, 'reg_lambda': 6.155535957564162, 'subsample': 0.7364978801629282, 'boosting_type': 'gbdt', 'min_child_samples': 45, 'num_leaves': 195, 'colsample_bytree': 0.6784411343152769}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.8141063396095715


[32m[I 2021-09-23 11:41:42,118][0m Trial 46 finished with value: 0.7966354823754607 and parameters: {'n_estimators': 2734, 'depth': 10, 'learning_rate': 0.3419635972120538, 'reg_alpha': 0.5636980050632224, 'reg_lambda': 0.018185253656445226, 'subsample': 0.6664583335903539, 'boosting_type': 'gbdt', 'min_child_samples': 6, 'num_leaves': 139, 'colsample_bytree': 0.5184797451586786}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.7966354823754607


[32m[I 2021-09-23 11:46:54,797][0m Trial 47 finished with value: 0.8147804697229194 and parameters: {'n_estimators': 4228, 'depth': 6, 'learning_rate': 0.007374335354095762, 'reg_alpha': 3.99370445367381, 'reg_lambda': 0.05591066223816827, 'subsample': 0.7074917850284995, 'boosting_type': 'gbdt', 'min_child_samples': 16, 'num_leaves': 120, 'colsample_bytree': 0.7413628964094082}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.8147804697229194


[32m[I 2021-09-23 12:09:07,575][0m Trial 48 finished with value: 0.813444522896126 and parameters: {'n_estimators': 3726, 'depth': 8, 'learning_rate': 0.021906465773311352, 'reg_alpha': 28.714030300984852, 'reg_lambda': 0.43559141606553625, 'subsample': 0.6449566488676258, 'boosting_type': 'dart', 'min_child_samples': 27, 'num_leaves': 152, 'colsample_bytree': 0.5490945052097663}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.813444522896126


[32m[I 2021-09-23 12:10:53,721][0m Trial 49 finished with value: 0.8147352037826713 and parameters: {'n_estimators': 3333, 'depth': 5, 'learning_rate': 0.013285342062402014, 'reg_alpha': 7.566871496371898, 'reg_lambda': 0.8790795628454507, 'subsample': 0.5676975119606613, 'boosting_type': 'goss', 'min_child_samples': 4, 'num_leaves': 109, 'colsample_bytree': 0.5876196887437328}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.8147352037826713
50 trials complete


[32m[I 2021-09-23 12:18:43,635][0m Trial 50 finished with value: 0.8130315265677364 and parameters: {'n_estimators': 2920, 'depth': 9, 'learning_rate': 0.03378917586447508, 'reg_alpha': 19.553505079563504, 'reg_lambda': 0.002386021880582869, 'subsample': 0.5950891441417506, 'boosting_type': 'gbdt', 'min_child_samples': 10, 'num_leaves': 170, 'colsample_bytree': 0.6379604297033814}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.8130315265677364


[32m[I 2021-09-23 12:24:27,762][0m Trial 51 finished with value: 0.8150057336278549 and parameters: {'n_estimators': 3169, 'depth': 9, 'learning_rate': 0.008869034791972801, 'reg_alpha': 5.868671678649466, 'reg_lambda': 0.7534701774098215, 'subsample': 0.6117184611476366, 'boosting_type': 'gbdt', 'min_child_samples': 7, 'num_leaves': 125, 'colsample_bytree': 0.6173556102195726}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.8150057336278549


[32m[I 2021-09-23 12:31:46,765][0m Trial 52 finished with value: 0.8008804408975426 and parameters: {'n_estimators': 3520, 'depth': 10, 'learning_rate': 0.21839949391273178, 'reg_alpha': 11.787306743942642, 'reg_lambda': 0.13862981047505857, 'subsample': 0.52890966298594, 'boosting_type': 'gbdt', 'min_child_samples': 8, 'num_leaves': 140, 'colsample_bytree': 0.6144602219052896}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.8008804408975426


[32m[I 2021-09-23 12:38:23,897][0m Trial 53 finished with value: 0.8147455212513226 and parameters: {'n_estimators': 3355, 'depth': 8, 'learning_rate': 0.00639819316131357, 'reg_alpha': 0.016041578526914204, 'reg_lambda': 0.22794876533442218, 'subsample': 0.6828998147313176, 'boosting_type': 'gbdt', 'min_child_samples': 13, 'num_leaves': 124, 'colsample_bytree': 0.5760661096931676}. Best is trial 10 with value: 0.8152310287561186.[0m


ROC AUC Score of XGBoost = 0.8147455212513226


[32m[I 2021-09-23 12:44:35,923][0m Trial 54 finished with value: 0.8154218474454626 and parameters: {'n_estimators': 3768, 'depth': 9, 'learning_rate': 0.010233384527490822, 'reg_alpha': 5.666877514598042, 'reg_lambda': 29.358511606519556, 'subsample': 0.5913679590879073, 'boosting_type': 'gbdt', 'min_child_samples': 21, 'num_leaves': 102, 'colsample_bytree': 0.5179917076284164}. Best is trial 54 with value: 0.8154218474454626.[0m


ROC AUC Score of XGBoost = 0.8154218474454626
55 trials complete


[32m[I 2021-09-23 12:49:20,875][0m Trial 55 finished with value: 0.8150298885150724 and parameters: {'n_estimators': 3808, 'depth': 8, 'learning_rate': 0.015415368148280987, 'reg_alpha': 2.0392340417384816, 'reg_lambda': 29.550772172580615, 'subsample': 0.6228803479112983, 'boosting_type': 'gbdt', 'min_child_samples': 22, 'num_leaves': 102, 'colsample_bytree': 0.5002943651073549}. Best is trial 54 with value: 0.8154218474454626.[0m


ROC AUC Score of XGBoost = 0.8150298885150724


[32m[I 2021-09-23 12:55:26,495][0m Trial 56 finished with value: 0.8141048404494805 and parameters: {'n_estimators': 3799, 'depth': 9, 'learning_rate': 0.026670074567918797, 'reg_alpha': 2.278600607449601, 'reg_lambda': 28.789569480034565, 'subsample': 0.6296983297419415, 'boosting_type': 'gbdt', 'min_child_samples': 21, 'num_leaves': 86, 'colsample_bytree': 0.5174003839821418}. Best is trial 54 with value: 0.8154218474454626.[0m


ROC AUC Score of XGBoost = 0.8141048404494805


[32m[I 2021-09-23 13:03:07,187][0m Trial 57 finished with value: 0.815569115836393 and parameters: {'n_estimators': 4080, 'depth': 7, 'learning_rate': 0.015661698750565334, 'reg_alpha': 21.657478406064467, 'reg_lambda': 4.7196927032311375, 'subsample': 0.6583469802928689, 'boosting_type': 'gbdt', 'min_child_samples': 33, 'num_leaves': 75, 'colsample_bytree': 0.5004942118860025}. Best is trial 57 with value: 0.815569115836393.[0m


ROC AUC Score of XGBoost = 0.815569115836393


[32m[I 2021-09-23 13:09:03,565][0m Trial 58 finished with value: 0.815526106221949 and parameters: {'n_estimators': 4275, 'depth': 6, 'learning_rate': 0.01818616199318113, 'reg_alpha': 12.142290038850012, 'reg_lambda': 7.554319798526443, 'subsample': 0.6992528804565766, 'boosting_type': 'gbdt', 'min_child_samples': 35, 'num_leaves': 55, 'colsample_bytree': 0.5205628485230431}. Best is trial 57 with value: 0.815569115836393.[0m


ROC AUC Score of XGBoost = 0.815526106221949


[32m[I 2021-09-23 13:13:22,702][0m Trial 59 finished with value: 0.8155243306553419 and parameters: {'n_estimators': 4315, 'depth': 6, 'learning_rate': 0.01996209557451632, 'reg_alpha': 20.92325034404242, 'reg_lambda': 4.394333157745482, 'subsample': 0.7269586972618948, 'boosting_type': 'gbdt', 'min_child_samples': 37, 'num_leaves': 51, 'colsample_bytree': 0.5255752208383068}. Best is trial 57 with value: 0.815569115836393.[0m


ROC AUC Score of XGBoost = 0.8155243306553419
60 trials complete


[32m[I 2021-09-23 13:19:02,489][0m Trial 60 finished with value: 0.814233985699786 and parameters: {'n_estimators': 4495, 'depth': 4, 'learning_rate': 0.06116913166935056, 'reg_alpha': 0.10136102629680761, 'reg_lambda': 4.276096850762959, 'subsample': 0.8017001572144496, 'boosting_type': 'gbdt', 'min_child_samples': 36, 'num_leaves': 58, 'colsample_bytree': 0.5294218171384942}. Best is trial 57 with value: 0.815569115836393.[0m


ROC AUC Score of XGBoost = 0.814233985699786


[32m[I 2021-09-23 13:23:32,325][0m Trial 61 finished with value: 0.8153535136301533 and parameters: {'n_estimators': 4257, 'depth': 6, 'learning_rate': 0.019701770341545775, 'reg_alpha': 23.379521246085314, 'reg_lambda': 12.086436365209064, 'subsample': 0.730169769149642, 'boosting_type': 'gbdt', 'min_child_samples': 41, 'num_leaves': 65, 'colsample_bytree': 0.5495586039296456}. Best is trial 57 with value: 0.815569115836393.[0m


ROC AUC Score of XGBoost = 0.8153535136301533


[32m[I 2021-09-23 13:28:00,786][0m Trial 62 finished with value: 0.8153931506447742 and parameters: {'n_estimators': 4287, 'depth': 6, 'learning_rate': 0.019816863400061807, 'reg_alpha': 23.35230363277317, 'reg_lambda': 12.888441599139876, 'subsample': 0.7324082647748, 'boosting_type': 'gbdt', 'min_child_samples': 41, 'num_leaves': 51, 'colsample_bytree': 0.5501220877681949}. Best is trial 57 with value: 0.815569115836393.[0m


ROC AUC Score of XGBoost = 0.8153931506447742


[32m[I 2021-09-23 13:34:44,879][0m Trial 63 finished with value: 0.8154763011703237 and parameters: {'n_estimators': 4274, 'depth': 6, 'learning_rate': 0.01978348071317367, 'reg_alpha': 21.035393264708542, 'reg_lambda': 13.799435025295711, 'subsample': 0.7687457037380415, 'boosting_type': 'gbdt', 'min_child_samples': 41, 'num_leaves': 50, 'colsample_bytree': 0.5193081989557434}. Best is trial 57 with value: 0.815569115836393.[0m


ROC AUC Score of XGBoost = 0.8154763011703237


[32m[I 2021-09-23 13:38:52,085][0m Trial 64 finished with value: 0.8155880487420302 and parameters: {'n_estimators': 4130, 'depth': 6, 'learning_rate': 0.020543150478389692, 'reg_alpha': 21.246664989689418, 'reg_lambda': 11.99745289059057, 'subsample': 0.7644548710357131, 'boosting_type': 'gbdt', 'min_child_samples': 41, 'num_leaves': 51, 'colsample_bytree': 0.5202601921080291}. Best is trial 64 with value: 0.8155880487420302.[0m


ROC AUC Score of XGBoost = 0.8155880487420302
65 trials complete


[32m[I 2021-09-23 13:41:52,100][0m Trial 65 finished with value: 0.8150940425674905 and parameters: {'n_estimators': 4113, 'depth': 5, 'learning_rate': 0.033839530422281425, 'reg_alpha': 8.01204698779487, 'reg_lambda': 7.784637408565759, 'subsample': 0.7941477879914267, 'boosting_type': 'gbdt', 'min_child_samples': 50, 'num_leaves': 50, 'colsample_bytree': 0.5218631151980587}. Best is trial 64 with value: 0.8155880487420302.[0m


ROC AUC Score of XGBoost = 0.8150940425674905


[32m[I 2021-09-23 13:47:56,063][0m Trial 66 finished with value: 0.8150474255778118 and parameters: {'n_estimators': 4392, 'depth': 6, 'learning_rate': 0.026578637355606127, 'reg_alpha': 11.725130278018142, 'reg_lambda': 19.39846195476265, 'subsample': 0.7651760742170615, 'boosting_type': 'gbdt', 'min_child_samples': 33, 'num_leaves': 73, 'colsample_bytree': 0.5146864090829721}. Best is trial 64 with value: 0.8155880487420302.[0m


ROC AUC Score of XGBoost = 0.8150474255778118


[32m[I 2021-09-23 13:53:55,250][0m Trial 67 finished with value: 0.8141959226211244 and parameters: {'n_estimators': 4080, 'depth': 5, 'learning_rate': 0.052024616738880806, 'reg_alpha': 24.205390254029435, 'reg_lambda': 3.7496860207278324, 'subsample': 0.7527417325781307, 'boosting_type': 'gbdt', 'min_child_samples': 41, 'num_leaves': 64, 'colsample_bytree': 0.5310443562714581}. Best is trial 64 with value: 0.8155880487420302.[0m


ROC AUC Score of XGBoost = 0.8141959226211244


[32m[I 2021-09-23 13:58:02,862][0m Trial 68 finished with value: 0.811119211509955 and parameters: {'n_estimators': 3952, 'depth': 6, 'learning_rate': 0.03714155086651255, 'reg_alpha': 29.93991144959574, 'reg_lambda': 20.101458775365977, 'subsample': 0.858843428714956, 'boosting_type': 'goss', 'min_child_samples': 37, 'num_leaves': 54, 'colsample_bytree': 0.5552509851614935}. Best is trial 64 with value: 0.8155880487420302.[0m


ROC AUC Score of XGBoost = 0.811119211509955


[32m[I 2021-09-23 14:13:09,984][0m Trial 69 finished with value: 0.8135724679697248 and parameters: {'n_estimators': 4282, 'depth': 5, 'learning_rate': 0.023088489628210526, 'reg_alpha': 20.76893160922438, 'reg_lambda': 10.585699367116293, 'subsample': 0.7772597498167529, 'boosting_type': 'dart', 'min_child_samples': 44, 'num_leaves': 76, 'colsample_bytree': 0.5042948866937692}. Best is trial 64 with value: 0.8155880487420302.[0m


ROC AUC Score of XGBoost = 0.8135724679697248
70 trials complete


[32m[I 2021-09-23 14:20:26,050][0m Trial 70 finished with value: 0.8150238235436559 and parameters: {'n_estimators': 4230, 'depth': 7, 'learning_rate': 0.016069487628562074, 'reg_alpha': 4.929588976315441, 'reg_lambda': 6.30191783281364, 'subsample': 0.7028426730142961, 'boosting_type': 'gbdt', 'min_child_samples': 30, 'num_leaves': 63, 'colsample_bytree': 0.5393228905416919}. Best is trial 64 with value: 0.8155880487420302.[0m


ROC AUC Score of XGBoost = 0.8150238235436559


[32m[I 2021-09-23 14:28:04,782][0m Trial 71 finished with value: 0.8153326674550253 and parameters: {'n_estimators': 4189, 'depth': 6, 'learning_rate': 0.019938554614182567, 'reg_alpha': 12.769025545113637, 'reg_lambda': 12.184952581834816, 'subsample': 0.7267028978432495, 'boosting_type': 'gbdt', 'min_child_samples': 41, 'num_leaves': 66, 'colsample_bytree': 0.5585605193724144}. Best is trial 64 with value: 0.8155880487420302.[0m


ROC AUC Score of XGBoost = 0.8153326674550253


[32m[I 2021-09-23 14:32:43,597][0m Trial 72 finished with value: 0.8156459279862528 and parameters: {'n_estimators': 4323, 'depth': 5, 'learning_rate': 0.021200050859660396, 'reg_alpha': 19.077546889417995, 'reg_lambda': 16.146057988110698, 'subsample': 0.7339336190557773, 'boosting_type': 'gbdt', 'min_child_samples': 46, 'num_leaves': 55, 'colsample_bytree': 0.5461401272955946}. Best is trial 72 with value: 0.8156459279862528.[0m


ROC AUC Score of XGBoost = 0.8156459279862528


[32m[I 2021-09-23 14:36:00,573][0m Trial 73 finished with value: 0.8156128505926237 and parameters: {'n_estimators': 4379, 'depth': 4, 'learning_rate': 0.02797895637976835, 'reg_alpha': 8.449269489808252, 'reg_lambda': 16.305009941235667, 'subsample': 0.7835667333701517, 'boosting_type': 'gbdt', 'min_child_samples': 48, 'num_leaves': 51, 'colsample_bytree': 0.5767174801254707}. Best is trial 72 with value: 0.8156459279862528.[0m


ROC AUC Score of XGBoost = 0.8156128505926237


[32m[I 2021-09-23 14:38:20,619][0m Trial 74 finished with value: 0.8156750636348244 and parameters: {'n_estimators': 4409, 'depth': 3, 'learning_rate': 0.03038569562151494, 'reg_alpha': 7.38712124251796, 'reg_lambda': 17.567912166658807, 'subsample': 0.8223236259802937, 'boosting_type': 'gbdt', 'min_child_samples': 47, 'num_leaves': 57, 'colsample_bytree': 0.576249287463262}. Best is trial 74 with value: 0.8156750636348244.[0m


ROC AUC Score of XGBoost = 0.8156750636348244
75 trials complete


[32m[I 2021-09-23 14:42:32,957][0m Trial 75 finished with value: 0.8157219144391968 and parameters: {'n_estimators': 4429, 'depth': 3, 'learning_rate': 0.02952568423554658, 'reg_alpha': 9.285152197932742, 'reg_lambda': 7.784744078293992, 'subsample': 0.8628511640697093, 'boosting_type': 'gbdt', 'min_child_samples': 47, 'num_leaves': 57, 'colsample_bytree': 0.573325963741589}. Best is trial 75 with value: 0.8157219144391968.[0m


ROC AUC Score of XGBoost = 0.8157219144391968


[32m[I 2021-09-23 14:44:57,512][0m Trial 76 finished with value: 0.8156500482647007 and parameters: {'n_estimators': 4407, 'depth': 3, 'learning_rate': 0.050440154358050285, 'reg_alpha': 9.037031276805386, 'reg_lambda': 3.5000486733487888, 'subsample': 0.8423419666876018, 'boosting_type': 'gbdt', 'min_child_samples': 55, 'num_leaves': 59, 'colsample_bytree': 0.5967187464681443}. Best is trial 75 with value: 0.8157219144391968.[0m


ROC AUC Score of XGBoost = 0.8156500482647007


[32m[I 2021-09-23 14:47:00,139][0m Trial 77 finished with value: 0.8149918391666693 and parameters: {'n_estimators': 4447, 'depth': 3, 'learning_rate': 0.08197863659533366, 'reg_alpha': 9.424286208141345, 'reg_lambda': 3.1595514253658754, 'subsample': 0.8740748374198333, 'boosting_type': 'gbdt', 'min_child_samples': 53, 'num_leaves': 59, 'colsample_bytree': 0.5862233176244588}. Best is trial 75 with value: 0.8157219144391968.[0m


ROC AUC Score of XGBoost = 0.8149918391666693


[32m[I 2021-09-23 14:50:09,860][0m Trial 78 finished with value: 0.8134021263797553 and parameters: {'n_estimators': 4400, 'depth': 4, 'learning_rate': 0.07522484164587954, 'reg_alpha': 3.446184910457573, 'reg_lambda': 7.575326620458662, 'subsample': 0.8234161084845607, 'boosting_type': 'gbdt', 'min_child_samples': 58, 'num_leaves': 81, 'colsample_bytree': 0.5831137461069004}. Best is trial 75 with value: 0.8157219144391968.[0m


ROC AUC Score of XGBoost = 0.8134021263797553


[32m[I 2021-09-23 14:52:26,429][0m Trial 79 finished with value: 0.8155874959289984 and parameters: {'n_estimators': 3994, 'depth': 3, 'learning_rate': 0.053453428283297084, 'reg_alpha': 7.931237920175674, 'reg_lambda': 20.577710704988142, 'subsample': 0.8973532965453676, 'boosting_type': 'gbdt', 'min_child_samples': 47, 'num_leaves': 69, 'colsample_bytree': 0.6000936095824673}. Best is trial 75 with value: 0.8157219144391968.[0m


ROC AUC Score of XGBoost = 0.8155874959289984
80 trials complete


[32m[I 2021-09-23 14:54:15,068][0m Trial 80 finished with value: 0.8156888720717373 and parameters: {'n_estimators': 3977, 'depth': 3, 'learning_rate': 0.05653278068192062, 'reg_alpha': 7.8874631765552214, 'reg_lambda': 18.565987377085847, 'subsample': 0.9352683982884042, 'boosting_type': 'gbdt', 'min_child_samples': 48, 'num_leaves': 71, 'colsample_bytree': 0.5985995413879266}. Best is trial 75 with value: 0.8157219144391968.[0m


ROC AUC Score of XGBoost = 0.8156888720717373


[32m[I 2021-09-23 14:56:06,020][0m Trial 81 finished with value: 0.8145862192695479 and parameters: {'n_estimators': 4006, 'depth': 3, 'learning_rate': 0.10187392950474047, 'reg_alpha': 7.7807437574862055, 'reg_lambda': 17.9588312848054, 'subsample': 0.9204860184804153, 'boosting_type': 'gbdt', 'min_child_samples': 47, 'num_leaves': 69, 'colsample_bytree': 0.5667100097696274}. Best is trial 75 with value: 0.8157219144391968.[0m


ROC AUC Score of XGBoost = 0.8145862192695479


[32m[I 2021-09-23 14:57:49,192][0m Trial 82 finished with value: 0.8157089104833485 and parameters: {'n_estimators': 3928, 'depth': 3, 'learning_rate': 0.05093706004812599, 'reg_alpha': 1.4050109113701448, 'reg_lambda': 23.383099717263306, 'subsample': 0.8756836361682607, 'boosting_type': 'gbdt', 'min_child_samples': 49, 'num_leaves': 77, 'colsample_bytree': 0.6011083652932999}. Best is trial 75 with value: 0.8157219144391968.[0m


ROC AUC Score of XGBoost = 0.8157089104833485


[32m[I 2021-09-23 14:59:31,083][0m Trial 83 finished with value: 0.8156233915882822 and parameters: {'n_estimators': 3919, 'depth': 3, 'learning_rate': 0.0495044219270338, 'reg_alpha': 4.282582725672136, 'reg_lambda': 23.56123161302528, 'subsample': 0.9066911993371677, 'boosting_type': 'gbdt', 'min_child_samples': 49, 'num_leaves': 80, 'colsample_bytree': 0.6023015819239279}. Best is trial 75 with value: 0.8157219144391968.[0m


ROC AUC Score of XGBoost = 0.8156233915882822


[32m[I 2021-09-23 15:01:45,385][0m Trial 84 finished with value: 0.8153064651981243 and parameters: {'n_estimators': 3909, 'depth': 4, 'learning_rate': 0.04075547109441111, 'reg_alpha': 4.139077325617311, 'reg_lambda': 9.172697147012956, 'subsample': 0.9407559900066769, 'boosting_type': 'gbdt', 'min_child_samples': 50, 'num_leaves': 83, 'colsample_bytree': 0.600525494438434}. Best is trial 75 with value: 0.8157219144391968.[0m


ROC AUC Score of XGBoost = 0.8153064651981243
85 trials complete


[32m[I 2021-09-23 15:02:38,142][0m Trial 85 finished with value: 0.8154724046190325 and parameters: {'n_estimators': 1943, 'depth': 3, 'learning_rate': 0.06531340739788383, 'reg_alpha': 3.0480487168962673, 'reg_lambda': 16.320373006852908, 'subsample': 0.8598259711459427, 'boosting_type': 'gbdt', 'min_child_samples': 55, 'num_leaves': 61, 'colsample_bytree': 0.6272445325805097}. Best is trial 75 with value: 0.8157219144391968.[0m


ROC AUC Score of XGBoost = 0.8154724046190325


[32m[I 2021-09-23 15:13:52,039][0m Trial 86 finished with value: 0.8141281983812565 and parameters: {'n_estimators': 4146, 'depth': 4, 'learning_rate': 0.09242839147800326, 'reg_alpha': 1.3313998318992382, 'reg_lambda': 24.848257849247133, 'subsample': 0.8941904477112065, 'boosting_type': 'dart', 'min_child_samples': 49, 'num_leaves': 91, 'colsample_bytree': 0.6642354229612036}. Best is trial 75 with value: 0.8157219144391968.[0m


ROC AUC Score of XGBoost = 0.8141281983812565


[32m[I 2021-09-23 15:15:39,269][0m Trial 87 finished with value: 0.8142581951477685 and parameters: {'n_estimators': 4367, 'depth': 3, 'learning_rate': 0.047592837768091534, 'reg_alpha': 2.6961238191340158, 'reg_lambda': 9.868800468978371, 'subsample': 0.8395677617212493, 'boosting_type': 'goss', 'min_child_samples': 52, 'num_leaves': 79, 'colsample_bytree': 0.6384517446396001}. Best is trial 75 with value: 0.8157219144391968.[0m


ROC AUC Score of XGBoost = 0.8142581951477685


[32m[I 2021-09-23 15:20:01,270][0m Trial 88 finished with value: 0.8100441789040739 and parameters: {'n_estimators': 4484, 'depth': 4, 'learning_rate': 0.13584834629138098, 'reg_alpha': 4.797656455289755, 'reg_lambda': 2.2700195714363045, 'subsample': 0.9716778769677631, 'boosting_type': 'gbdt', 'min_child_samples': 46, 'num_leaves': 59, 'colsample_bytree': 0.5771654037588235}. Best is trial 75 with value: 0.8157219144391968.[0m


ROC AUC Score of XGBoost = 0.8100441789040739


[32m[I 2021-09-23 15:22:22,062][0m Trial 89 finished with value: 0.8156193930808151 and parameters: {'n_estimators': 4180, 'depth': 3, 'learning_rate': 0.03020621257716461, 'reg_alpha': 14.985602993060041, 'reg_lambda': 5.76106747862505, 'subsample': 0.9129102789773111, 'boosting_type': 'gbdt', 'min_child_samples': 43, 'num_leaves': 69, 'colsample_bytree': 0.9504996349100717}. Best is trial 75 with value: 0.8157219144391968.[0m


ROC AUC Score of XGBoost = 0.8156193930808151
90 trials complete


[32m[I 2021-09-23 15:22:58,295][0m Trial 90 finished with value: 0.813675037524116 and parameters: {'n_estimators': 1249, 'depth': 3, 'learning_rate': 0.03118245902443823, 'reg_alpha': 0.3438212325656988, 'reg_lambda': 5.664754675706434, 'subsample': 0.9172009467869863, 'boosting_type': 'gbdt', 'min_child_samples': 44, 'num_leaves': 87, 'colsample_bytree': 0.5954454594975628}. Best is trial 75 with value: 0.8157219144391968.[0m


ROC AUC Score of XGBoost = 0.813675037524116


[32m[I 2021-09-23 15:26:17,279][0m Trial 91 finished with value: 0.8153047872644636 and parameters: {'n_estimators': 4164, 'depth': 4, 'learning_rate': 0.03760041816694198, 'reg_alpha': 14.662242950292233, 'reg_lambda': 21.109923295106235, 'subsample': 0.8803478660491111, 'boosting_type': 'gbdt', 'min_child_samples': 55, 'num_leaves': 70, 'colsample_bytree': 0.9456772795966897}. Best is trial 75 with value: 0.8157219144391968.[0m


ROC AUC Score of XGBoost = 0.8153047872644636


[32m[I 2021-09-23 15:28:33,509][0m Trial 92 finished with value: 0.8154594337278883 and parameters: {'n_estimators': 4373, 'depth': 3, 'learning_rate': 0.02691844120240025, 'reg_alpha': 6.29025689880095, 'reg_lambda': 15.724240125727162, 'subsample': 0.9240425865308759, 'boosting_type': 'gbdt', 'min_child_samples': 60, 'num_leaves': 56, 'colsample_bytree': 0.8602968898016949}. Best is trial 75 with value: 0.8157219144391968.[0m


ROC AUC Score of XGBoost = 0.8154594337278883


[32m[I 2021-09-23 15:31:22,337][0m Trial 93 finished with value: 0.8156364760843058 and parameters: {'n_estimators': 4062, 'depth': 3, 'learning_rate': 0.05062326897033488, 'reg_alpha': 9.700905506286727, 'reg_lambda': 23.372218653513894, 'subsample': 0.847634891273144, 'boosting_type': 'gbdt', 'min_child_samples': 48, 'num_leaves': 66, 'colsample_bytree': 0.8994149063697776}. Best is trial 75 with value: 0.8157219144391968.[0m


ROC AUC Score of XGBoost = 0.8156364760843058


[32m[I 2021-09-23 15:35:19,966][0m Trial 94 finished with value: 0.8156465965657792 and parameters: {'n_estimators': 4026, 'depth': 3, 'learning_rate': 0.04989282984575652, 'reg_alpha': 9.842040283375686, 'reg_lambda': 25.391506029381006, 'subsample': 0.8522991317741261, 'boosting_type': 'gbdt', 'min_child_samples': 48, 'num_leaves': 67, 'colsample_bytree': 0.9385338747540019}. Best is trial 75 with value: 0.8157219144391968.[0m


ROC AUC Score of XGBoost = 0.8156465965657792
95 trials complete


In [18]:
dump(study, filename=datapath/'optuna_lightgbm_100trials-complete_20210922.joblib')
dump(study.best_trial.params, filename=datapath/'optuna_lightgbm_all-100trials-best_20210922.joblib')
# pickle.dump(study.best_trial.params, open('CatBoost_Hyperparameter.pickle', 'wb'))
# print('CatBoost Hyperparameter:', study.best_trial.params)

['/media/sf/easystore/kaggle_data/tabular_playgrounds/sep2021/optuna_lightgbm_all-100trials-best_20210922.joblib']

In [19]:
study.best_trial.params

{'n_estimators': 4429,
 'depth': 3,
 'learning_rate': 0.02952568423554658,
 'reg_alpha': 9.285152197932742,
 'reg_lambda': 7.784744078293992,
 'subsample': 0.8628511640697093,
 'boosting_type': 'gbdt',
 'min_child_samples': 47,
 'num_leaves': 57,
 'colsample_bytree': 0.573325963741589}

In [20]:
wandb.log({'lightgbm_params': study.best_trial.params})
wandb.finish()

VBox(children=(Label(value=' 0.00MB of 0.00MB uploaded (0.00MB deduped)\r'), FloatProgress(value=1.0, max=1.0)…

0,1
valid_auc,0.81565


0,1
valid_auc,▅▆▅▁▁▇▇▇▇█▇▅▇█▇▄▇▆▇▇▇▆▇██▇██▇▇████▇█▇███
