# Model training

## Settings

In [1]:
%load_ext autoreload

In [2]:
%autoreload 2

In [3]:
import helpers.settings as sts
sts.print_settings(sts)

[1m[91mBEST_ESTIMATOR_FILENAME : best_estimator_0.0.1.pkl
[1m[91mDATASET_TRAIN_FILENAME : dataset_train.parquet
[1m[91mDATASET_VALIDATION_FILENAME : dataset_validation.parquet
[1m[91mETL_VERSION : 0.0.1
[1m[91mMODEL_FILENAME : model_0.0.1.pkl
[1m[91mMODEL_VERSION : 0.0.1
[1m[91mPREPROCESSOR_FILENAME : preprocessor_0.0.1.pkl
[1m[91mTRAINED_BEST_ESTIMATOR_FILENAME : trained_best_estimator_0.0.1.pkl
[1m[91mcolor : <class 'helpers.settings.color'>
[1m[91mprint_settings : <function print_settings at 0x7fa094aaac10>
[0m


## Imports

In [4]:
import pickle
import pandas as pd
import numpy as np
from sklearn.metrics import (
    classification_report,
    plot_precision_recall_curve,
    precision_recall_curve,
    average_precision_score,
)
from sklearn.model_selection import RandomizedSearchCV
from xgboost import XGBClassifier
from lightgbm import LGBMClassifier
from sklearn.pipeline import Pipeline
from sklearn.ensemble import RandomForestClassifier
from scipy.stats import randint as sp_randint
import shap

## Load train dataset

In [5]:
df_train = pd.read_parquet(f"data/{sts.DATASET_TRAIN_FILENAME}")

In [6]:
X_train = df_train.iloc[:,:-1]
y_train = df_train.iloc[:,-1]

## Best estimator param grid

In [7]:
estimators = [
    {
        "clf": [RandomForestClassifier()],
        "clf__bootstrap": [True, False],
        "clf__max_depth": [10, 20, 30, 40, 50, 60, 70, 80, 90, 100, None],
        "clf__max_features": ["auto", "sqrt"],
        "clf__min_samples_leaf": [1, 2, 4],
        "clf__min_samples_split": [2, 5, 10],
        "clf__n_estimators": [100, 200, 400, 500]
    },
    {
        "clf": [XGBClassifier()],
        "clf__objective": ["binary:logistic"],
        "clf__use_label_encoder": [False],
        "clf__eval_metric": ["logloss"],
        "clf__learning_rate": [0.0001, 0.001, 0.01, 0.1, 0.2, 0.3],
        "clf__min_child_weight": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10],
        "clf__gamma": [0.5, 1, 1.5, 2, 5],
        "clf__subsample": np.random.uniform(1, .7, 1),
        "clf__colsample_bytree": [ 0.3, 0.4, 0.5 , 0.7 ],
        "clf__max_depth": [3, 4, 5, 6, 7, 8],
        "clf__n_estimators": np.arange(100, 500, 10),
        
    },
    {
        "clf": [LGBMClassifier()],
        "clf__num_leaves": sp_randint(6, 50), 
        "clf__min_child_samples": sp_randint(100, 500), 
        "clf__min_child_weight": [1e-5, 1e-3, 1e-2, 1e-1, 1, 1e1, 1e2, 1e3, 1e4],
        "clf__subsample": np.random.uniform(0.2, 0.8, 1), 
        "clf__colsample_bytree": np.random.uniform(0.4, 0.6, 1),
        "clf__reg_alpha": [0, 1e-1, 1, 2, 5, 7, 10, 50, 100],
        "clf__reg_lambda": [0, 1e-1, 1, 5, 10, 20, 50, 100],
    },  
]

## Load best estimator

In [8]:
with open(f"artifacts/{sts.BEST_ESTIMATOR_FILENAME}", "rb") as file:
    best_estimator = pickle.load(file)

In [9]:
rs = RandomizedSearchCV(
    best_estimator, 
    estimators, 
    cv=3,
    scoring="average_precision",
    n_jobs=1, 
    verbose=3, 
    n_iter=20, 
    random_state=42,
)

In [10]:
rs.fit(X_train, y_train)

2021-09-01 05:57:30.413610 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
[Parallel(n_jobs=1)]: Using backend SequentialBackend with 1 concurrent workers.
2021-09-01 05:57:30.420473 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


Fitting 3 folds for each of 20 candidates, totalling 60 fits
[CV] clf=LGBMClassifier(), clf__colsample_bytree=0.5731341767005942, clf__min_child_samples=448, clf__min_child_weight=1000.0, clf__num_leaves=26, clf__reg_alpha=10, clf__reg_lambda=0.1, clf__subsample=0.40181578955992386 
[CV]  clf=LGBMClassifier(), clf__colsample_bytree=0.5731341767005942, clf__min_child_samples=448, clf__min_child_weight=1000.0, clf__num_leaves=26, clf__reg_alpha=10, clf__reg_lambda=0.1, clf__subsample=0.40181578955992386, score=0.013, total=   0.4s
[CV] clf=LGBMClassifier(), clf__colsample_bytree=0.5731341767005942, clf__min_child_samples=448, clf__min_child_weight=1000.0, clf__num_leaves=26, clf__reg_alpha=10, clf__reg_lambda=0.1, clf__subsample=0.40181578955992386 


[Parallel(n_jobs=1)]: Done   1 out of   1 | elapsed:    0.4s remaining:    0.0s
2021-09-01 05:57:30.790227 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=LGBMClassifier(), clf__colsample_bytree=0.5731341767005942, clf__min_child_samples=448, clf__min_child_weight=1000.0, clf__num_leaves=26, clf__reg_alpha=10, clf__reg_lambda=0.1, clf__subsample=0.40181578955992386, score=0.013, total=   0.4s
[CV] clf=LGBMClassifier(), clf__colsample_bytree=0.5731341767005942, clf__min_child_samples=448, clf__min_child_weight=1000.0, clf__num_leaves=26, clf__reg_alpha=10, clf__reg_lambda=0.1, clf__subsample=0.40181578955992386 


[Parallel(n_jobs=1)]: Done   2 out of   2 | elapsed:    0.8s remaining:    0.0s
2021-09-01 05:57:31.180367 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=LGBMClassifier(), clf__colsample_bytree=0.5731341767005942, clf__min_child_samples=448, clf__min_child_weight=1000.0, clf__num_leaves=26, clf__reg_alpha=10, clf__reg_lambda=0.1, clf__subsample=0.40181578955992386, score=0.013, total=   0.4s
[CV] clf=LGBMClassifier(), clf__colsample_bytree=0.5731341767005942, clf__min_child_samples=314, clf__min_child_weight=1000.0, clf__num_leaves=41, clf__reg_alpha=50, clf__reg_lambda=100, clf__subsample=0.40181578955992386 


2021-09-01 05:57:31.572540 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=LGBMClassifier(), clf__colsample_bytree=0.5731341767005942, clf__min_child_samples=314, clf__min_child_weight=1000.0, clf__num_leaves=41, clf__reg_alpha=50, clf__reg_lambda=100, clf__subsample=0.40181578955992386, score=0.013, total=   0.4s
[CV] clf=LGBMClassifier(), clf__colsample_bytree=0.5731341767005942, clf__min_child_samples=314, clf__min_child_weight=1000.0, clf__num_leaves=41, clf__reg_alpha=50, clf__reg_lambda=100, clf__subsample=0.40181578955992386 


2021-09-01 05:57:31.961938 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=LGBMClassifier(), clf__colsample_bytree=0.5731341767005942, clf__min_child_samples=314, clf__min_child_weight=1000.0, clf__num_leaves=41, clf__reg_alpha=50, clf__reg_lambda=100, clf__subsample=0.40181578955992386, score=0.013, total=   0.4s
[CV] clf=LGBMClassifier(), clf__colsample_bytree=0.5731341767005942, clf__min_child_samples=314, clf__min_child_weight=1000.0, clf__num_leaves=41, clf__reg_alpha=50, clf__reg_lambda=100, clf__subsample=0.40181578955992386 


2021-09-01 05:57:32.350957 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=LGBMClassifier(), clf__colsample_bytree=0.5731341767005942, clf__min_child_samples=314, clf__min_child_weight=1000.0, clf__num_leaves=41, clf__reg_alpha=50, clf__reg_lambda=100, clf__subsample=0.40181578955992386, score=0.013, total=   0.4s
[CV] clf=LGBMClassifier(), clf__colsample_bytree=0.5731341767005942, clf__min_child_samples=249, clf__min_child_weight=1, clf__num_leaves=7, clf__reg_alpha=50, clf__reg_lambda=5, clf__subsample=0.40181578955992386 


2021-09-01 05:57:32.775183 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=LGBMClassifier(), clf__colsample_bytree=0.5731341767005942, clf__min_child_samples=249, clf__min_child_weight=1, clf__num_leaves=7, clf__reg_alpha=50, clf__reg_lambda=5, clf__subsample=0.40181578955992386, score=0.013, total=   0.4s
[CV] clf=LGBMClassifier(), clf__colsample_bytree=0.5731341767005942, clf__min_child_samples=249, clf__min_child_weight=1, clf__num_leaves=7, clf__reg_alpha=50, clf__reg_lambda=5, clf__subsample=0.40181578955992386 


2021-09-01 05:57:33.162606 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=LGBMClassifier(), clf__colsample_bytree=0.5731341767005942, clf__min_child_samples=249, clf__min_child_weight=1, clf__num_leaves=7, clf__reg_alpha=50, clf__reg_lambda=5, clf__subsample=0.40181578955992386, score=0.013, total=   0.4s
[CV] clf=LGBMClassifier(), clf__colsample_bytree=0.5731341767005942, clf__min_child_samples=249, clf__min_child_weight=1, clf__num_leaves=7, clf__reg_alpha=50, clf__reg_lambda=5, clf__subsample=0.40181578955992386 


2021-09-01 05:57:33.542163 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=LGBMClassifier(), clf__colsample_bytree=0.5731341767005942, clf__min_child_samples=249, clf__min_child_weight=1, clf__num_leaves=7, clf__reg_alpha=50, clf__reg_lambda=5, clf__subsample=0.40181578955992386, score=0.013, total=   0.4s
[CV] clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=None,
              colsample_bynode=None, colsample_bytree=None, gamma=None,
              gpu_id=None, importance_type='gain', interaction_constraints=None,
              learning_rate=None, max_delta_step=None, max_depth=None,
              min_child_weight=None, missing=nan, monotone_constraints=None,
              n_estimators=100, n_jobs=None, num_parallel_tree=None,
              random_state=None, reg_alpha=None, reg_lambda=None,
              scale_pos_weight=None, subsample=None, tree_method=None,
              validate_parameters=None, verbosity=None), clf__colsample_bytree=0.4, clf__eval_metric=logloss, clf__gamma=1, clf__learning_rate=0.1, clf__max_depth=7, clf__m

2021-09-01 05:57:33.926226 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=None,
              colsample_bynode=None, colsample_bytree=None, gamma=None,
              gpu_id=None, importance_type='gain', interaction_constraints=None,
              learning_rate=None, max_delta_step=None, max_depth=None,
              min_child_weight=None, missing=nan, monotone_constraints=None,
              n_estimators=100, n_jobs=None, num_parallel_tree=None,
              random_state=None, reg_alpha=None, reg_lambda=None,
              scale_pos_weight=None, subsample=None, tree_method=None,
              validate_parameters=None, verbosity=None), clf__colsample_bytree=0.4, clf__eval_metric=logloss, clf__gamma=1, clf__learning_rate=0.1, clf__max_depth=7, clf__min_child_weight=1, clf__n_estimators=210, clf__objective=binary:logistic, clf__subsample=0.9007190934314233, clf__use_label_encoder=False, score=0.791, total=   1.2s
[CV] clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=None

2021-09-01 05:57:35.158811 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=None,
              colsample_bynode=None, colsample_bytree=None, gamma=None,
              gpu_id=None, importance_type='gain', interaction_constraints=None,
              learning_rate=None, max_delta_step=None, max_depth=None,
              min_child_weight=None, missing=nan, monotone_constraints=None,
              n_estimators=100, n_jobs=None, num_parallel_tree=None,
              random_state=None, reg_alpha=None, reg_lambda=None,
              scale_pos_weight=None, subsample=None, tree_method=None,
              validate_parameters=None, verbosity=None), clf__colsample_bytree=0.4, clf__eval_metric=logloss, clf__gamma=1, clf__learning_rate=0.1, clf__max_depth=7, clf__min_child_weight=1, clf__n_estimators=210, clf__objective=binary:logistic, clf__subsample=0.9007190934314233, clf__use_label_encoder=False, score=0.686, total=   1.2s
[CV] clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=None

2021-09-01 05:57:36.412164 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=None,
              colsample_bynode=None, colsample_bytree=None, gamma=None,
              gpu_id=None, importance_type='gain', interaction_constraints=None,
              learning_rate=None, max_delta_step=None, max_depth=None,
              min_child_weight=None, missing=nan, monotone_constraints=None,
              n_estimators=100, n_jobs=None, num_parallel_tree=None,
              random_state=None, reg_alpha=None, reg_lambda=None,
              scale_pos_weight=None, subsample=None, tree_method=None,
              validate_parameters=None, verbosity=None), clf__colsample_bytree=0.4, clf__eval_metric=logloss, clf__gamma=1, clf__learning_rate=0.1, clf__max_depth=7, clf__min_child_weight=1, clf__n_estimators=210, clf__objective=binary:logistic, clf__subsample=0.9007190934314233, clf__use_label_encoder=False, score=0.762, total=   1.3s
[CV] clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=None

2021-09-01 05:57:37.668773 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=None,
              colsample_bynode=None, colsample_bytree=None, gamma=None,
              gpu_id=None, importance_type='gain', interaction_constraints=None,
              learning_rate=None, max_delta_step=None, max_depth=None,
              min_child_weight=None, missing=nan, monotone_constraints=None,
              n_estimators=100, n_jobs=None, num_parallel_tree=None,
              random_state=None, reg_alpha=None, reg_lambda=None,
              scale_pos_weight=None, subsample=None, tree_method=None,
              validate_parameters=None, verbosity=None), clf__colsample_bytree=0.4, clf__eval_metric=logloss, clf__gamma=5, clf__learning_rate=0.1, clf__max_depth=3, clf__min_child_weight=1, clf__n_estimators=360, clf__objective=binary:logistic, clf__subsample=0.9007190934314233, clf__use_label_encoder=False, score=0.491, total=   1.2s
[CV] clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=None

2021-09-01 05:57:38.826858 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=None,
              colsample_bynode=None, colsample_bytree=None, gamma=None,
              gpu_id=None, importance_type='gain', interaction_constraints=None,
              learning_rate=None, max_delta_step=None, max_depth=None,
              min_child_weight=None, missing=nan, monotone_constraints=None,
              n_estimators=100, n_jobs=None, num_parallel_tree=None,
              random_state=None, reg_alpha=None, reg_lambda=None,
              scale_pos_weight=None, subsample=None, tree_method=None,
              validate_parameters=None, verbosity=None), clf__colsample_bytree=0.4, clf__eval_metric=logloss, clf__gamma=5, clf__learning_rate=0.1, clf__max_depth=3, clf__min_child_weight=1, clf__n_estimators=360, clf__objective=binary:logistic, clf__subsample=0.9007190934314233, clf__use_label_encoder=False, score=0.380, total=   1.2s
[CV] clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=None

2021-09-01 05:57:39.995569 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=None,
              colsample_bynode=None, colsample_bytree=None, gamma=None,
              gpu_id=None, importance_type='gain', interaction_constraints=None,
              learning_rate=None, max_delta_step=None, max_depth=None,
              min_child_weight=None, missing=nan, monotone_constraints=None,
              n_estimators=100, n_jobs=None, num_parallel_tree=None,
              random_state=None, reg_alpha=None, reg_lambda=None,
              scale_pos_weight=None, subsample=None, tree_method=None,
              validate_parameters=None, verbosity=None), clf__colsample_bytree=0.4, clf__eval_metric=logloss, clf__gamma=5, clf__learning_rate=0.1, clf__max_depth=3, clf__min_child_weight=1, clf__n_estimators=360, clf__objective=binary:logistic, clf__subsample=0.9007190934314233, clf__use_label_encoder=False, score=0.394, total=   1.1s
[CV] clf=LGBMClassifier(), clf__colsample_bytree=0.5731341767005942, clf__mi

2021-09-01 05:57:41.149094 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=LGBMClassifier(), clf__colsample_bytree=0.5731341767005942, clf__min_child_samples=269, clf__min_child_weight=0.01, clf__num_leaves=49, clf__reg_alpha=10, clf__reg_lambda=5, clf__subsample=0.40181578955992386, score=0.157, total=   0.4s
[CV] clf=LGBMClassifier(), clf__colsample_bytree=0.5731341767005942, clf__min_child_samples=269, clf__min_child_weight=0.01, clf__num_leaves=49, clf__reg_alpha=10, clf__reg_lambda=5, clf__subsample=0.40181578955992386 


2021-09-01 05:57:41.564899 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=LGBMClassifier(), clf__colsample_bytree=0.5731341767005942, clf__min_child_samples=269, clf__min_child_weight=0.01, clf__num_leaves=49, clf__reg_alpha=10, clf__reg_lambda=5, clf__subsample=0.40181578955992386, score=0.139, total=   0.4s
[CV] clf=LGBMClassifier(), clf__colsample_bytree=0.5731341767005942, clf__min_child_samples=269, clf__min_child_weight=0.01, clf__num_leaves=49, clf__reg_alpha=10, clf__reg_lambda=5, clf__subsample=0.40181578955992386 


2021-09-01 05:57:41.977824 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=LGBMClassifier(), clf__colsample_bytree=0.5731341767005942, clf__min_child_samples=269, clf__min_child_weight=0.01, clf__num_leaves=49, clf__reg_alpha=10, clf__reg_lambda=5, clf__subsample=0.40181578955992386, score=0.149, total=   0.4s
[CV] clf=RandomForestClassifier(), clf__bootstrap=True, clf__max_depth=50, clf__max_features=auto, clf__min_samples_leaf=4, clf__min_samples_split=2, clf__n_estimators=100 


2021-09-01 05:57:42.392408 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=RandomForestClassifier(), clf__bootstrap=True, clf__max_depth=50, clf__max_features=auto, clf__min_samples_leaf=4, clf__min_samples_split=2, clf__n_estimators=100, score=0.825, total=   1.4s
[CV] clf=RandomForestClassifier(), clf__bootstrap=True, clf__max_depth=50, clf__max_features=auto, clf__min_samples_leaf=4, clf__min_samples_split=2, clf__n_estimators=100 


2021-09-01 05:57:43.770622 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=RandomForestClassifier(), clf__bootstrap=True, clf__max_depth=50, clf__max_features=auto, clf__min_samples_leaf=4, clf__min_samples_split=2, clf__n_estimators=100, score=0.718, total=   1.3s
[CV] clf=RandomForestClassifier(), clf__bootstrap=True, clf__max_depth=50, clf__max_features=auto, clf__min_samples_leaf=4, clf__min_samples_split=2, clf__n_estimators=100 


2021-09-01 05:57:45.110020 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=RandomForestClassifier(), clf__bootstrap=True, clf__max_depth=50, clf__max_features=auto, clf__min_samples_leaf=4, clf__min_samples_split=2, clf__n_estimators=100, score=0.779, total=   1.3s
[CV] clf=LGBMClassifier(), clf__colsample_bytree=0.5731341767005942, clf__min_child_samples=373, clf__min_child_weight=0.1, clf__num_leaves=30, clf__reg_alpha=0.1, clf__reg_lambda=0.1, clf__subsample=0.40181578955992386 


2021-09-01 05:57:46.405323 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=LGBMClassifier(), clf__colsample_bytree=0.5731341767005942, clf__min_child_samples=373, clf__min_child_weight=0.1, clf__num_leaves=30, clf__reg_alpha=0.1, clf__reg_lambda=0.1, clf__subsample=0.40181578955992386, score=0.683, total=   0.4s
[CV] clf=LGBMClassifier(), clf__colsample_bytree=0.5731341767005942, clf__min_child_samples=373, clf__min_child_weight=0.1, clf__num_leaves=30, clf__reg_alpha=0.1, clf__reg_lambda=0.1, clf__subsample=0.40181578955992386 


2021-09-01 05:57:46.824325 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=LGBMClassifier(), clf__colsample_bytree=0.5731341767005942, clf__min_child_samples=373, clf__min_child_weight=0.1, clf__num_leaves=30, clf__reg_alpha=0.1, clf__reg_lambda=0.1, clf__subsample=0.40181578955992386, score=0.616, total=   0.5s
[CV] clf=LGBMClassifier(), clf__colsample_bytree=0.5731341767005942, clf__min_child_samples=373, clf__min_child_weight=0.1, clf__num_leaves=30, clf__reg_alpha=0.1, clf__reg_lambda=0.1, clf__subsample=0.40181578955992386 


2021-09-01 05:57:47.284627 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=LGBMClassifier(), clf__colsample_bytree=0.5731341767005942, clf__min_child_samples=373, clf__min_child_weight=0.1, clf__num_leaves=30, clf__reg_alpha=0.1, clf__reg_lambda=0.1, clf__subsample=0.40181578955992386, score=0.688, total=   0.5s
[CV] clf=RandomForestClassifier(), clf__bootstrap=False, clf__max_depth=50, clf__max_features=sqrt, clf__min_samples_leaf=4, clf__min_samples_split=10, clf__n_estimators=500 


2021-09-01 05:57:47.747665 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=RandomForestClassifier(), clf__bootstrap=False, clf__max_depth=50, clf__max_features=sqrt, clf__min_samples_leaf=4, clf__min_samples_split=10, clf__n_estimators=500, score=0.853, total=   7.0s
[CV] clf=RandomForestClassifier(), clf__bootstrap=False, clf__max_depth=50, clf__max_features=sqrt, clf__min_samples_leaf=4, clf__min_samples_split=10, clf__n_estimators=500 


2021-09-01 05:57:54.721850 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=RandomForestClassifier(), clf__bootstrap=False, clf__max_depth=50, clf__max_features=sqrt, clf__min_samples_leaf=4, clf__min_samples_split=10, clf__n_estimators=500, score=0.755, total=   6.8s
[CV] clf=RandomForestClassifier(), clf__bootstrap=False, clf__max_depth=50, clf__max_features=sqrt, clf__min_samples_leaf=4, clf__min_samples_split=10, clf__n_estimators=500 


2021-09-01 05:58:01.484027 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=RandomForestClassifier(), clf__bootstrap=False, clf__max_depth=50, clf__max_features=sqrt, clf__min_samples_leaf=4, clf__min_samples_split=10, clf__n_estimators=500, score=0.826, total=   6.6s
[CV] clf=RandomForestClassifier(), clf__bootstrap=False, clf__max_depth=30, clf__max_features=sqrt, clf__min_samples_leaf=1, clf__min_samples_split=5, clf__n_estimators=500 


2021-09-01 05:58:08.121486 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=RandomForestClassifier(), clf__bootstrap=False, clf__max_depth=30, clf__max_features=sqrt, clf__min_samples_leaf=1, clf__min_samples_split=5, clf__n_estimators=500, score=0.886, total=   6.9s
[CV] clf=RandomForestClassifier(), clf__bootstrap=False, clf__max_depth=30, clf__max_features=sqrt, clf__min_samples_leaf=1, clf__min_samples_split=5, clf__n_estimators=500 


2021-09-01 05:58:15.035775 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=RandomForestClassifier(), clf__bootstrap=False, clf__max_depth=30, clf__max_features=sqrt, clf__min_samples_leaf=1, clf__min_samples_split=5, clf__n_estimators=500, score=0.811, total=   6.9s
[CV] clf=RandomForestClassifier(), clf__bootstrap=False, clf__max_depth=30, clf__max_features=sqrt, clf__min_samples_leaf=1, clf__min_samples_split=5, clf__n_estimators=500 


2021-09-01 05:58:21.913299 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=RandomForestClassifier(), clf__bootstrap=False, clf__max_depth=30, clf__max_features=sqrt, clf__min_samples_leaf=1, clf__min_samples_split=5, clf__n_estimators=500, score=0.871, total=   6.6s
[CV] clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=None,
              colsample_bynode=None, colsample_bytree=None, gamma=None,
              gpu_id=None, importance_type='gain', interaction_constraints=None,
              learning_rate=None, max_delta_step=None, max_depth=None,
              min_child_weight=None, missing=nan, monotone_constraints=None,
              n_estimators=100, n_jobs=None, num_parallel_tree=None,
              random_state=None, reg_alpha=None, reg_lambda=None,
              scale_pos_weight=None, subsample=None, tree_method=None,
              validate_parameters=None, verbosity=None), clf__colsample_bytree=0.4, clf__eval_metric=logloss, clf__gamma=1, clf__learning_rate=0.1, clf__max_depth=8, clf__min_child_weight=2, clf__n_estimators=350,

2021-09-01 05:58:28.546308 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=None,
              colsample_bynode=None, colsample_bytree=None, gamma=None,
              gpu_id=None, importance_type='gain', interaction_constraints=None,
              learning_rate=None, max_delta_step=None, max_depth=None,
              min_child_weight=None, missing=nan, monotone_constraints=None,
              n_estimators=100, n_jobs=None, num_parallel_tree=None,
              random_state=None, reg_alpha=None, reg_lambda=None,
              scale_pos_weight=None, subsample=None, tree_method=None,
              validate_parameters=None, verbosity=None), clf__colsample_bytree=0.4, clf__eval_metric=logloss, clf__gamma=1, clf__learning_rate=0.1, clf__max_depth=8, clf__min_child_weight=2, clf__n_estimators=350, clf__objective=binary:logistic, clf__subsample=0.9007190934314233, clf__use_label_encoder=False, score=0.827, total=   1.9s
[CV] clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=None

2021-09-01 05:58:30.428869 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=None,
              colsample_bynode=None, colsample_bytree=None, gamma=None,
              gpu_id=None, importance_type='gain', interaction_constraints=None,
              learning_rate=None, max_delta_step=None, max_depth=None,
              min_child_weight=None, missing=nan, monotone_constraints=None,
              n_estimators=100, n_jobs=None, num_parallel_tree=None,
              random_state=None, reg_alpha=None, reg_lambda=None,
              scale_pos_weight=None, subsample=None, tree_method=None,
              validate_parameters=None, verbosity=None), clf__colsample_bytree=0.4, clf__eval_metric=logloss, clf__gamma=1, clf__learning_rate=0.1, clf__max_depth=8, clf__min_child_weight=2, clf__n_estimators=350, clf__objective=binary:logistic, clf__subsample=0.9007190934314233, clf__use_label_encoder=False, score=0.723, total=   2.0s
[CV] clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=None

2021-09-01 05:58:32.405834 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=None,
              colsample_bynode=None, colsample_bytree=None, gamma=None,
              gpu_id=None, importance_type='gain', interaction_constraints=None,
              learning_rate=None, max_delta_step=None, max_depth=None,
              min_child_weight=None, missing=nan, monotone_constraints=None,
              n_estimators=100, n_jobs=None, num_parallel_tree=None,
              random_state=None, reg_alpha=None, reg_lambda=None,
              scale_pos_weight=None, subsample=None, tree_method=None,
              validate_parameters=None, verbosity=None), clf__colsample_bytree=0.4, clf__eval_metric=logloss, clf__gamma=1, clf__learning_rate=0.1, clf__max_depth=8, clf__min_child_weight=2, clf__n_estimators=350, clf__objective=binary:logistic, clf__subsample=0.9007190934314233, clf__use_label_encoder=False, score=0.806, total=   1.9s
[CV] clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=None

2021-09-01 05:58:34.353756 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=None,
              colsample_bynode=None, colsample_bytree=None, gamma=None,
              gpu_id=None, importance_type='gain', interaction_constraints=None,
              learning_rate=None, max_delta_step=None, max_depth=None,
              min_child_weight=None, missing=nan, monotone_constraints=None,
              n_estimators=100, n_jobs=None, num_parallel_tree=None,
              random_state=None, reg_alpha=None, reg_lambda=None,
              scale_pos_weight=None, subsample=None, tree_method=None,
              validate_parameters=None, verbosity=None), clf__colsample_bytree=0.4, clf__eval_metric=logloss, clf__gamma=2, clf__learning_rate=0.3, clf__max_depth=8, clf__min_child_weight=7, clf__n_estimators=490, clf__objective=binary:logistic, clf__subsample=0.9007190934314233, clf__use_label_encoder=False, score=0.739, total=   2.3s
[CV] clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=None

2021-09-01 05:58:36.666292 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=None,
              colsample_bynode=None, colsample_bytree=None, gamma=None,
              gpu_id=None, importance_type='gain', interaction_constraints=None,
              learning_rate=None, max_delta_step=None, max_depth=None,
              min_child_weight=None, missing=nan, monotone_constraints=None,
              n_estimators=100, n_jobs=None, num_parallel_tree=None,
              random_state=None, reg_alpha=None, reg_lambda=None,
              scale_pos_weight=None, subsample=None, tree_method=None,
              validate_parameters=None, verbosity=None), clf__colsample_bytree=0.4, clf__eval_metric=logloss, clf__gamma=2, clf__learning_rate=0.3, clf__max_depth=8, clf__min_child_weight=7, clf__n_estimators=490, clf__objective=binary:logistic, clf__subsample=0.9007190934314233, clf__use_label_encoder=False, score=0.657, total=   2.3s
[CV] clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=None

2021-09-01 05:58:39.009153 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=None,
              colsample_bynode=None, colsample_bytree=None, gamma=None,
              gpu_id=None, importance_type='gain', interaction_constraints=None,
              learning_rate=None, max_delta_step=None, max_depth=None,
              min_child_weight=None, missing=nan, monotone_constraints=None,
              n_estimators=100, n_jobs=None, num_parallel_tree=None,
              random_state=None, reg_alpha=None, reg_lambda=None,
              scale_pos_weight=None, subsample=None, tree_method=None,
              validate_parameters=None, verbosity=None), clf__colsample_bytree=0.4, clf__eval_metric=logloss, clf__gamma=2, clf__learning_rate=0.3, clf__max_depth=8, clf__min_child_weight=7, clf__n_estimators=490, clf__objective=binary:logistic, clf__subsample=0.9007190934314233, clf__use_label_encoder=False, score=0.702, total=   2.4s
[CV] clf=RandomForestClassifier(), clf__bootstrap=False, clf__max_depth=20, 

2021-09-01 05:58:41.405470 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=RandomForestClassifier(), clf__bootstrap=False, clf__max_depth=20, clf__max_features=auto, clf__min_samples_leaf=1, clf__min_samples_split=5, clf__n_estimators=100, score=0.884, total=   1.8s
[CV] clf=RandomForestClassifier(), clf__bootstrap=False, clf__max_depth=20, clf__max_features=auto, clf__min_samples_leaf=1, clf__min_samples_split=5, clf__n_estimators=100 


2021-09-01 05:58:43.204059 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=RandomForestClassifier(), clf__bootstrap=False, clf__max_depth=20, clf__max_features=auto, clf__min_samples_leaf=1, clf__min_samples_split=5, clf__n_estimators=100, score=0.805, total=   1.6s
[CV] clf=RandomForestClassifier(), clf__bootstrap=False, clf__max_depth=20, clf__max_features=auto, clf__min_samples_leaf=1, clf__min_samples_split=5, clf__n_estimators=100 


2021-09-01 05:58:44.831387 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=RandomForestClassifier(), clf__bootstrap=False, clf__max_depth=20, clf__max_features=auto, clf__min_samples_leaf=1, clf__min_samples_split=5, clf__n_estimators=100, score=0.862, total=   1.6s
[CV] clf=RandomForestClassifier(), clf__bootstrap=True, clf__max_depth=10, clf__max_features=auto, clf__min_samples_leaf=4, clf__min_samples_split=2, clf__n_estimators=500 


2021-09-01 05:58:46.415357 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=RandomForestClassifier(), clf__bootstrap=True, clf__max_depth=10, clf__max_features=auto, clf__min_samples_leaf=4, clf__min_samples_split=2, clf__n_estimators=500, score=0.648, total=   5.3s
[CV] clf=RandomForestClassifier(), clf__bootstrap=True, clf__max_depth=10, clf__max_features=auto, clf__min_samples_leaf=4, clf__min_samples_split=2, clf__n_estimators=500 


2021-09-01 05:58:51.684865 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=RandomForestClassifier(), clf__bootstrap=True, clf__max_depth=10, clf__max_features=auto, clf__min_samples_leaf=4, clf__min_samples_split=2, clf__n_estimators=500, score=0.570, total=   5.3s
[CV] clf=RandomForestClassifier(), clf__bootstrap=True, clf__max_depth=10, clf__max_features=auto, clf__min_samples_leaf=4, clf__min_samples_split=2, clf__n_estimators=500 


2021-09-01 05:58:57.035595 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=RandomForestClassifier(), clf__bootstrap=True, clf__max_depth=10, clf__max_features=auto, clf__min_samples_leaf=4, clf__min_samples_split=2, clf__n_estimators=500, score=0.649, total=   4.9s
[CV] clf=RandomForestClassifier(), clf__bootstrap=False, clf__max_depth=80, clf__max_features=sqrt, clf__min_samples_leaf=4, clf__min_samples_split=10, clf__n_estimators=400 


2021-09-01 05:59:01.902881 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=RandomForestClassifier(), clf__bootstrap=False, clf__max_depth=80, clf__max_features=sqrt, clf__min_samples_leaf=4, clf__min_samples_split=10, clf__n_estimators=400, score=0.852, total=   5.5s
[CV] clf=RandomForestClassifier(), clf__bootstrap=False, clf__max_depth=80, clf__max_features=sqrt, clf__min_samples_leaf=4, clf__min_samples_split=10, clf__n_estimators=400 


2021-09-01 05:59:07.394221 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=RandomForestClassifier(), clf__bootstrap=False, clf__max_depth=80, clf__max_features=sqrt, clf__min_samples_leaf=4, clf__min_samples_split=10, clf__n_estimators=400, score=0.754, total=   5.5s
[CV] clf=RandomForestClassifier(), clf__bootstrap=False, clf__max_depth=80, clf__max_features=sqrt, clf__min_samples_leaf=4, clf__min_samples_split=10, clf__n_estimators=400 


2021-09-01 05:59:12.931749 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=RandomForestClassifier(), clf__bootstrap=False, clf__max_depth=80, clf__max_features=sqrt, clf__min_samples_leaf=4, clf__min_samples_split=10, clf__n_estimators=400, score=0.828, total=   5.4s
[CV] clf=RandomForestClassifier(), clf__bootstrap=False, clf__max_depth=30, clf__max_features=auto, clf__min_samples_leaf=1, clf__min_samples_split=10, clf__n_estimators=100 


2021-09-01 05:59:18.312656 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=RandomForestClassifier(), clf__bootstrap=False, clf__max_depth=30, clf__max_features=auto, clf__min_samples_leaf=1, clf__min_samples_split=10, clf__n_estimators=100, score=0.884, total=   1.6s
[CV] clf=RandomForestClassifier(), clf__bootstrap=False, clf__max_depth=30, clf__max_features=auto, clf__min_samples_leaf=1, clf__min_samples_split=10, clf__n_estimators=100 


2021-09-01 05:59:19.945236 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=RandomForestClassifier(), clf__bootstrap=False, clf__max_depth=30, clf__max_features=auto, clf__min_samples_leaf=1, clf__min_samples_split=10, clf__n_estimators=100, score=0.796, total=   1.7s
[CV] clf=RandomForestClassifier(), clf__bootstrap=False, clf__max_depth=30, clf__max_features=auto, clf__min_samples_leaf=1, clf__min_samples_split=10, clf__n_estimators=100 


2021-09-01 05:59:21.601504 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=RandomForestClassifier(), clf__bootstrap=False, clf__max_depth=30, clf__max_features=auto, clf__min_samples_leaf=1, clf__min_samples_split=10, clf__n_estimators=100, score=0.860, total=   1.6s
[CV] clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=None,
              colsample_bynode=None, colsample_bytree=None, gamma=None,
              gpu_id=None, importance_type='gain', interaction_constraints=None,
              learning_rate=None, max_delta_step=None, max_depth=None,
              min_child_weight=None, missing=nan, monotone_constraints=None,
              n_estimators=100, n_jobs=None, num_parallel_tree=None,
              random_state=None, reg_alpha=None, reg_lambda=None,
              scale_pos_weight=None, subsample=None, tree_method=None,
              validate_parameters=None, verbosity=None), clf__colsample_bytree=0.5, clf__eval_metric=logloss, clf__gamma=1, clf__learning_rate=0.0001, clf__max_depth=6, clf__min_child_weight=7, clf__n_estimators=

2021-09-01 05:59:23.219186 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=None,
              colsample_bynode=None, colsample_bytree=None, gamma=None,
              gpu_id=None, importance_type='gain', interaction_constraints=None,
              learning_rate=None, max_delta_step=None, max_depth=None,
              min_child_weight=None, missing=nan, monotone_constraints=None,
              n_estimators=100, n_jobs=None, num_parallel_tree=None,
              random_state=None, reg_alpha=None, reg_lambda=None,
              scale_pos_weight=None, subsample=None, tree_method=None,
              validate_parameters=None, verbosity=None), clf__colsample_bytree=0.5, clf__eval_metric=logloss, clf__gamma=1, clf__learning_rate=0.0001, clf__max_depth=6, clf__min_child_weight=7, clf__n_estimators=180, clf__objective=binary:logistic, clf__subsample=0.9007190934314233, clf__use_label_encoder=False, score=0.034, total=   0.5s
[CV] clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=N

2021-09-01 05:59:23.750312 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=None,
              colsample_bynode=None, colsample_bytree=None, gamma=None,
              gpu_id=None, importance_type='gain', interaction_constraints=None,
              learning_rate=None, max_delta_step=None, max_depth=None,
              min_child_weight=None, missing=nan, monotone_constraints=None,
              n_estimators=100, n_jobs=None, num_parallel_tree=None,
              random_state=None, reg_alpha=None, reg_lambda=None,
              scale_pos_weight=None, subsample=None, tree_method=None,
              validate_parameters=None, verbosity=None), clf__colsample_bytree=0.5, clf__eval_metric=logloss, clf__gamma=1, clf__learning_rate=0.0001, clf__max_depth=6, clf__min_child_weight=7, clf__n_estimators=180, clf__objective=binary:logistic, clf__subsample=0.9007190934314233, clf__use_label_encoder=False, score=0.035, total=   0.6s
[CV] clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=N

2021-09-01 05:59:24.370548 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=None,
              colsample_bynode=None, colsample_bytree=None, gamma=None,
              gpu_id=None, importance_type='gain', interaction_constraints=None,
              learning_rate=None, max_delta_step=None, max_depth=None,
              min_child_weight=None, missing=nan, monotone_constraints=None,
              n_estimators=100, n_jobs=None, num_parallel_tree=None,
              random_state=None, reg_alpha=None, reg_lambda=None,
              scale_pos_weight=None, subsample=None, tree_method=None,
              validate_parameters=None, verbosity=None), clf__colsample_bytree=0.5, clf__eval_metric=logloss, clf__gamma=1, clf__learning_rate=0.0001, clf__max_depth=6, clf__min_child_weight=7, clf__n_estimators=180, clf__objective=binary:logistic, clf__subsample=0.9007190934314233, clf__use_label_encoder=False, score=0.050, total=   0.6s
[CV] clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=N

2021-09-01 05:59:24.986593 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=None,
              colsample_bynode=None, colsample_bytree=None, gamma=None,
              gpu_id=None, importance_type='gain', interaction_constraints=None,
              learning_rate=None, max_delta_step=None, max_depth=None,
              min_child_weight=None, missing=nan, monotone_constraints=None,
              n_estimators=100, n_jobs=None, num_parallel_tree=None,
              random_state=None, reg_alpha=None, reg_lambda=None,
              scale_pos_weight=None, subsample=None, tree_method=None,
              validate_parameters=None, verbosity=None), clf__colsample_bytree=0.3, clf__eval_metric=logloss, clf__gamma=5, clf__learning_rate=0.01, clf__max_depth=6, clf__min_child_weight=8, clf__n_estimators=310, clf__objective=binary:logistic, clf__subsample=0.9007190934314233, clf__use_label_encoder=False, score=0.119, total=   1.1s
[CV] clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=Non

2021-09-01 05:59:26.080433 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=None,
              colsample_bynode=None, colsample_bytree=None, gamma=None,
              gpu_id=None, importance_type='gain', interaction_constraints=None,
              learning_rate=None, max_delta_step=None, max_depth=None,
              min_child_weight=None, missing=nan, monotone_constraints=None,
              n_estimators=100, n_jobs=None, num_parallel_tree=None,
              random_state=None, reg_alpha=None, reg_lambda=None,
              scale_pos_weight=None, subsample=None, tree_method=None,
              validate_parameters=None, verbosity=None), clf__colsample_bytree=0.3, clf__eval_metric=logloss, clf__gamma=5, clf__learning_rate=0.01, clf__max_depth=6, clf__min_child_weight=8, clf__n_estimators=310, clf__objective=binary:logistic, clf__subsample=0.9007190934314233, clf__use_label_encoder=False, score=0.105, total=   1.1s
[CV] clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=Non

2021-09-01 05:59:27.200427 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=None,
              colsample_bynode=None, colsample_bytree=None, gamma=None,
              gpu_id=None, importance_type='gain', interaction_constraints=None,
              learning_rate=None, max_delta_step=None, max_depth=None,
              min_child_weight=None, missing=nan, monotone_constraints=None,
              n_estimators=100, n_jobs=None, num_parallel_tree=None,
              random_state=None, reg_alpha=None, reg_lambda=None,
              scale_pos_weight=None, subsample=None, tree_method=None,
              validate_parameters=None, verbosity=None), clf__colsample_bytree=0.3, clf__eval_metric=logloss, clf__gamma=5, clf__learning_rate=0.01, clf__max_depth=6, clf__min_child_weight=8, clf__n_estimators=310, clf__objective=binary:logistic, clf__subsample=0.9007190934314233, clf__use_label_encoder=False, score=0.143, total=   1.1s
[CV] clf=LGBMClassifier(), clf__colsample_bytree=0.5731341767005942, clf__m

2021-09-01 05:59:28.303488 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=LGBMClassifier(), clf__colsample_bytree=0.5731341767005942, clf__min_child_samples=134, clf__min_child_weight=1e-05, clf__num_leaves=40, clf__reg_alpha=5, clf__reg_lambda=50, clf__subsample=0.40181578955992386, score=0.211, total=   0.4s
[CV] clf=LGBMClassifier(), clf__colsample_bytree=0.5731341767005942, clf__min_child_samples=134, clf__min_child_weight=1e-05, clf__num_leaves=40, clf__reg_alpha=5, clf__reg_lambda=50, clf__subsample=0.40181578955992386 


2021-09-01 05:59:28.750563 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=LGBMClassifier(), clf__colsample_bytree=0.5731341767005942, clf__min_child_samples=134, clf__min_child_weight=1e-05, clf__num_leaves=40, clf__reg_alpha=5, clf__reg_lambda=50, clf__subsample=0.40181578955992386, score=0.205, total=   0.4s
[CV] clf=LGBMClassifier(), clf__colsample_bytree=0.5731341767005942, clf__min_child_samples=134, clf__min_child_weight=1e-05, clf__num_leaves=40, clf__reg_alpha=5, clf__reg_lambda=50, clf__subsample=0.40181578955992386 


2021-09-01 05:59:29.201136 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=LGBMClassifier(), clf__colsample_bytree=0.5731341767005942, clf__min_child_samples=134, clf__min_child_weight=1e-05, clf__num_leaves=40, clf__reg_alpha=5, clf__reg_lambda=50, clf__subsample=0.40181578955992386, score=0.175, total=   0.4s
[CV] clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=None,
              colsample_bynode=None, colsample_bytree=None, gamma=None,
              gpu_id=None, importance_type='gain', interaction_constraints=None,
              learning_rate=None, max_delta_step=None, max_depth=None,
              min_child_weight=None, missing=nan, monotone_constraints=None,
              n_estimators=100, n_jobs=None, num_parallel_tree=None,
              random_state=None, reg_alpha=None, reg_lambda=None,
              scale_pos_weight=None, subsample=None, tree_method=None,
              validate_parameters=None, verbosity=None), clf__colsample_bytree=0.5, clf__eval_metric=logloss, clf__gamma=0.5, clf__learning_rate=0.2, clf__max_depth=4,

2021-09-01 05:59:29.651048 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=None,
              colsample_bynode=None, colsample_bytree=None, gamma=None,
              gpu_id=None, importance_type='gain', interaction_constraints=None,
              learning_rate=None, max_delta_step=None, max_depth=None,
              min_child_weight=None, missing=nan, monotone_constraints=None,
              n_estimators=100, n_jobs=None, num_parallel_tree=None,
              random_state=None, reg_alpha=None, reg_lambda=None,
              scale_pos_weight=None, subsample=None, tree_method=None,
              validate_parameters=None, verbosity=None), clf__colsample_bytree=0.5, clf__eval_metric=logloss, clf__gamma=0.5, clf__learning_rate=0.2, clf__max_depth=4, clf__min_child_weight=7, clf__n_estimators=230, clf__objective=binary:logistic, clf__subsample=0.9007190934314233, clf__use_label_encoder=False, score=0.598, total=   1.1s
[CV] clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=No

2021-09-01 05:59:30.718886 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=None,
              colsample_bynode=None, colsample_bytree=None, gamma=None,
              gpu_id=None, importance_type='gain', interaction_constraints=None,
              learning_rate=None, max_delta_step=None, max_depth=None,
              min_child_weight=None, missing=nan, monotone_constraints=None,
              n_estimators=100, n_jobs=None, num_parallel_tree=None,
              random_state=None, reg_alpha=None, reg_lambda=None,
              scale_pos_weight=None, subsample=None, tree_method=None,
              validate_parameters=None, verbosity=None), clf__colsample_bytree=0.5, clf__eval_metric=logloss, clf__gamma=0.5, clf__learning_rate=0.2, clf__max_depth=4, clf__min_child_weight=7, clf__n_estimators=230, clf__objective=binary:logistic, clf__subsample=0.9007190934314233, clf__use_label_encoder=False, score=0.542, total=   1.0s
[CV] clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=No

2021-09-01 05:59:31.757444 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


[CV]  clf=XGBClassifier(base_score=None, booster=None, colsample_bylevel=None,
              colsample_bynode=None, colsample_bytree=None, gamma=None,
              gpu_id=None, importance_type='gain', interaction_constraints=None,
              learning_rate=None, max_delta_step=None, max_depth=None,
              min_child_weight=None, missing=nan, monotone_constraints=None,
              n_estimators=100, n_jobs=None, num_parallel_tree=None,
              random_state=None, reg_alpha=None, reg_lambda=None,
              scale_pos_weight=None, subsample=None, tree_method=None,
              validate_parameters=None, verbosity=None), clf__colsample_bytree=0.5, clf__eval_metric=logloss, clf__gamma=0.5, clf__learning_rate=0.2, clf__max_depth=4, clf__min_child_weight=7, clf__n_estimators=230, clf__objective=binary:logistic, clf__subsample=0.9007190934314233, clf__use_label_encoder=False, score=0.612, total=   1.1s


[Parallel(n_jobs=1)]: Done  60 out of  60 | elapsed:  2.0min finished
2021-09-01 05:59:32.868032 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
2021-09-01 05:59:32.869940 INFO: Hard mode for the ModifiedColumnTransformer set to True: The initial features are going to be enforced during transformation and fit steps
is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead


RandomizedSearchCV(cv=3,
                   estimator=Pipeline(steps=[('preprocessor',
                                              ModifiedColumnTransformer(categorical_features=['CODE_GENDER',
                                                                                              'FLAG_OWN_CAR',
                                                                                              'FLAG_OWN_REALTY',
                                                                                              'NAME_INCOME_TYPE',
                                                                                              'NAME_EDUCATION_TYPE',
                                                                                              'NAME_FAMILY_STATUS',
                                                                                              'NAME_HOUSING_TYPE',
                                                                                              'FLAG_MOBIL',
           

In [11]:
pd.DataFrame(rs.cv_results_).query("rank_test_score == 1")

Unnamed: 0,mean_fit_time,std_fit_time,mean_score_time,std_score_time,param_clf,param_clf__colsample_bytree,param_clf__min_child_samples,param_clf__min_child_weight,param_clf__num_leaves,param_clf__reg_alpha,...,param_clf__max_features,param_clf__min_samples_leaf,param_clf__min_samples_split,params,split0_test_score,split1_test_score,split2_test_score,mean_test_score,std_test_score,rank_test_score
9,6.375128,0.126052,0.426248,0.001836,"RandomForestClassifier(bootstrap=False, max_de...",,,,,,...,sqrt,1,5,{'clf': RandomForestClassifier(bootstrap=False...,0.886232,0.810797,0.871113,0.856047,0.032587,1


## Dump trained best estimator

In [12]:
with open(f"artifacts/{sts.TRAINED_BEST_ESTIMATOR_FILENAME}","wb") as file:
    pickle.dump(rs.best_estimator_, file)