In [1]:
import numpy as np
import pandas as pd
import lightgbm as lgb
from sklearn.model_selection import GridSearchCV,train_test_split,RandomizedSearchCV
from sklearn.metrics import f1_score, mean_squared_error, log_loss
from sklearn.preprocessing import LabelEncoder

In [2]:
data = pd.read_excel("/usr/input/flipr-hackathon-dataset/Train_dataset.xlsx")

In [3]:
data = data.drop(["Name", "Designation",],axis = 1)
data = data.loc[~data.iloc[:,[1,2,3,5,6,9,12,13,]].isnull().any(axis=1)]
y = data["Infect_Prob"]
data = data.drop(["Infect_Prob"], axis = 1)
#y = (y >= 50).astype("float64")
y /= 100

In [4]:
cat_features = [1,2,3,5,6,9,12,13,]

In [5]:
for i in cat_features:
    le = LabelEncoder()
    data.iloc[:,i] = le.fit_transform(data.iloc[:,i])

In [6]:
X_train, X_test, y_train, y_test = train_test_split(data.values, y, random_state = 42)

param = {"boosting_type":"gbdt","objective":"regression","learning_rate":0.001,"bagging_freq":1,"colsample_bytree":0.8, \
         "min_child_weight":10,"bagging_fraction":0.6,"max_bin":1000,"max_depth":4,"scale_pos_weight":1, \
         "lambda_l1":0.1475,"lambda_l2":0.05185,"min_gain_to_split":0.08,"metric": "mse", "n_threads" : 3,  \
         "n_estimators": 99999, "verbose": 0, "early_stopping_rounds" : 20}

In [7]:
train_data = lgb.Dataset(X_train, label = y_train, categorical_feature=cat_features)
val_data = lgb.Dataset(X_test, label = y_test, categorical_feature=cat_features)

In [8]:
grid_params = {"depth": [2,4,8,10], "num_leaves":[2,5,10,20,]}
clf = lgb.LGBMRegressor(boosting_type="gbdt",objective="regression",learning_rate=0.01, \
                        bagging_freq=1,colsample_bytree=0.8, bagging_fraction=0.8, \
                        max_bin=1000, scale_pos_weight=1, \
                        metric= "mse", n_threads = 3,n_estimators= 99999, verbose = 0,)
grid = GridSearchCV(estimator = clf, param_grid = grid_params, cv = 5, verbose = 2, scoring="neg_mean_squared_error")
grid.fit(X_train, y_train, eval_set = [(X_test, y_test)], early_stopping_rounds = 10, verbose = 0, categorical_feature = [1,2,3,5,6,9,12,13])

Fitting 5 folds for each of 16 candidates, totalling 80 fits
[CV] depth=2, num_leaves=2 ...........................................


[Parallel(n_jobs=1)]: Using backend SequentialBackend with 1 concurrent workers.
New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................ depth=2, num_leaves=2, total=   0.4s
[CV] depth=2, num_leaves=2 ...........................................


[Parallel(n_jobs=1)]: Done   1 out of   1 | elapsed:    0.4s remaining:    0.0s
New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................ depth=2, num_leaves=2, total=   0.4s
[CV] depth=2, num_leaves=2 ...........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................ depth=2, num_leaves=2, total=   0.4s
[CV] depth=2, num_leaves=2 ...........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................ depth=2, num_leaves=2, total=   0.5s
[CV] depth=2, num_leaves=2 ...........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................ depth=2, num_leaves=2, total=   0.5s
[CV] depth=2, num_leaves=5 ...........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................ depth=2, num_leaves=5, total=   0.3s
[CV] depth=2, num_leaves=5 ...........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................ depth=2, num_leaves=5, total=   0.3s
[CV] depth=2, num_leaves=5 ...........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................ depth=2, num_leaves=5, total=   0.4s
[CV] depth=2, num_leaves=5 ...........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................ depth=2, num_leaves=5, total=   0.3s
[CV] depth=2, num_leaves=5 ...........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................ depth=2, num_leaves=5, total=   0.3s
[CV] depth=2, num_leaves=10 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=2, num_leaves=10, total=   0.4s
[CV] depth=2, num_leaves=10 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=2, num_leaves=10, total=   0.5s
[CV] depth=2, num_leaves=10 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=2, num_leaves=10, total=   0.5s
[CV] depth=2, num_leaves=10 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=2, num_leaves=10, total=   0.4s
[CV] depth=2, num_leaves=10 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=2, num_leaves=10, total=   0.4s
[CV] depth=2, num_leaves=20 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=2, num_leaves=20, total=   0.5s
[CV] depth=2, num_leaves=20 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=2, num_leaves=20, total=   0.6s
[CV] depth=2, num_leaves=20 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=2, num_leaves=20, total=   0.5s
[CV] depth=2, num_leaves=20 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=2, num_leaves=20, total=   0.4s
[CV] depth=2, num_leaves=20 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=2, num_leaves=20, total=   0.4s
[CV] depth=4, num_leaves=2 ...........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................ depth=4, num_leaves=2, total=   0.4s
[CV] depth=4, num_leaves=2 ...........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................ depth=4, num_leaves=2, total=   0.5s
[CV] depth=4, num_leaves=2 ...........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................ depth=4, num_leaves=2, total=   0.4s
[CV] depth=4, num_leaves=2 ...........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................ depth=4, num_leaves=2, total=   0.5s
[CV] depth=4, num_leaves=2 ...........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................ depth=4, num_leaves=2, total=   0.5s
[CV] depth=4, num_leaves=5 ...........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................ depth=4, num_leaves=5, total=   0.3s
[CV] depth=4, num_leaves=5 ...........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................ depth=4, num_leaves=5, total=   0.3s
[CV] depth=4, num_leaves=5 ...........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................ depth=4, num_leaves=5, total=   0.4s
[CV] depth=4, num_leaves=5 ...........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................ depth=4, num_leaves=5, total=   0.3s
[CV] depth=4, num_leaves=5 ...........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................ depth=4, num_leaves=5, total=   0.3s
[CV] depth=4, num_leaves=10 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=4, num_leaves=10, total=   0.4s
[CV] depth=4, num_leaves=10 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=4, num_leaves=10, total=   0.5s
[CV] depth=4, num_leaves=10 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=4, num_leaves=10, total=   0.4s
[CV] depth=4, num_leaves=10 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=4, num_leaves=10, total=   0.4s
[CV] depth=4, num_leaves=10 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=4, num_leaves=10, total=   0.4s
[CV] depth=4, num_leaves=20 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=4, num_leaves=20, total=   0.5s
[CV] depth=4, num_leaves=20 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=4, num_leaves=20, total=   0.6s
[CV] depth=4, num_leaves=20 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=4, num_leaves=20, total=   0.7s
[CV] depth=4, num_leaves=20 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=4, num_leaves=20, total=   0.4s
[CV] depth=4, num_leaves=20 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=4, num_leaves=20, total=   0.4s
[CV] depth=8, num_leaves=2 ...........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................ depth=8, num_leaves=2, total=   0.4s
[CV] depth=8, num_leaves=2 ...........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................ depth=8, num_leaves=2, total=   0.4s
[CV] depth=8, num_leaves=2 ...........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................ depth=8, num_leaves=2, total=   0.4s
[CV] depth=8, num_leaves=2 ...........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................ depth=8, num_leaves=2, total=   0.5s
[CV] depth=8, num_leaves=2 ...........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................ depth=8, num_leaves=2, total=   0.5s
[CV] depth=8, num_leaves=5 ...........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................ depth=8, num_leaves=5, total=   0.3s
[CV] depth=8, num_leaves=5 ...........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................ depth=8, num_leaves=5, total=   0.9s
[CV] depth=8, num_leaves=5 ...........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................ depth=8, num_leaves=5, total=   0.4s
[CV] depth=8, num_leaves=5 ...........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................ depth=8, num_leaves=5, total=   0.3s
[CV] depth=8, num_leaves=5 ...........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................ depth=8, num_leaves=5, total=   0.4s
[CV] depth=8, num_leaves=10 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=8, num_leaves=10, total=   0.4s
[CV] depth=8, num_leaves=10 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=8, num_leaves=10, total=   0.5s
[CV] depth=8, num_leaves=10 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=8, num_leaves=10, total=   0.6s
[CV] depth=8, num_leaves=10 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=8, num_leaves=10, total=   0.4s
[CV] depth=8, num_leaves=10 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=8, num_leaves=10, total=   0.5s
[CV] depth=8, num_leaves=20 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=8, num_leaves=20, total=   1.2s
[CV] depth=8, num_leaves=20 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=8, num_leaves=20, total=   0.7s
[CV] depth=8, num_leaves=20 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=8, num_leaves=20, total=   0.5s
[CV] depth=8, num_leaves=20 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=8, num_leaves=20, total=   0.4s
[CV] depth=8, num_leaves=20 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=8, num_leaves=20, total=   0.4s
[CV] depth=10, num_leaves=2 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=10, num_leaves=2, total=   0.5s
[CV] depth=10, num_leaves=2 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=10, num_leaves=2, total=   0.4s
[CV] depth=10, num_leaves=2 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=10, num_leaves=2, total=   0.4s
[CV] depth=10, num_leaves=2 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=10, num_leaves=2, total=   0.5s
[CV] depth=10, num_leaves=2 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=10, num_leaves=2, total=   0.6s
[CV] depth=10, num_leaves=5 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=10, num_leaves=5, total=   0.3s
[CV] depth=10, num_leaves=5 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=10, num_leaves=5, total=   0.5s
[CV] depth=10, num_leaves=5 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=10, num_leaves=5, total=   0.4s
[CV] depth=10, num_leaves=5 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=10, num_leaves=5, total=   0.4s
[CV] depth=10, num_leaves=5 ..........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........................... depth=10, num_leaves=5, total=   0.4s
[CV] depth=10, num_leaves=10 .........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] .......................... depth=10, num_leaves=10, total=   0.4s
[CV] depth=10, num_leaves=10 .........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] .......................... depth=10, num_leaves=10, total=   0.5s
[CV] depth=10, num_leaves=10 .........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] .......................... depth=10, num_leaves=10, total=   0.4s
[CV] depth=10, num_leaves=10 .........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] .......................... depth=10, num_leaves=10, total=   0.4s
[CV] depth=10, num_leaves=10 .........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] .......................... depth=10, num_leaves=10, total=   0.4s
[CV] depth=10, num_leaves=20 .........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] .......................... depth=10, num_leaves=20, total=   0.5s
[CV] depth=10, num_leaves=20 .........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] .......................... depth=10, num_leaves=20, total=   0.6s
[CV] depth=10, num_leaves=20 .........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] .......................... depth=10, num_leaves=20, total=   0.5s
[CV] depth=10, num_leaves=20 .........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] .......................... depth=10, num_leaves=20, total=   0.5s
[CV] depth=10, num_leaves=20 .........................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] .......................... depth=10, num_leaves=20, total=   0.4s


[Parallel(n_jobs=1)]: Done  80 out of  80 | elapsed:   36.2s finished
New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


GridSearchCV(cv=5, error_score=nan,
             estimator=LGBMRegressor(bagging_fraction=0.8, bagging_freq=1,
                                     boosting_type='gbdt', class_weight=None,
                                     colsample_bytree=0.8,
                                     importance_type='split',
                                     learning_rate=0.01, max_bin=1000,
                                     max_depth=-1, metric='mse',
                                     min_child_samples=20,
                                     min_child_weight=0.001, min_split_gain=0.0,
                                     n_estimators=99999, n_jobs=-1, n_threads=3,
                                     num_leaves...ve='regression',
                                     random_state=None, reg_alpha=0.0,
                                     reg_lambda=0.0, scale_pos_weight=1,
                                     silent=True, subsample=1.0,
                                     subsample_for_bin=20

In [9]:
grid.best_params_

{'depth': 2, 'num_leaves': 5}

In [10]:
grid.best_score_

-0.006282281779430925

In [11]:
mean_squared_error(y_test, grid.best_estimator_.predict(X_test))

0.006502144954601772

In [12]:
grid_params = {"min_child_weight":[120,150,170,200,250,400,450,]}
clf = lgb.LGBMRegressor(boosting_type="gbdt",objective="regression",learning_rate=0.01, \
                        bagging_freq=1,colsample_bytree=0.8, bagging_fraction=0.8, \
                        max_bin=1000, scale_pos_weight=1, \
                        metric= "mse", n_threads = 3,n_estimators= 99999, verbose = 0, \
                        depth = 2, num_leaves = 5)
grid = GridSearchCV(estimator = clf, param_grid = grid_params, cv = 5, verbose = 2, scoring="neg_mean_squared_error")
grid.fit(X_train, y_train, eval_set = [(X_test, y_test)], early_stopping_rounds = 10, verbose = 0, categorical_feature = [1,2,3,5,6,9,12,13])

Fitting 5 folds for each of 7 candidates, totalling 35 fits
[CV] min_child_weight=120 ............................................


[Parallel(n_jobs=1)]: Using backend SequentialBackend with 1 concurrent workers.
New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................. min_child_weight=120, total=   0.4s
[CV] min_child_weight=120 ............................................


[Parallel(n_jobs=1)]: Done   1 out of   1 | elapsed:    0.4s remaining:    0.0s
New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................. min_child_weight=120, total=   0.4s
[CV] min_child_weight=120 ............................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................. min_child_weight=120, total=   0.4s
[CV] min_child_weight=120 ............................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................. min_child_weight=120, total=   0.4s
[CV] min_child_weight=120 ............................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................. min_child_weight=120, total=   0.4s
[CV] min_child_weight=150 ............................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................. min_child_weight=150, total=   0.4s
[CV] min_child_weight=150 ............................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................. min_child_weight=150, total=   0.3s
[CV] min_child_weight=150 ............................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................. min_child_weight=150, total=   0.4s
[CV] min_child_weight=150 ............................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................. min_child_weight=150, total=   0.3s
[CV] min_child_weight=150 ............................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................. min_child_weight=150, total=   0.4s
[CV] min_child_weight=170 ............................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................. min_child_weight=170, total=   0.3s
[CV] min_child_weight=170 ............................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................. min_child_weight=170, total=   0.3s
[CV] min_child_weight=170 ............................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................. min_child_weight=170, total=   0.4s
[CV] min_child_weight=170 ............................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................. min_child_weight=170, total=   0.5s
[CV] min_child_weight=170 ............................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................. min_child_weight=170, total=   0.4s
[CV] min_child_weight=200 ............................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................. min_child_weight=200, total=   0.3s
[CV] min_child_weight=200 ............................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................. min_child_weight=200, total=   0.4s
[CV] min_child_weight=200 ............................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................. min_child_weight=200, total=   0.5s
[CV] min_child_weight=200 ............................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................. min_child_weight=200, total=   0.4s
[CV] min_child_weight=200 ............................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................. min_child_weight=200, total=   0.4s
[CV] min_child_weight=250 ............................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................. min_child_weight=250, total=   0.4s
[CV] min_child_weight=250 ............................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................. min_child_weight=250, total=   0.4s
[CV] min_child_weight=250 ............................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................. min_child_weight=250, total=   0.5s
[CV] min_child_weight=250 ............................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................. min_child_weight=250, total=   0.4s
[CV] min_child_weight=250 ............................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................. min_child_weight=250, total=   0.4s
[CV] min_child_weight=400 ............................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................. min_child_weight=400, total=   0.4s
[CV] min_child_weight=400 ............................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................. min_child_weight=400, total=   0.4s
[CV] min_child_weight=400 ............................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................. min_child_weight=400, total=   0.4s
[CV] min_child_weight=400 ............................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................. min_child_weight=400, total=   0.4s
[CV] min_child_weight=400 ............................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................. min_child_weight=400, total=   0.4s
[CV] min_child_weight=450 ............................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................. min_child_weight=450, total=   0.4s
[CV] min_child_weight=450 ............................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................. min_child_weight=450, total=   0.4s
[CV] min_child_weight=450 ............................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................. min_child_weight=450, total=   0.5s
[CV] min_child_weight=450 ............................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................. min_child_weight=450, total=   0.5s
[CV] min_child_weight=450 ............................................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ............................. min_child_weight=450, total=   0.4s


[Parallel(n_jobs=1)]: Done  35 out of  35 | elapsed:   14.1s finished
New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


GridSearchCV(cv=5, error_score=nan,
             estimator=LGBMRegressor(bagging_fraction=0.8, bagging_freq=1,
                                     boosting_type='gbdt', class_weight=None,
                                     colsample_bytree=0.8, depth=2,
                                     importance_type='split',
                                     learning_rate=0.01, max_bin=1000,
                                     max_depth=-1, metric='mse',
                                     min_child_samples=20,
                                     min_child_weight=0.001, min_split_gain=0.0,
                                     n_estimators=99999, n_jobs=-1, n_threads=3,
                                     nu...egression',
                                     random_state=None, reg_alpha=0.0,
                                     reg_lambda=0.0, scale_pos_weight=1,
                                     silent=True, subsample=1.0,
                                     subsample_for_bin=200000

In [13]:
grid.best_params_

{'min_child_weight': 250}

In [14]:
grid.best_score_

-0.006217947880967147

In [15]:
mean_squared_error(y_test, grid.best_estimator_.predict(X_test))

0.006448070213684092

In [16]:
grid_params = {"colsample_bytree":[0.4,0.6,0.8,0.9,1],"bagging_fraction":[0.3,0.4,0.6,0.8,1]}
clf = lgb.LGBMRegressor(boosting_type="gbdt",objective="regression",learning_rate=0.01, \
                        bagging_freq=1, \
                        max_bin=1000, scale_pos_weight=1, \
                        metric= "mse", n_threads = 3,n_estimators= 99999, verbose = 0, \
                        depth = 2, num_leaves = 5, min_child_weight = 250,)
grid = GridSearchCV(estimator = clf, param_grid = grid_params, cv = 5, verbose = 2, scoring="neg_mean_squared_error")
grid.fit(X_train, y_train, eval_set = [(X_test, y_test)], early_stopping_rounds = 10, verbose = 0, categorical_feature = [1,2,3,5,6,9,12,13])

Fitting 5 folds for each of 25 candidates, totalling 125 fits
[CV] bagging_fraction=0.3, colsample_bytree=0.4 ......................


[Parallel(n_jobs=1)]: Using backend SequentialBackend with 1 concurrent workers.
New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.3, colsample_bytree=0.4, total=   0.4s
[CV] bagging_fraction=0.3, colsample_bytree=0.4 ......................


[Parallel(n_jobs=1)]: Done   1 out of   1 | elapsed:    0.4s remaining:    0.0s
New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.3, colsample_bytree=0.4, total=   0.5s
[CV] bagging_fraction=0.3, colsample_bytree=0.4 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.3, colsample_bytree=0.4, total=   0.4s
[CV] bagging_fraction=0.3, colsample_bytree=0.4 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.3, colsample_bytree=0.4, total=   0.5s
[CV] bagging_fraction=0.3, colsample_bytree=0.4 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.3, colsample_bytree=0.4, total=   0.4s
[CV] bagging_fraction=0.3, colsample_bytree=0.6 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.3, colsample_bytree=0.6, total=   0.4s
[CV] bagging_fraction=0.3, colsample_bytree=0.6 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.3, colsample_bytree=0.6, total=   0.4s
[CV] bagging_fraction=0.3, colsample_bytree=0.6 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.3, colsample_bytree=0.6, total=   0.4s
[CV] bagging_fraction=0.3, colsample_bytree=0.6 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.3, colsample_bytree=0.6, total=   0.5s
[CV] bagging_fraction=0.3, colsample_bytree=0.6 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.3, colsample_bytree=0.6, total=   0.4s
[CV] bagging_fraction=0.3, colsample_bytree=0.8 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.3, colsample_bytree=0.8, total=   0.3s
[CV] bagging_fraction=0.3, colsample_bytree=0.8 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.3, colsample_bytree=0.8, total=   0.5s
[CV] bagging_fraction=0.3, colsample_bytree=0.8 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.3, colsample_bytree=0.8, total=   0.5s
[CV] bagging_fraction=0.3, colsample_bytree=0.8 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.3, colsample_bytree=0.8, total=   0.4s
[CV] bagging_fraction=0.3, colsample_bytree=0.8 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.3, colsample_bytree=0.8, total=   0.4s
[CV] bagging_fraction=0.3, colsample_bytree=0.9 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.3, colsample_bytree=0.9, total=   0.3s
[CV] bagging_fraction=0.3, colsample_bytree=0.9 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.3, colsample_bytree=0.9, total=   0.3s
[CV] bagging_fraction=0.3, colsample_bytree=0.9 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.3, colsample_bytree=0.9, total=   0.4s
[CV] bagging_fraction=0.3, colsample_bytree=0.9 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.3, colsample_bytree=0.9, total=   0.4s
[CV] bagging_fraction=0.3, colsample_bytree=0.9 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.3, colsample_bytree=0.9, total=   0.4s
[CV] bagging_fraction=0.3, colsample_bytree=1 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=0.3, colsample_bytree=1, total=   0.3s
[CV] bagging_fraction=0.3, colsample_bytree=1 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=0.3, colsample_bytree=1, total=   0.5s
[CV] bagging_fraction=0.3, colsample_bytree=1 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=0.3, colsample_bytree=1, total=   0.4s
[CV] bagging_fraction=0.3, colsample_bytree=1 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=0.3, colsample_bytree=1, total=   0.4s
[CV] bagging_fraction=0.3, colsample_bytree=1 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=0.3, colsample_bytree=1, total=   0.4s
[CV] bagging_fraction=0.4, colsample_bytree=0.4 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.4, colsample_bytree=0.4, total=   0.3s
[CV] bagging_fraction=0.4, colsample_bytree=0.4 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.4, colsample_bytree=0.4, total=   0.4s
[CV] bagging_fraction=0.4, colsample_bytree=0.4 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.4, colsample_bytree=0.4, total=   0.4s
[CV] bagging_fraction=0.4, colsample_bytree=0.4 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.4, colsample_bytree=0.4, total=   0.4s
[CV] bagging_fraction=0.4, colsample_bytree=0.4 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.4, colsample_bytree=0.4, total=   0.4s
[CV] bagging_fraction=0.4, colsample_bytree=0.6 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.4, colsample_bytree=0.6, total=   0.3s
[CV] bagging_fraction=0.4, colsample_bytree=0.6 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.4, colsample_bytree=0.6, total=   0.5s
[CV] bagging_fraction=0.4, colsample_bytree=0.6 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.4, colsample_bytree=0.6, total=   0.4s
[CV] bagging_fraction=0.4, colsample_bytree=0.6 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.4, colsample_bytree=0.6, total=   0.4s
[CV] bagging_fraction=0.4, colsample_bytree=0.6 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.4, colsample_bytree=0.6, total=   0.5s
[CV] bagging_fraction=0.4, colsample_bytree=0.8 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.4, colsample_bytree=0.8, total=   0.4s
[CV] bagging_fraction=0.4, colsample_bytree=0.8 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.4, colsample_bytree=0.8, total=   0.3s
[CV] bagging_fraction=0.4, colsample_bytree=0.8 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.4, colsample_bytree=0.8, total=   0.4s
[CV] bagging_fraction=0.4, colsample_bytree=0.8 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.4, colsample_bytree=0.8, total=   0.4s
[CV] bagging_fraction=0.4, colsample_bytree=0.8 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.4, colsample_bytree=0.8, total=   0.4s
[CV] bagging_fraction=0.4, colsample_bytree=0.9 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.4, colsample_bytree=0.9, total=   0.4s
[CV] bagging_fraction=0.4, colsample_bytree=0.9 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.4, colsample_bytree=0.9, total=   0.3s
[CV] bagging_fraction=0.4, colsample_bytree=0.9 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.4, colsample_bytree=0.9, total=   0.3s
[CV] bagging_fraction=0.4, colsample_bytree=0.9 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.4, colsample_bytree=0.9, total=   0.4s
[CV] bagging_fraction=0.4, colsample_bytree=0.9 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.4, colsample_bytree=0.9, total=   0.4s
[CV] bagging_fraction=0.4, colsample_bytree=1 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=0.4, colsample_bytree=1, total=   0.4s
[CV] bagging_fraction=0.4, colsample_bytree=1 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=0.4, colsample_bytree=1, total=   0.4s
[CV] bagging_fraction=0.4, colsample_bytree=1 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=0.4, colsample_bytree=1, total=   0.4s
[CV] bagging_fraction=0.4, colsample_bytree=1 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=0.4, colsample_bytree=1, total=   0.4s
[CV] bagging_fraction=0.4, colsample_bytree=1 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=0.4, colsample_bytree=1, total=   0.3s
[CV] bagging_fraction=0.6, colsample_bytree=0.4 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.6, colsample_bytree=0.4, total=   0.4s
[CV] bagging_fraction=0.6, colsample_bytree=0.4 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.6, colsample_bytree=0.4, total=   0.5s
[CV] bagging_fraction=0.6, colsample_bytree=0.4 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.6, colsample_bytree=0.4, total=   0.4s
[CV] bagging_fraction=0.6, colsample_bytree=0.4 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.6, colsample_bytree=0.4, total=   0.4s
[CV] bagging_fraction=0.6, colsample_bytree=0.4 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.6, colsample_bytree=0.4, total=   0.4s
[CV] bagging_fraction=0.6, colsample_bytree=0.6 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.6, colsample_bytree=0.6, total=   0.3s
[CV] bagging_fraction=0.6, colsample_bytree=0.6 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.6, colsample_bytree=0.6, total=   0.4s
[CV] bagging_fraction=0.6, colsample_bytree=0.6 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.6, colsample_bytree=0.6, total=   0.3s
[CV] bagging_fraction=0.6, colsample_bytree=0.6 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.6, colsample_bytree=0.6, total=   0.4s
[CV] bagging_fraction=0.6, colsample_bytree=0.6 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.6, colsample_bytree=0.6, total=   0.3s
[CV] bagging_fraction=0.6, colsample_bytree=0.8 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.6, colsample_bytree=0.8, total=   0.5s
[CV] bagging_fraction=0.6, colsample_bytree=0.8 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.6, colsample_bytree=0.8, total=   0.3s
[CV] bagging_fraction=0.6, colsample_bytree=0.8 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.6, colsample_bytree=0.8, total=   0.3s
[CV] bagging_fraction=0.6, colsample_bytree=0.8 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.6, colsample_bytree=0.8, total=   0.3s
[CV] bagging_fraction=0.6, colsample_bytree=0.8 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.6, colsample_bytree=0.8, total=   0.3s
[CV] bagging_fraction=0.6, colsample_bytree=0.9 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.6, colsample_bytree=0.9, total=   0.3s
[CV] bagging_fraction=0.6, colsample_bytree=0.9 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.6, colsample_bytree=0.9, total=   0.4s
[CV] bagging_fraction=0.6, colsample_bytree=0.9 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.6, colsample_bytree=0.9, total=   0.3s
[CV] bagging_fraction=0.6, colsample_bytree=0.9 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.6, colsample_bytree=0.9, total=   0.3s
[CV] bagging_fraction=0.6, colsample_bytree=0.9 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.6, colsample_bytree=0.9, total=   0.4s
[CV] bagging_fraction=0.6, colsample_bytree=1 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=0.6, colsample_bytree=1, total=   0.4s
[CV] bagging_fraction=0.6, colsample_bytree=1 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=0.6, colsample_bytree=1, total=   0.3s
[CV] bagging_fraction=0.6, colsample_bytree=1 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=0.6, colsample_bytree=1, total=   1.1s
[CV] bagging_fraction=0.6, colsample_bytree=1 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=0.6, colsample_bytree=1, total=   0.6s
[CV] bagging_fraction=0.6, colsample_bytree=1 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=0.6, colsample_bytree=1, total=   0.4s
[CV] bagging_fraction=0.8, colsample_bytree=0.4 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.8, colsample_bytree=0.4, total=   0.5s
[CV] bagging_fraction=0.8, colsample_bytree=0.4 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.8, colsample_bytree=0.4, total=   0.5s
[CV] bagging_fraction=0.8, colsample_bytree=0.4 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.8, colsample_bytree=0.4, total=   0.5s
[CV] bagging_fraction=0.8, colsample_bytree=0.4 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.8, colsample_bytree=0.4, total=   0.4s
[CV] bagging_fraction=0.8, colsample_bytree=0.4 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.8, colsample_bytree=0.4, total=   0.5s
[CV] bagging_fraction=0.8, colsample_bytree=0.6 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.8, colsample_bytree=0.6, total=   0.4s
[CV] bagging_fraction=0.8, colsample_bytree=0.6 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.8, colsample_bytree=0.6, total=   0.5s
[CV] bagging_fraction=0.8, colsample_bytree=0.6 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.8, colsample_bytree=0.6, total=   0.5s
[CV] bagging_fraction=0.8, colsample_bytree=0.6 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.8, colsample_bytree=0.6, total=   0.7s
[CV] bagging_fraction=0.8, colsample_bytree=0.6 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.8, colsample_bytree=0.6, total=   0.4s
[CV] bagging_fraction=0.8, colsample_bytree=0.8 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.8, colsample_bytree=0.8, total=   0.5s
[CV] bagging_fraction=0.8, colsample_bytree=0.8 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.8, colsample_bytree=0.8, total=   0.4s
[CV] bagging_fraction=0.8, colsample_bytree=0.8 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.8, colsample_bytree=0.8, total=   0.5s
[CV] bagging_fraction=0.8, colsample_bytree=0.8 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.8, colsample_bytree=0.8, total=   0.5s
[CV] bagging_fraction=0.8, colsample_bytree=0.8 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.8, colsample_bytree=0.8, total=   0.4s
[CV] bagging_fraction=0.8, colsample_bytree=0.9 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.8, colsample_bytree=0.9, total=   0.5s
[CV] bagging_fraction=0.8, colsample_bytree=0.9 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.8, colsample_bytree=0.9, total=   0.4s
[CV] bagging_fraction=0.8, colsample_bytree=0.9 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.8, colsample_bytree=0.9, total=   0.5s
[CV] bagging_fraction=0.8, colsample_bytree=0.9 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.8, colsample_bytree=0.9, total=   0.4s
[CV] bagging_fraction=0.8, colsample_bytree=0.9 ......................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ....... bagging_fraction=0.8, colsample_bytree=0.9, total=   0.6s
[CV] bagging_fraction=0.8, colsample_bytree=1 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=0.8, colsample_bytree=1, total=   0.4s
[CV] bagging_fraction=0.8, colsample_bytree=1 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=0.8, colsample_bytree=1, total=   0.4s
[CV] bagging_fraction=0.8, colsample_bytree=1 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=0.8, colsample_bytree=1, total=   0.5s
[CV] bagging_fraction=0.8, colsample_bytree=1 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=0.8, colsample_bytree=1, total=   0.4s
[CV] bagging_fraction=0.8, colsample_bytree=1 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=0.8, colsample_bytree=1, total=   0.4s
[CV] bagging_fraction=1, colsample_bytree=0.4 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=1, colsample_bytree=0.4, total=   0.3s
[CV] bagging_fraction=1, colsample_bytree=0.4 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=1, colsample_bytree=0.4, total=   0.4s
[CV] bagging_fraction=1, colsample_bytree=0.4 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=1, colsample_bytree=0.4, total=   0.4s
[CV] bagging_fraction=1, colsample_bytree=0.4 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=1, colsample_bytree=0.4, total=   0.3s
[CV] bagging_fraction=1, colsample_bytree=0.4 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=1, colsample_bytree=0.4, total=   0.3s
[CV] bagging_fraction=1, colsample_bytree=0.6 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=1, colsample_bytree=0.6, total=   0.3s
[CV] bagging_fraction=1, colsample_bytree=0.6 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=1, colsample_bytree=0.6, total=   0.4s
[CV] bagging_fraction=1, colsample_bytree=0.6 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=1, colsample_bytree=0.6, total=   0.4s
[CV] bagging_fraction=1, colsample_bytree=0.6 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=1, colsample_bytree=0.6, total=   0.3s
[CV] bagging_fraction=1, colsample_bytree=0.6 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=1, colsample_bytree=0.6, total=   0.3s
[CV] bagging_fraction=1, colsample_bytree=0.8 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=1, colsample_bytree=0.8, total=   0.3s
[CV] bagging_fraction=1, colsample_bytree=0.8 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=1, colsample_bytree=0.8, total=   0.4s
[CV] bagging_fraction=1, colsample_bytree=0.8 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=1, colsample_bytree=0.8, total=   0.5s
[CV] bagging_fraction=1, colsample_bytree=0.8 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=1, colsample_bytree=0.8, total=   0.3s
[CV] bagging_fraction=1, colsample_bytree=0.8 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=1, colsample_bytree=0.8, total=   0.3s
[CV] bagging_fraction=1, colsample_bytree=0.9 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=1, colsample_bytree=0.9, total=   0.4s
[CV] bagging_fraction=1, colsample_bytree=0.9 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=1, colsample_bytree=0.9, total=   0.4s
[CV] bagging_fraction=1, colsample_bytree=0.9 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=1, colsample_bytree=0.9, total=   0.4s
[CV] bagging_fraction=1, colsample_bytree=0.9 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=1, colsample_bytree=0.9, total=   0.3s
[CV] bagging_fraction=1, colsample_bytree=0.9 ........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ......... bagging_fraction=1, colsample_bytree=0.9, total=   0.3s
[CV] bagging_fraction=1, colsample_bytree=1 ..........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........... bagging_fraction=1, colsample_bytree=1, total=   0.4s
[CV] bagging_fraction=1, colsample_bytree=1 ..........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........... bagging_fraction=1, colsample_bytree=1, total=   0.5s
[CV] bagging_fraction=1, colsample_bytree=1 ..........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........... bagging_fraction=1, colsample_bytree=1, total=   0.4s
[CV] bagging_fraction=1, colsample_bytree=1 ..........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........... bagging_fraction=1, colsample_bytree=1, total=   0.4s
[CV] bagging_fraction=1, colsample_bytree=1 ..........................


New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


[CV] ........... bagging_fraction=1, colsample_bytree=1, total=   0.4s


[Parallel(n_jobs=1)]: Done 125 out of 125 | elapsed:   50.6s finished
New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


GridSearchCV(cv=5, error_score=nan,
             estimator=LGBMRegressor(bagging_freq=1, boosting_type='gbdt',
                                     class_weight=None, colsample_bytree=1.0,
                                     depth=2, importance_type='split',
                                     learning_rate=0.01, max_bin=1000,
                                     max_depth=-1, metric='mse',
                                     min_child_samples=20, min_child_weight=250,
                                     min_split_gain=0.0, n_estimators=99999,
                                     n_jobs=-1, n_threads=3, num_leaves=5,
                                     objective='r...
                                     reg_alpha=0.0, reg_lambda=0.0,
                                     scale_pos_weight=1, silent=True,
                                     subsample=1.0, subsample_for_bin=200000,
                                     subsample_freq=0, verbose=0),
             iid='deprecated', n_jo

In [17]:
grid.best_params_

{'bagging_fraction': 0.8, 'colsample_bytree': 0.9}

In [18]:
grid.best_score_

-0.006198258285215179

In [19]:
mean_squared_error(y_test, grid.best_estimator_.predict(X_test))

0.006433414062505371

Now, most of the parameters have been optimised, so lower the learning rate and rerun the algorithm:

In [20]:
clf = lgb.LGBMRegressor(boosting_type="gbdt",objective="regression",learning_rate=0.001, \
                        bagging_freq=1, \
                        max_bin=100000, scale_pos_weight=1, \
                        metric= "mse", n_threads = 3,n_estimators= 99999, \
                        depth = 2, num_leaves = 5, min_child_weight = 250, \
                        colsample_bytree = 0.9, bagging_fraction = 0.8)
clf.fit(X_train, y_train, eval_set = [(X_test, y_test)], early_stopping_rounds = 30, verbose = 2, categorical_feature = [1,2,3,5,6,9,12,13])

New categorical_feature is [1, 2, 3, 5, 6, 9, 12, 13]
  'New categorical_feature is {}'.format(sorted(list(categorical_feature))))


Training until validation scores don't improve for 30 rounds
[2]	valid_0's l2: 0.0100897
[4]	valid_0's l2: 0.010077
[6]	valid_0's l2: 0.0100646
[8]	valid_0's l2: 0.0100522
[10]	valid_0's l2: 0.0100396
[12]	valid_0's l2: 0.0100267
[14]	valid_0's l2: 0.0100138
[16]	valid_0's l2: 0.0100016
[18]	valid_0's l2: 0.00998898
[20]	valid_0's l2: 0.00997645
[22]	valid_0's l2: 0.00996376
[24]	valid_0's l2: 0.00995444
[26]	valid_0's l2: 0.00994182
[28]	valid_0's l2: 0.00992928
[30]	valid_0's l2: 0.00991661
[32]	valid_0's l2: 0.00990436
[34]	valid_0's l2: 0.00989254
[36]	valid_0's l2: 0.00988019
[38]	valid_0's l2: 0.00986837
[40]	valid_0's l2: 0.00985589
[42]	valid_0's l2: 0.00984395
[44]	valid_0's l2: 0.00983205
[46]	valid_0's l2: 0.00981992
[48]	valid_0's l2: 0.00980793
[50]	valid_0's l2: 0.00979623
[52]	valid_0's l2: 0.00978414
[54]	valid_0's l2: 0.00977262
[56]	valid_0's l2: 0.00976086
[58]	valid_0's l2: 0.00974887
[60]	valid_0's l2: 0.00973715
[62]	valid_0's l2: 0.0097252
[64]	valid_0's l2: 0.00

LGBMRegressor(bagging_fraction=0.8, bagging_freq=1, boosting_type='gbdt',
              class_weight=None, colsample_bytree=0.9, depth=2,
              importance_type='split', learning_rate=0.001, max_bin=100000,
              max_depth=-1, metric='mse', min_child_samples=20,
              min_child_weight=250, min_split_gain=0.0, n_estimators=99999,
              n_jobs=-1, n_threads=3, num_leaves=5, objective='regression',
              random_state=None, reg_alpha=0.0, reg_lambda=0.0,
              scale_pos_weight=1, silent=True, subsample=1.0,
              subsample_for_bin=200000, subsample_freq=0)