In [1]:
import gc
import time
import pandas as pd
import numpy as np
import xgboost as xgb
import lightgbm as lgb

from sklearn.metrics import log_loss
from sklearn.model_selection import train_test_split, StratifiedKFold
from sklearn.feature_extraction.text import TfidfVectorizer, CountVectorizer

from bayes_opt import BayesianOptimization
from models_utils_fe import *



In [2]:
def xgb_bo(max_depth, min_child_weight, subsample, colsample_bytree):
    
    t = time.time()
    params = {
    'seed': 1337,
    'colsample_bytree': max(min(colsample_bytree, 1), 0),
    'silent': 1,
    'subsample': max(min(subsample, 1), 0),
    'eta': 0.05,
    'objective': 'binary:logistic',
    'eval_metric': 'logloss',
    'max_depth': int(max_depth),
    'min_child_weight': int(min_child_weight),
    'nthread': 4,
    'tree_method': 'hist',
    }
    
    dtrain = xgb.DMatrix(X_tr, label = y_tr)
    dval = xgb.DMatrix(X_val, label = y_val)
    watchlist = [(dtrain, 'train'), (dval, 'valid')]

    print('Start training...')
    gbm = xgb.train(params, dtrain, 100000, watchlist, 
                    early_stopping_rounds = 100, verbose_eval = 100)
    val_pred = gbm.predict(xgb.DMatrix(X_val), ntree_limit=gbm.best_ntree_limit)
    score = log_loss(y_val, val_pred)
    print('Final score:', score, '\n', 'Time it took to train and predict:', time.time() - t)
    return -score


def lgb_bo(max_depth, min_data_in_leaf, subsample, colsample_bytree, feature_fraction):
    params = {
        'task' : 'train',
        'boosting_type' : 'gbdt',
        'objective' : 'binary',
        'metric' : {'binary_logloss'},
        'learning_rate' : 0.05,
        'feature_fraction' : max(min(feature_fraction, 1), 0),
        'bagging_fraction': 0.9,
        'bagging_freq': 100,
        'num_leaves' : 255,
        'max_depth': int(max_depth),
        'min_data_in_leaf': int(min_data_in_leaf),
        'subsample': max(min(subsample, 1), 0),
        'colsample_bytree': max(min(colsample_bytree, 1), 0),
        'silent': 1,
        'random_state': 1337,
        'verbose': 1,
        'nthread': 9,
    }

    lgb_train = lgb.Dataset(X_tr, y_tr.is_duplicate.values)
    lgb_val = lgb.Dataset(X_val, y_val.is_duplicate.values)
    t = time.time()
    print('Start training...')
    gbm = lgb.train(params, lgb_train, num_boost_round = 100000, valid_sets = lgb_val,
                    early_stopping_rounds = 100, verbose_eval = 100)
    val_pred = gbm.predict(X_val, num_iteration=gbm.best_iteration)
    score = log_loss(y_val, val_pred)
    print('Final score:', score, '\n', 'Time it took to train and predict:', time.time() - t)
    return -score

In [6]:
src = '/media/w/1c392724-ecf3-4615-8f3c-79368ec36380/DS Projects/Kaggle/Quora/scripts/features/'
feats_src = '/media/w/1c392724-ecf3-4615-8f3c-79368ec36380/DS Projects/Kaggle/Quora/data/features/uncleaned/'

X_train = pd.read_pickle('Xtrain_825colsCurrentBest.pkl')
new_set = pd.read_pickle('train_NewSubset_BestAbhishek.pkl')
new_set.columns = ['{}_abhishek_new_lemmat'.format(i) for i in range(new_set.shape[1])]
new_network = pd.read_pickle('train_networkfeats_weighted_30.05.pkl')

xgb_feats = pd.read_csv(feats_src + '/the_1owl/owl_train.csv')
y_train = xgb_feats[['is_duplicate']]

for col in new_network.columns:
    X_train[col] = new_network[col]

X_train = pd.concat([X_train, new_set], axis = 1)
X_train = X_train.astype('float32')
print(X_train.shape)

X_tr, X_val, y_tr, y_val = train_test_split(X_train, y_train, stratify = y_train,
                                                    test_size = 0.2, random_state = 111)

del xgb_feats, new_set, new_network, X_train
gc.collect()

(404290, 905)


395

Step |   Time |      Value |   colsample_bytree |   feature_fraction |   max_depth |   min_data_in_leaf |   subsample | 

*  15 | 05m01s |   -0.18297 |             0.3500 |             0.5717 |      6.0000 |            27.8939 |      0.6900 |
* 7 | 03m49s |   -0.18385 |             0.3641 |             0.4773 |      6.3882 |            20.4263 |      0.8623 | 
*  9 | 03m29s |   -0.18331 |             0.4370 |             0.5345 |      7.6824 |            16.8610 |      0.7681 | 
*    13 | 03m11s |   -0.18492 |             0.5000 |             0.5032 |     10.0000 |            27.9822 |      0.6900 | 

In [8]:
lgbBO = BayesianOptimization(lgb_bo, {
        'max_depth': (6, 10),
        'min_data_in_leaf': (15, 28),
        'subsample': (0.69, 0.88),
        'colsample_bytree': (0.35, 0.5),
        'feature_fraction': (0.35, 0.65),
    })

num_iter = 15
init_points = 10
lgbBO.maximize(init_points=init_points, n_iter=num_iter)
print('lgb: %f' % lgbBO.res['max']['max_val'])

[31mInitialization[0m
[94m------------------------------------------------------------------------------------------------------------------------[0m
 Step |   Time |      Value |   colsample_bytree |   feature_fraction |   max_depth |   min_data_in_leaf |   subsample | 
Start training...
Train until valid scores didn't improve in 100 rounds.
[100]	valid_0's binary_logloss: 0.229462
[200]	valid_0's binary_logloss: 0.215266
[300]	valid_0's binary_logloss: 0.209817
[400]	valid_0's binary_logloss: 0.207121
[500]	valid_0's binary_logloss: 0.205499
[600]	valid_0's binary_logloss: 0.204589
[700]	valid_0's binary_logloss: 0.203774
[800]	valid_0's binary_logloss: 0.203344
[900]	valid_0's binary_logloss: 0.203177
[1000]	valid_0's binary_logloss: 0.202966
[1100]	valid_0's binary_logloss: 0.203027
Early stopping, best iteration is:
[1048]	valid_0's binary_logloss: 0.202936
Final score: 0.20296001502 
 Time it took to train and predict: 267.9007291793823
    1 | 04m27s | [35m  -0.20296[0m | 

Train until valid scores didn't improve in 100 rounds.
[100]	valid_0's binary_logloss: 0.195603
[200]	valid_0's binary_logloss: 0.187868
[300]	valid_0's binary_logloss: 0.185609
[400]	valid_0's binary_logloss: 0.184853
[500]	valid_0's binary_logloss: 0.184644
Early stopping, best iteration is:
[466]	valid_0's binary_logloss: 0.184432
Final score: 0.18443798461 
 Time it took to train and predict: 188.7857644557953
   10 | 03m08s |   -0.18444 |             0.4191 |             0.5459 |      9.9391 |            22.4966 |      0.7184 | 
[31mBayesian Optimization[0m
[94m------------------------------------------------------------------------------------------------------------------------[0m
 Step |   Time |      Value |   colsample_bytree |   feature_fraction |   max_depth |   min_data_in_leaf |   subsample | 
Start training...
Train until valid scores didn't improve in 100 rounds.
[100]	valid_0's binary_logloss: 0.203638
[200]	valid_0's binary_logloss: 0.193272
[300]	valid_0's binary

  " state: %s" % convergence_dict)


   14 | 04m32s |   -0.18404 |             0.4478 |             0.6500 |      6.0000 |            23.1621 |      0.6900 | 
Start training...
Train until valid scores didn't improve in 100 rounds.
[100]	valid_0's binary_logloss: 0.20374
[200]	valid_0's binary_logloss: 0.193147
[300]	valid_0's binary_logloss: 0.189679
[400]	valid_0's binary_logloss: 0.18791
[500]	valid_0's binary_logloss: 0.186757
[600]	valid_0's binary_logloss: 0.186008
[700]	valid_0's binary_logloss: 0.185528
[800]	valid_0's binary_logloss: 0.18508
[900]	valid_0's binary_logloss: 0.184623
[1000]	valid_0's binary_logloss: 0.184278
[1100]	valid_0's binary_logloss: 0.183954
[1200]	valid_0's binary_logloss: 0.183776
[1300]	valid_0's binary_logloss: 0.183621
[1400]	valid_0's binary_logloss: 0.183493
[1500]	valid_0's binary_logloss: 0.183369
[1600]	valid_0's binary_logloss: 0.183244
[1700]	valid_0's binary_logloss: 0.183016
[1800]	valid_0's binary_logloss: 0.18304
Early stopping, best iteration is:
[1756]	valid_0's binary_log

  " state: %s" % convergence_dict)


   16 | 04m34s |   -0.18375 |             0.4136 |             0.6500 |      7.9793 |            15.0000 |      0.6900 | 
Start training...
Train until valid scores didn't improve in 100 rounds.
[100]	valid_0's binary_logloss: 0.203513
[200]	valid_0's binary_logloss: 0.193349
[300]	valid_0's binary_logloss: 0.190083
[400]	valid_0's binary_logloss: 0.18833
[500]	valid_0's binary_logloss: 0.187327
[600]	valid_0's binary_logloss: 0.186565
[700]	valid_0's binary_logloss: 0.186077
[800]	valid_0's binary_logloss: 0.185408
[900]	valid_0's binary_logloss: 0.185005
[1000]	valid_0's binary_logloss: 0.184704
[1100]	valid_0's binary_logloss: 0.18448
[1200]	valid_0's binary_logloss: 0.184336
[1300]	valid_0's binary_logloss: 0.18407
[1400]	valid_0's binary_logloss: 0.183954
[1500]	valid_0's binary_logloss: 0.183879
[1600]	valid_0's binary_logloss: 0.183644
[1700]	valid_0's binary_logloss: 0.183391
[1800]	valid_0's binary_logloss: 0.183428
Early stopping, best iteration is:
[1700]	valid_0's binary_lo

  " state: %s" % convergence_dict)


   18 | 05m03s |   -0.18339 |             0.5000 |             0.6500 |      6.0000 |            20.9712 |      0.6900 | 
Start training...
Train until valid scores didn't improve in 100 rounds.
[100]	valid_0's binary_logloss: 0.195858
[200]	valid_0's binary_logloss: 0.188324
[300]	valid_0's binary_logloss: 0.186144
[400]	valid_0's binary_logloss: 0.185509
[500]	valid_0's binary_logloss: 0.185388
Early stopping, best iteration is:
[467]	valid_0's binary_logloss: 0.185218
Final score: 0.185232922101 
 Time it took to train and predict: 219.10521030426025
   19 | 04m05s |   -0.18523 |             0.3500 |             0.6500 |     10.0000 |            18.0077 |      0.8800 | 
Start training...
Train until valid scores didn't improve in 100 rounds.
[100]	valid_0's binary_logloss: 0.240768
[200]	valid_0's binary_logloss: 0.224385
[300]	valid_0's binary_logloss: 0.218325
[400]	valid_0's binary_logloss: 0.214758
[500]	valid_0's binary_logloss: 0.212582
[600]	valid_0's binary_logloss: 0.210846

  " state: %s" % convergence_dict)


   22 | 04m07s |   -0.18523 |             0.3500 |             0.6500 |     10.0000 |            20.7424 |      0.6900 | 
Start training...
Train until valid scores didn't improve in 100 rounds.
[100]	valid_0's binary_logloss: 0.203607
[200]	valid_0's binary_logloss: 0.193478
[300]	valid_0's binary_logloss: 0.19006
[400]	valid_0's binary_logloss: 0.188297
[500]	valid_0's binary_logloss: 0.187312
[600]	valid_0's binary_logloss: 0.186553
[700]	valid_0's binary_logloss: 0.185877
[800]	valid_0's binary_logloss: 0.185356
[900]	valid_0's binary_logloss: 0.18485
[1000]	valid_0's binary_logloss: 0.184662
[1100]	valid_0's binary_logloss: 0.184533
[1200]	valid_0's binary_logloss: 0.184389
[1300]	valid_0's binary_logloss: 0.184221
[1400]	valid_0's binary_logloss: 0.184077
[1500]	valid_0's binary_logloss: 0.183962
Early stopping, best iteration is:
[1493]	valid_0's binary_logloss: 0.183933
Final score: 0.183937515463 
 Time it took to train and predict: 272.5420994758606
   23 | 04m55s |   -0.1839



   24 | 04m05s |   -0.18502 |             0.5000 |             0.6500 |     10.0000 |            16.4653 |      0.6900 | 
Start training...
Train until valid scores didn't improve in 100 rounds.
[100]	valid_0's binary_logloss: 0.194892
[200]	valid_0's binary_logloss: 0.187571
[300]	valid_0's binary_logloss: 0.185677
[400]	valid_0's binary_logloss: 0.185158
Early stopping, best iteration is:
[375]	valid_0's binary_logloss: 0.185003
Final score: 0.185006663093 
 Time it took to train and predict: 206.67720913887024


  " state: %s" % convergence_dict)


   25 | 03m49s |   -0.18501 |             0.3500 |             0.6500 |     10.0000 |            26.4377 |      0.7411 | 
lgb: -0.182971


Step |   Time |      Value |   colsample_bytree |   max_depth |   min_child_weight |   subsample | 

* 2 | 27m56s |   -0.18223 |             0.4418 |      6.6308 |            21.9368 |      0.8242 | 
* 16 | 26m18s |   -0.18250 |             0.4628 |      7.6076 |            21.3771 |      0.8899 | 
* 13 | 32m26s |   -0.18254 |             0.4265 |      5.0034 |            29.9491 |      0.8833 | 

In [7]:
xgbBO = BayesianOptimization(xgb_bo, {
        'max_depth': (5, 10),
        'min_child_weight': (15, 30),
        'subsample': (0.69, 0.89),
        'colsample_bytree': (0.35, 0.47),
    })

num_iter = 15
init_points = 10
xgbBO.maximize(init_points=init_points, n_iter=num_iter)
print('XGB: %f' % xgbBO.res['max']['max_val'])

[31mInitialization[0m
[94m---------------------------------------------------------------------------------------------------[0m
 Step |   Time |      Value |   colsample_bytree |   max_depth |   min_child_weight |   subsample | 
Start training...
[0]	train-logloss:0.662004	valid-logloss:0.662131
Multiple eval metrics have been passed: 'valid-logloss' will be used for early stopping.

Will train until valid-logloss hasn't improved in 100 rounds.
[100]	train-logloss:0.202054	valid-logloss:0.206741
[200]	train-logloss:0.188426	valid-logloss:0.19542
[300]	train-logloss:0.181745	valid-logloss:0.191759
[400]	train-logloss:0.176674	valid-logloss:0.189656
[500]	train-logloss:0.172359	valid-logloss:0.188406
[600]	train-logloss:0.168297	valid-logloss:0.187367
[700]	train-logloss:0.164542	valid-logloss:0.186715
[800]	train-logloss:0.161137	valid-logloss:0.186278
[900]	train-logloss:0.157914	valid-logloss:0.18587
[1000]	train-logloss:0.154678	valid-logloss:0.1855
[1100]	train-logloss:0.151625

Start training...
[0]	train-logloss:0.659508	valid-logloss:0.65983
Multiple eval metrics have been passed: 'valid-logloss' will be used for early stopping.

Will train until valid-logloss hasn't improved in 100 rounds.
[100]	train-logloss:0.178195	valid-logloss:0.195713
[200]	train-logloss:0.155682	valid-logloss:0.187876
[300]	train-logloss:0.139175	valid-logloss:0.185768
[400]	train-logloss:0.125671	valid-logloss:0.184625
[500]	train-logloss:0.113595	valid-logloss:0.183765
[600]	train-logloss:0.103052	valid-logloss:0.183386
[700]	train-logloss:0.093999	valid-logloss:0.183166
[800]	train-logloss:0.085941	valid-logloss:0.18306
Stopping. Best iteration:
[789]	train-logloss:0.086697	valid-logloss:0.183008

Final score: 0.183008218923 
 Time it took to train and predict: 1106.8105146884918
    7 | 18m26s |   -0.18301 |             0.3782 |      9.5205 |            15.7572 |      0.8652 | 
Start training...
[0]	train-logloss:0.659586	valid-logloss:0.659944
Multiple eval metrics have been pa



[31mBayesian Optimization[0m
[94m---------------------------------------------------------------------------------------------------[0m
 Step |   Time |      Value |   colsample_bytree |   max_depth |   min_child_weight |   subsample | 
Start training...
[0]	train-logloss:0.661997	valid-logloss:0.662127
Multiple eval metrics have been passed: 'valid-logloss' will be used for early stopping.

Will train until valid-logloss hasn't improved in 100 rounds.
[100]	train-logloss:0.202179	valid-logloss:0.206934
[200]	train-logloss:0.18822	valid-logloss:0.195477
[300]	train-logloss:0.180913	valid-logloss:0.191716
[400]	train-logloss:0.175566	valid-logloss:0.189626
[500]	train-logloss:0.171031	valid-logloss:0.188414
[600]	train-logloss:0.166773	valid-logloss:0.187465
[700]	train-logloss:0.162898	valid-logloss:0.186806
[800]	train-logloss:0.159267	valid-logloss:0.186218
[900]	train-logloss:0.155723	valid-logloss:0.185749
[1000]	train-logloss:0.152367	valid-logloss:0.185362
[1100]	train-loglos

  " state: %s" % convergence_dict)


   11 | 32m05s |   -0.18269 |             0.4618 |      5.0117 |            15.0176 |      0.8503 | 
Start training...
[0]	train-logloss:0.662005	valid-logloss:0.662124
Multiple eval metrics have been passed: 'valid-logloss' will be used for early stopping.

Will train until valid-logloss hasn't improved in 100 rounds.
[100]	train-logloss:0.20202	valid-logloss:0.206607
[200]	train-logloss:0.188351	valid-logloss:0.195383
[300]	train-logloss:0.181498	valid-logloss:0.191541
[400]	train-logloss:0.176363	valid-logloss:0.189703
[500]	train-logloss:0.171741	valid-logloss:0.188403
[600]	train-logloss:0.167677	valid-logloss:0.187538
[700]	train-logloss:0.163713	valid-logloss:0.186934
[800]	train-logloss:0.160047	valid-logloss:0.186361
[900]	train-logloss:0.156602	valid-logloss:0.185982
[1000]	train-logloss:0.153191	valid-logloss:0.185615
[1100]	train-logloss:0.149956	valid-logloss:0.18528
[1200]	train-logloss:0.146961	valid-logloss:0.184995
[1300]	train-logloss:0.143985	valid-logloss:0.18466
[1

  " state: %s" % convergence_dict)


   14 | 21m46s |   -0.18259 |             0.4604 |      8.5407 |            19.7691 |      0.8841 | 
Start training...
[0]	train-logloss:0.660494	valid-logloss:0.660713
Multiple eval metrics have been passed: 'valid-logloss' will be used for early stopping.

Will train until valid-logloss hasn't improved in 100 rounds.
[100]	train-logloss:0.190047	valid-logloss:0.199036
[200]	train-logloss:0.173739	valid-logloss:0.190106
[300]	train-logloss:0.162653	valid-logloss:0.187442
[400]	train-logloss:0.152804	valid-logloss:0.186094
[500]	train-logloss:0.144004	valid-logloss:0.184988
[600]	train-logloss:0.136173	valid-logloss:0.184552
[700]	train-logloss:0.129605	valid-logloss:0.184093
[800]	train-logloss:0.12298	valid-logloss:0.183729
[900]	train-logloss:0.117008	valid-logloss:0.183297
[1000]	train-logloss:0.111255	valid-logloss:0.183057
[1100]	train-logloss:0.105915	valid-logloss:0.182882
[1200]	train-logloss:0.101039	valid-logloss:0.182702
Stopping. Best iteration:
[1172]	train-logloss:0.1023

  " state: %s" % convergence_dict)


   15 | 20m44s |   -0.18265 |             0.4667 |      7.1499 |            15.0903 |      0.8836 | 
Start training...
[0]	train-logloss:0.660519	valid-logloss:0.660734
Multiple eval metrics have been passed: 'valid-logloss' will be used for early stopping.

Will train until valid-logloss hasn't improved in 100 rounds.
[100]	train-logloss:0.190718	valid-logloss:0.199369
[200]	train-logloss:0.174671	valid-logloss:0.190352
[300]	train-logloss:0.16403	valid-logloss:0.187778
[400]	train-logloss:0.155059	valid-logloss:0.186238
[500]	train-logloss:0.147021	valid-logloss:0.185113
[600]	train-logloss:0.140055	valid-logloss:0.184533
[700]	train-logloss:0.133397	valid-logloss:0.184118
[800]	train-logloss:0.126998	valid-logloss:0.183772
[900]	train-logloss:0.121793	valid-logloss:0.183453
[1000]	train-logloss:0.116455	valid-logloss:0.183137
[1100]	train-logloss:0.111094	valid-logloss:0.183023
[1200]	train-logloss:0.106134	valid-logloss:0.182929
[1300]	train-logloss:0.101535	valid-logloss:0.18283
[

  " state: %s" % convergence_dict)


   16 | 26m18s |   -0.18250 |             0.4628 |      7.6076 |            21.3771 |      0.8899 | 
Start training...
[0]	train-logloss:0.659632	valid-logloss:0.659947
Multiple eval metrics have been passed: 'valid-logloss' will be used for early stopping.

Will train until valid-logloss hasn't improved in 100 rounds.
[100]	train-logloss:0.180555	valid-logloss:0.195828
[200]	train-logloss:0.16003	valid-logloss:0.188378
[300]	train-logloss:0.144983	valid-logloss:0.186472
[400]	train-logloss:0.132435	valid-logloss:0.185505
[500]	train-logloss:0.121353	valid-logloss:0.184938
[600]	train-logloss:0.11137	valid-logloss:0.18452
[700]	train-logloss:0.102301	valid-logloss:0.184222
[800]	train-logloss:0.094101	valid-logloss:0.184079
[900]	train-logloss:0.086669	valid-logloss:0.184021
Stopping. Best iteration:
[846]	train-logloss:0.090633	valid-logloss:0.183941

Final score: 0.183941080747 
 Time it took to train and predict: 1020.3468532562256


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   17 | 17m19s |   -0.18394 |             0.4687 |      9.9157 |            20.3852 |      0.7002 | 
Start training...
[0]	train-logloss:0.660494	valid-logloss:0.660711
Multiple eval metrics have been passed: 'valid-logloss' will be used for early stopping.

Will train until valid-logloss hasn't improved in 100 rounds.
[100]	train-logloss:0.190369	valid-logloss:0.199296
[200]	train-logloss:0.173984	valid-logloss:0.190199
[300]	train-logloss:0.162828	valid-logloss:0.187574
[400]	train-logloss:0.153707	valid-logloss:0.186074
[500]	train-logloss:0.145494	valid-logloss:0.185099
[600]	train-logloss:0.13751	valid-logloss:0.184489
[700]	train-logloss:0.130566	valid-logloss:0.183958
[800]	train-logloss:0.124212	valid-logloss:0.183666
[900]	train-logloss:0.118497	valid-logloss:0.183261
[1000]	train-logloss:0.112517	valid-logloss:0.183066
[1100]	train-logloss:0.107478	valid-logloss:0.182876
[1200]	train-logloss:0.102424	valid-logloss:0.182744
Stopping. Best iteration:
[1175]	train-logloss:0.1036

  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   21 | 32m19s |   -0.18231 |             0.4683 |      6.7427 |            22.0700 |      0.8571 | 
Start training...
[0]	train-logloss:0.660634	valid-logloss:0.660823
Multiple eval metrics have been passed: 'valid-logloss' will be used for early stopping.

Will train until valid-logloss hasn't improved in 100 rounds.
[100]	train-logloss:0.191396	valid-logloss:0.200003
[200]	train-logloss:0.175335	valid-logloss:0.190649
[300]	train-logloss:0.164973	valid-logloss:0.187919
[400]	train-logloss:0.156727	valid-logloss:0.186663
[500]	train-logloss:0.149041	valid-logloss:0.185778
[600]	train-logloss:0.142401	valid-logloss:0.184934
[700]	train-logloss:0.135871	valid-logloss:0.184579
[800]	train-logloss:0.129967	valid-logloss:0.184099
[900]	train-logloss:0.123997	valid-logloss:0.183753
[1000]	train-logloss:0.118844	valid-logloss:0.183553
[1100]	train-logloss:0.113403	valid-logloss:0.183381
[1200]	train-logloss:0.10861	valid-logloss:0.183247
[1300]	train-logloss:0.104034	valid-logloss:0.183131


  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   22 | 24m33s |   -0.18286 |             0.3528 |      7.1260 |            22.0360 |      0.7892 | 
Start training...
[0]	train-logloss:0.661255	valid-logloss:0.661417
Multiple eval metrics have been passed: 'valid-logloss' will be used for early stopping.

Will train until valid-logloss hasn't improved in 100 rounds.
[100]	train-logloss:0.196212	valid-logloss:0.202226
[200]	train-logloss:0.181711	valid-logloss:0.192363
[300]	train-logloss:0.173185	valid-logloss:0.189275
[400]	train-logloss:0.166383	valid-logloss:0.187657
[500]	train-logloss:0.160304	valid-logloss:0.186473
[600]	train-logloss:0.155004	valid-logloss:0.185757
[700]	train-logloss:0.149827	valid-logloss:0.185246
[800]	train-logloss:0.145113	valid-logloss:0.184847
[900]	train-logloss:0.140605	valid-logloss:0.184655
[1000]	train-logloss:0.135988	valid-logloss:0.184375
[1100]	train-logloss:0.131575	valid-logloss:0.18401
[1200]	train-logloss:0.12754	valid-logloss:0.183772
[1300]	train-logloss:0.12362	valid-logloss:0.183496
[1

  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   23 | 23m19s |   -0.18297 |             0.4477 |      6.5282 |            20.4139 |      0.7595 | 
Start training...
[0]	train-logloss:0.662011	valid-logloss:0.662135
Multiple eval metrics have been passed: 'valid-logloss' will be used for early stopping.

Will train until valid-logloss hasn't improved in 100 rounds.
[100]	train-logloss:0.202169	valid-logloss:0.206764
[200]	train-logloss:0.188656	valid-logloss:0.19561
[300]	train-logloss:0.181772	valid-logloss:0.191749
[400]	train-logloss:0.17674	valid-logloss:0.189973
[500]	train-logloss:0.17234	valid-logloss:0.188668
[600]	train-logloss:0.168307	valid-logloss:0.187796
[700]	train-logloss:0.164474	valid-logloss:0.187135
[800]	train-logloss:0.160953	valid-logloss:0.186686
[900]	train-logloss:0.157671	valid-logloss:0.186317
[1000]	train-logloss:0.154346	valid-logloss:0.185894
[1100]	train-logloss:0.151182	valid-logloss:0.185517
[1200]	train-logloss:0.148301	valid-logloss:0.185262
[1300]	train-logloss:0.145428	valid-logloss:0.184878
[1

  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   24 | 26m03s |   -0.18379 |             0.4551 |      5.5275 |            22.2331 |      0.6914 | 
Start training...
[0]	train-logloss:0.662006	valid-logloss:0.662132
Multiple eval metrics have been passed: 'valid-logloss' will be used for early stopping.

Will train until valid-logloss hasn't improved in 100 rounds.
[100]	train-logloss:0.202068	valid-logloss:0.20679
[200]	train-logloss:0.188119	valid-logloss:0.1953
[300]	train-logloss:0.181256	valid-logloss:0.191731
[400]	train-logloss:0.176116	valid-logloss:0.18977
[500]	train-logloss:0.17155	valid-logloss:0.188407
[600]	train-logloss:0.16718	valid-logloss:0.187388
[700]	train-logloss:0.163424	valid-logloss:0.186672
[800]	train-logloss:0.159783	valid-logloss:0.186218
[900]	train-logloss:0.156275	valid-logloss:0.185652
[1000]	train-logloss:0.152981	valid-logloss:0.185349
[1100]	train-logloss:0.149868	valid-logloss:0.185089
[1200]	train-logloss:0.146899	valid-logloss:0.184807
[1300]	train-logloss:0.144039	valid-logloss:0.18458
[1400]

  " state: %s" % convergence_dict)
  " state: %s" % convergence_dict)


   25 | 29m28s |   -0.18297 |             0.3941 |      5.4764 |            16.5597 |      0.8856 | 
XGB: -0.182231
