In [1]:
import numpy as np
import pandas as pd

from sklearn.model_selection import StratifiedKFold
from sklearn.metrics import roc_auc_score

from catboost import CatBoostClassifier
from catboost import Pool

import os

In [2]:
def trainCatBoost(trainSet, targetSet, params={'depth': 7, 'rate': 0.03, 'l2': 8, 'T': 1},
                  folds=10, maxIter=1000, verbose=True, dirName =  '/tmp/porto/catboost/'):
    """
    Train one CatBoost classifier per stratified fold and score the
    out-of-fold predictions with ROC AUC.

    :param trainSet: pandas dataframe with the features (rows are picked with .iloc)
    :param targetSet: pandas series with the labels, aligned with trainSet
    :param params: dict with the keys 'depth', 'rate' (learning_rate),
                   'l2' (l2_leaf_reg) and 'T' (bagging_temperature);
                   the default dict is only read, never modified
    :param folds: number of StratifiedKFold splits (shuffled, random_state=42)
    :param maxIter: upper bound on the boosting iterations of every fold model
    :param verbose: forwarded to CatBoostClassifier
    :param dirName: prefix of the log directory; the parameter values are
                    appended to it and every fold logs into its own sub-directory
    :return: list [score, treeList, scoreList, modelList] where score is the
             AUC over all out-of-fold predictions, treeList the tree count of
             every fold model, scoreList the validation AUC of every fold and
             modelList the fitted models
    """
    # create log directory: <prefix><depth>_<rate>_<l2>_<T>
    dirName = dirName + '_'.join(str(params.get(key)) for key in ('depth', 'rate', 'l2', 'T'))

    try:
        os.makedirs(dirName)
    except OSError as inst:
        # An already existing directory is the normal case on a re-run and is
        # not worth reporting; any other failure is still only printed
        # (best effort), as before.
        if not os.path.isdir(dirName):
            print(inst)

    treeList = list()
    scoreList = list()
    modelList = list()
    # out-of-fold probability of the positive class for every training row
    prob = np.zeros([trainSet.shape[0]])
    featureNames = trainSet.columns.tolist()

    skf = StratifiedKFold(n_splits=folds, shuffle=True, random_state=42)

    for i, (train_index, val_index) in enumerate(skf.split(trainSet, targetSet)):
        # every fold gets its own seed and its own log sub-directory
        model = CatBoostClassifier(verbose=verbose, iterations=maxIter, thread_count=4, eval_metric="AUC",
                                   depth=params['depth'], learning_rate=params['rate'],
                                   l2_leaf_reg=params['l2'], bagging_temperature=params['T'],
                                   od_type='Iter', od_wait=20,
                                   train_dir=dirName + "/" + str(i), random_seed=i)

        # create pool
        trainPool = Pool(trainSet.iloc[train_index], targetSet.iloc[train_index],
                         feature_names=featureNames)

        valPool = Pool(trainSet.iloc[val_index], targetSet.iloc[val_index],
                       feature_names=featureNames)

        # fit and estimate the model
        model.fit(trainPool, eval_set=valPool, use_best_model=True)
        prob[val_index] = model.predict_proba(valPool)[:, 1]
        localScore = roc_auc_score(targetSet.iloc[val_index], prob[val_index])

        treeList.append(model.tree_count_)
        scoreList.append(localScore)
        modelList.append(model)

    score = roc_auc_score(targetSet, prob)
    return [score, treeList, scoreList, modelList]

In [5]:
def getData():
    """
    Return Pandas dataframe for training.

    Reads '../data/train.csv' (indexed by 'id') and applies these steps:
      * every column whose name contains '_calc_' is dropped;
      * 'ps_car_15' is replaced by its square, 'ps_car_15_mod', stored as int;
      * the four indicator columns ps_ind_06_bin .. ps_ind_09_bin are folded
        into one code 'ps_ind_69_cat' (06 -> 0, 07 -> 1, 08 -> 2, 09 -> 3);
      * 'ps_ind_14' is dropped.

    :return: pandas dataframe
    """

    rawData = pd.read_csv('../data/train.csv', index_col='id')

    # drop _calc_ features
    calcColumns = [name for name in rawData.columns if '_calc_' in name]
    df = rawData.drop(calcColumns, axis=1)

    # squared feature "ps_car_15"
    # The stored values look like square roots of integers (3.464102, 2.828427, ...).
    # Squaring a rounded root can land just below the integer (11.9999999999),
    # so round before the cast: astype(int) alone truncates that to 11.
    squared = np.power(df.ps_car_15, 2).round().astype(int)
    df = df.assign(ps_car_15_mod=squared).drop("ps_car_15", axis=1)

    # inverse one-hot-encoding for ind_06 .. ind_09
    combined = 0*df.ps_ind_06_bin + df.ps_ind_07_bin + 2*df.ps_ind_08_bin + 3*df.ps_ind_09_bin
    df = df.assign(ps_ind_69_cat=combined)

    # drop the encoded indicator columns together with "ind_14"
    df = df.drop(['ps_ind_06_bin', 'ps_ind_07_bin', 'ps_ind_08_bin', 'ps_ind_09_bin',
                  'ps_ind_14'], axis=1)

    return df

In [3]:
# Hyper-parameters handed to trainCatBoost and to the seed ensembles:
# tree depth, l2_leaf_reg, learning_rate and bagging_temperature.
params = dict(depth=7, l2=5.5, rate=0.055, T=1.5)

In [4]:
# Load the pickled training frame and split it into labels and features.
# NOTE: the recorded output of this cell is an IOError - the pickle was
# missing when the notebook was last executed.
fName = "/tmp/porto/data/train2.pcl"
df = pd.read_pickle(fName)
b = df.target
a = df.drop("target", axis=1)


def getResult(x):
    """Run the 5-fold CatBoost training on (a, b) with the parameter dict x."""
    return trainCatBoost(a, b, x, maxIter=2000, folds=5, verbose=True)


score, treeList, scoreList, modelList = getResult(params)

IOError: [Errno 2] No such file or directory: '/tmp/porto/data/train2.pcl'

In [13]:
# Load the pickled test frame and preview its first rows.
testDf = pd.read_pickle("/tmp/porto/data/test2.pcl")
testDf.head()

Unnamed: 0_level_0,ps_ind_01,ps_ind_02_cat,ps_ind_03,ps_ind_04_cat,ps_ind_05_cat,ps_ind_06_bin,ps_ind_07_bin,ps_ind_08_bin,ps_ind_09_bin,ps_ind_10_bin,...,ps_car_07_cat,ps_car_08_cat,ps_car_09_cat,ps_car_10_cat,ps_car_11_cat,ps_car_11,ps_car_12,ps_car_13,ps_car_14,ps_car_15
id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
0,0,1,8,1,0,0,1,0,0,0,...,1,1,2,1,65,1,0.316228,0.669556,0.352136,3.464102
1,4,2,5,1,0,0,0,0,1,0,...,1,1,0,1,103,1,0.316228,0.60632,0.358329,2.828427
2,5,1,3,0,0,0,0,0,1,0,...,1,1,2,1,29,3,0.4,0.896239,0.398497,3.316625
3,0,1,6,0,0,1,0,0,0,0,...,1,1,2,1,40,2,0.374166,0.65211,0.381445,2.44949
4,5,1,7,0,0,0,0,0,1,0,...,1,1,2,1,101,3,0.374166,0.812914,0.385097,3.316625


In [14]:
# Wrap the test frame in a CatBoost Pool, passing its column names as feature names.
testPool = Pool(testDf, feature_names=testDf.columns.tolist())

In [16]:
# Rescale the out-of-fold ROC AUC to 2*AUC - 1
# (presumably the normalised Gini coefficient of the competition - confirm).
2*score-1

0.28156419164553737

In [31]:
# Tree count of the model kept for every fold (collected from model.tree_count_).
treeList

[311, 400, 321, 322, 331]

In [21]:
# Positive-class probability of every test row, one column per fold model.
# The width follows len(modelList) rather than a hard-coded 5, so changing the
# number of folds can neither overflow the buffer nor leave uninitialised
# columns that would silently enter the mean.
proba = np.empty([testDf.shape[0], len(modelList)])
for i, model in enumerate(modelList):
    proba[:,i] = model.predict_proba(testPool)[:,1]

In [24]:
# Row-wise mean over the per-model probability columns.
proba.mean(axis=1)

array([ 0.02455887,  0.02626326,  0.0256727 , ...,  0.03349493,
        0.02317673,  0.02941474])

In [28]:
def submit(pred, fName = 'submission.csv', index = None):
    """
    Write predictions to a CSV submission file with the columns 'id,target'.

    :param pred: predicted values, one per row of the submission
    :param fName: path of the CSV file to write
    :param index: row ids for the 'id' column; when None the index of the
                  globally loaded test frame ``testDf`` is used (the original
                  behaviour)
    """
    if index is None:
        # fall back to the ids of the test frame loaded earlier in the notebook
        index = testDf.index

    ## make submission file
    submission = pd.DataFrame(pred, columns=['target'], index=index)
    submission.to_csv(fName, index_label='id')

In [29]:
# Write the probabilities averaged over the fold models to a submission file.
submit(proba.mean(axis=1),'submission11.csv')

In [34]:
# Seed ensemble: refit the same configuration on the full training frame with
# five different random seeds (450 iterations each), keep the positive-class
# probability of every test row per seed and submit the row-wise mean.
seedCount = 5
trainFeatures = df.drop('target', axis=1)
proba = np.empty((testDf.shape[0], seedCount))

for seed in range(seedCount):
    model = CatBoostClassifier(
        iterations=450,
        depth=params['depth'],
        learning_rate=params['rate'],
        l2_leaf_reg=params['l2'],
        bagging_temperature=params['T'],
        eval_metric="AUC",
        thread_count=4,
        random_seed=seed,
        verbose=True,
    )
    model.fit(trainFeatures, df.target)
    proba[:, seed] = model.predict_proba(testPool)[:, 1]

submit(proba.mean(axis=1), 'submission12.csv')

Borders for float features generated
0:	learn 0.5000934936	total: 1.32s	remaining: 9m 51s
1:	learn 0.5672959221	total: 2.07s	remaining: 7m 44s
2:	learn 0.584546325	total: 2.7s	remaining: 6m 42s
3:	learn 0.5940151299	total: 3.56s	remaining: 6m 36s
4:	learn 0.5971203595	total: 4.33s	remaining: 6m 25s
5:	learn 0.5999253437	total: 5.05s	remaining: 6m 13s
6:	learn 0.6065022303	total: 5.77s	remaining: 6m 5s
7:	learn 0.6056495869	total: 6.51s	remaining: 6m
8:	learn 0.6069375993	total: 7.48s	remaining: 6m 6s
9:	learn 0.6095271382	total: 8.24s	remaining: 6m 2s
10:	learn 0.6102613597	total: 8.92s	remaining: 5m 56s
11:	learn 0.6124226506	total: 9.57s	remaining: 5m 49s
12:	learn 0.6155577105	total: 10.1s	remaining: 5m 39s
13:	learn 0.6181297131	total: 11.8s	remaining: 6m 8s
14:	learn 0.61826191	total: 12.6s	remaining: 6m 4s
15:	learn 0.6206948568	total: 13.7s	remaining: 6m 11s
16:	learn 0.6216294446	total: 14.4s	remaining: 6m 6s
17:	learn 0.6217101168	total: 16.1s	remaining: 6m 25s
18:	learn 0.621

298:	learn 0.6615483077	total: 4m 36s	remaining: 2m 19s
299:	learn 0.6616243297	total: 4m 37s	remaining: 2m 18s
300:	learn 0.6617248708	total: 4m 39s	remaining: 2m 18s
301:	learn 0.6617393932	total: 4m 40s	remaining: 2m 17s
302:	learn 0.6618200026	total: 4m 41s	remaining: 2m 16s
303:	learn 0.6618831566	total: 4m 41s	remaining: 2m 15s
304:	learn 0.6619073996	total: 4m 42s	remaining: 2m 14s
305:	learn 0.6619973847	total: 4m 43s	remaining: 2m 13s
306:	learn 0.6620851615	total: 4m 44s	remaining: 2m 12s
307:	learn 0.6621286883	total: 4m 44s	remaining: 2m 11s
308:	learn 0.6621784788	total: 4m 46s	remaining: 2m 10s
309:	learn 0.6622671898	total: 4m 46s	remaining: 2m 9s
310:	learn 0.662319393	total: 4m 47s	remaining: 2m 8s
311:	learn 0.662418818	total: 4m 48s	remaining: 2m 7s
312:	learn 0.6624875106	total: 4m 49s	remaining: 2m 6s
313:	learn 0.66254871	total: 4m 50s	remaining: 2m 5s
314:	learn 0.6627021706	total: 4m 50s	remaining: 2m 4s
315:	learn 0.6627965901	total: 4m 51s	remaining: 2m 3s
316

447:	learn 0.6710030935	total: 6m 53s	remaining: 1.85s
448:	learn 0.6710237151	total: 6m 54s	remaining: 923ms
449:	learn 0.6711100189	total: 6m 55s	remaining: 0us
Borders for float features generated
0:	learn 0.565882635	total: 852ms	remaining: 6m 22s
1:	learn 0.5801185719	total: 1.55s	remaining: 5m 48s
2:	learn 0.5802060839	total: 1.94s	remaining: 4m 48s
3:	learn 0.5849787811	total: 2.67s	remaining: 4m 57s
4:	learn 0.5933050696	total: 3.36s	remaining: 4m 58s
5:	learn 0.5930679968	total: 4.82s	remaining: 5m 56s
6:	learn 0.6042746501	total: 5.52s	remaining: 5m 49s
7:	learn 0.6078211968	total: 6.23s	remaining: 5m 44s
8:	learn 0.6091700901	total: 8.37s	remaining: 6m 50s
9:	learn 0.6100054967	total: 9.81s	remaining: 7m 11s
10:	learn 0.6098413492	total: 10.4s	remaining: 6m 57s
11:	learn 0.6122821879	total: 11.2s	remaining: 6m 48s
12:	learn 0.6154900502	total: 12.5s	remaining: 6m 58s
13:	learn 0.6163956339	total: 13.1s	remaining: 6m 49s
14:	learn 0.6167153134	total: 14.3s	remaining: 6m 54s
1

148:	learn 0.6485447912	total: 2m 20s	remaining: 4m 43s
149:	learn 0.6487225623	total: 2m 21s	remaining: 4m 43s
150:	learn 0.6487554917	total: 2m 22s	remaining: 4m 41s
151:	learn 0.6487973415	total: 2m 22s	remaining: 4m 40s
152:	learn 0.6488731035	total: 2m 23s	remaining: 4m 38s
153:	learn 0.6490988843	total: 2m 24s	remaining: 4m 37s
154:	learn 0.6492147648	total: 2m 25s	remaining: 4m 36s
155:	learn 0.6492846625	total: 2m 25s	remaining: 4m 34s
156:	learn 0.6493678914	total: 2m 26s	remaining: 4m 33s
157:	learn 0.6494418855	total: 2m 27s	remaining: 4m 32s
158:	learn 0.6496389964	total: 2m 28s	remaining: 4m 31s
159:	learn 0.6497321884	total: 2m 30s	remaining: 4m 32s
160:	learn 0.6497649183	total: 2m 30s	remaining: 4m 30s
161:	learn 0.6498250095	total: 2m 31s	remaining: 4m 29s
162:	learn 0.6499525017	total: 2m 32s	remaining: 4m 28s
163:	learn 0.6501723903	total: 2m 34s	remaining: 4m 28s
164:	learn 0.6502305547	total: 2m 34s	remaining: 4m 27s
165:	learn 0.6502913727	total: 2m 35s	remaining:

296:	learn 0.6621463552	total: 4m 39s	remaining: 2m 23s
297:	learn 0.662193248	total: 4m 39s	remaining: 2m 22s
298:	learn 0.6622572473	total: 4m 40s	remaining: 2m 21s
299:	learn 0.6624548251	total: 4m 41s	remaining: 2m 20s
300:	learn 0.6624982761	total: 4m 42s	remaining: 2m 19s
301:	learn 0.6625824487	total: 4m 42s	remaining: 2m 18s
302:	learn 0.6626236638	total: 4m 43s	remaining: 2m 17s
303:	learn 0.6627320434	total: 4m 44s	remaining: 2m 16s
304:	learn 0.6628070605	total: 4m 46s	remaining: 2m 16s
305:	learn 0.6629000129	total: 4m 46s	remaining: 2m 14s
306:	learn 0.6629539279	total: 4m 47s	remaining: 2m 13s
307:	learn 0.662986053	total: 4m 48s	remaining: 2m 12s
308:	learn 0.6631054217	total: 4m 48s	remaining: 2m 11s
309:	learn 0.6631827068	total: 4m 50s	remaining: 2m 11s
310:	learn 0.6632483438	total: 4m 51s	remaining: 2m 10s
311:	learn 0.663379058	total: 4m 54s	remaining: 2m 10s
312:	learn 0.6634253894	total: 4m 56s	remaining: 2m 9s
313:	learn 0.6635162427	total: 4m 56s	remaining: 2m 

445:	learn 0.6716783011	total: 6m 52s	remaining: 3.7s
446:	learn 0.6717011463	total: 6m 54s	remaining: 2.78s
447:	learn 0.6717915998	total: 6m 54s	remaining: 1.85s
448:	learn 0.6719866468	total: 6m 55s	remaining: 926ms
449:	learn 0.6720301929	total: 6m 57s	remaining: 0us
Borders for float features generated
0:	learn 0.5179561088	total: 489ms	remaining: 3m 39s
1:	learn 0.5811339717	total: 2.1s	remaining: 7m 51s
2:	learn 0.5955492835	total: 2.74s	remaining: 6m 48s
3:	learn 0.6017599027	total: 3.43s	remaining: 6m 22s
4:	learn 0.601885983	total: 4.34s	remaining: 6m 25s
5:	learn 0.6022898114	total: 5.04s	remaining: 6m 12s
6:	learn 0.6052037	total: 5.76s	remaining: 6m 4s
7:	learn 0.6066867585	total: 6.46s	remaining: 5m 56s
8:	learn 0.6111110738	total: 8.56s	remaining: 6m 59s
9:	learn 0.6134171598	total: 9.92s	remaining: 7m 16s
10:	learn 0.6145814048	total: 10.6s	remaining: 7m 4s
11:	learn 0.6185231197	total: 11.4s	remaining: 6m 54s
12:	learn 0.6180317389	total: 12s	remaining: 6m 44s
13:	lear

146:	learn 0.6488783722	total: 2m 13s	remaining: 4m 35s
147:	learn 0.6490719136	total: 2m 15s	remaining: 4m 37s
148:	learn 0.6491464594	total: 2m 17s	remaining: 4m 37s
149:	learn 0.6493086694	total: 2m 19s	remaining: 4m 38s
150:	learn 0.6493783129	total: 2m 20s	remaining: 4m 37s
151:	learn 0.6495757095	total: 2m 20s	remaining: 4m 36s
152:	learn 0.6497179207	total: 2m 21s	remaining: 4m 34s
153:	learn 0.6497938558	total: 2m 22s	remaining: 4m 33s
154:	learn 0.6498388584	total: 2m 23s	remaining: 4m 32s
155:	learn 0.6499458468	total: 2m 23s	remaining: 4m 30s
156:	learn 0.65000436	total: 2m 24s	remaining: 4m 29s
157:	learn 0.6501375117	total: 2m 25s	remaining: 4m 29s
158:	learn 0.6502542331	total: 2m 26s	remaining: 4m 28s
159:	learn 0.650422025	total: 2m 27s	remaining: 4m 26s
160:	learn 0.6505816157	total: 2m 27s	remaining: 4m 25s
161:	learn 0.6506624395	total: 2m 28s	remaining: 4m 24s
162:	learn 0.6508200779	total: 2m 30s	remaining: 4m 24s
163:	learn 0.6509254258	total: 2m 30s	remaining: 4m

294:	learn 0.6623617533	total: 4m 32s	remaining: 2m 23s
295:	learn 0.6624258427	total: 4m 32s	remaining: 2m 21s
296:	learn 0.6625220435	total: 4m 33s	remaining: 2m 20s
297:	learn 0.6626300077	total: 4m 35s	remaining: 2m 20s
298:	learn 0.6627075261	total: 4m 37s	remaining: 2m 20s
299:	learn 0.6627373234	total: 4m 38s	remaining: 2m 19s
300:	learn 0.6628143885	total: 4m 39s	remaining: 2m 18s
301:	learn 0.6628474653	total: 4m 40s	remaining: 2m 17s
302:	learn 0.66291683	total: 4m 40s	remaining: 2m 16s
303:	learn 0.6629918256	total: 4m 41s	remaining: 2m 15s
304:	learn 0.6632169354	total: 4m 42s	remaining: 2m 14s
305:	learn 0.6632979822	total: 4m 42s	remaining: 2m 13s
306:	learn 0.6633515009	total: 4m 43s	remaining: 2m 12s
307:	learn 0.6634190307	total: 4m 44s	remaining: 2m 11s
308:	learn 0.6635221557	total: 4m 45s	remaining: 2m 10s
309:	learn 0.6636614607	total: 4m 46s	remaining: 2m 9s
310:	learn 0.6636987358	total: 4m 46s	remaining: 2m 8s
311:	learn 0.6638197941	total: 4m 47s	remaining: 2m 

443:	learn 0.672037756	total: 6m 48s	remaining: 5.51s
444:	learn 0.6721052909	total: 6m 48s	remaining: 4.59s
445:	learn 0.6721304475	total: 6m 49s	remaining: 3.67s
446:	learn 0.6722108581	total: 6m 50s	remaining: 2.76s
447:	learn 0.6722736038	total: 6m 51s	remaining: 1.84s
448:	learn 0.672301675	total: 6m 52s	remaining: 918ms
449:	learn 0.6723560325	total: 6m 52s	remaining: 0us
Borders for float features generated
0:	learn 0.5589580314	total: 619ms	remaining: 4m 37s
1:	learn 0.5722770417	total: 1.32s	remaining: 4m 56s
2:	learn 0.5906500834	total: 2.11s	remaining: 5m 15s
3:	learn 0.5970101557	total: 2.78s	remaining: 5m 10s
4:	learn 0.5960474142	total: 3.55s	remaining: 5m 16s
5:	learn 0.5987490494	total: 4.21s	remaining: 5m 11s
6:	learn 0.6013351894	total: 4.86s	remaining: 5m 7s
7:	learn 0.6020734272	total: 5.64s	remaining: 5m 11s
8:	learn 0.6069933045	total: 6.34s	remaining: 5m 10s
9:	learn 0.6086626757	total: 7.03s	remaining: 5m 9s
10:	learn 0.6081694919	total: 7.74s	remaining: 5m 9s
1

144:	learn 0.6478844519	total: 2m 9s	remaining: 4m 31s
145:	learn 0.6480066736	total: 2m 9s	remaining: 4m 30s
146:	learn 0.6480017512	total: 2m 10s	remaining: 4m 28s
147:	learn 0.6481350597	total: 2m 11s	remaining: 4m 28s
148:	learn 0.6483125876	total: 2m 12s	remaining: 4m 27s
149:	learn 0.6483734376	total: 2m 13s	remaining: 4m 27s
150:	learn 0.6484836805	total: 2m 15s	remaining: 4m 28s
151:	learn 0.6485341658	total: 2m 16s	remaining: 4m 26s
152:	learn 0.6486015566	total: 2m 16s	remaining: 4m 25s
153:	learn 0.6487035652	total: 2m 17s	remaining: 4m 24s
154:	learn 0.6488050525	total: 2m 18s	remaining: 4m 23s
155:	learn 0.6489190405	total: 2m 19s	remaining: 4m 22s
156:	learn 0.6490193178	total: 2m 21s	remaining: 4m 23s
157:	learn 0.6490502183	total: 2m 22s	remaining: 4m 22s
158:	learn 0.6493197478	total: 2m 22s	remaining: 4m 21s
159:	learn 0.6494720463	total: 2m 23s	remaining: 4m 20s
160:	learn 0.64961892	total: 2m 25s	remaining: 4m 21s
161:	learn 0.6498329411	total: 2m 26s	remaining: 4m 

292:	learn 0.6617600613	total: 4m 28s	remaining: 2m 23s
293:	learn 0.6617842724	total: 4m 29s	remaining: 2m 23s
294:	learn 0.6618789083	total: 4m 30s	remaining: 2m 22s
295:	learn 0.6619311222	total: 4m 31s	remaining: 2m 21s
296:	learn 0.6619959348	total: 4m 32s	remaining: 2m 20s
297:	learn 0.6620120118	total: 4m 32s	remaining: 2m 19s
298:	learn 0.6620833522	total: 4m 33s	remaining: 2m 18s
299:	learn 0.662182579	total: 4m 34s	remaining: 2m 17s
300:	learn 0.6622068822	total: 4m 35s	remaining: 2m 16s
301:	learn 0.6622600646	total: 4m 36s	remaining: 2m 15s
302:	learn 0.6623802145	total: 4m 36s	remaining: 2m 14s
303:	learn 0.6624062182	total: 4m 37s	remaining: 2m 13s
304:	learn 0.6624735309	total: 4m 38s	remaining: 2m 12s
305:	learn 0.6624917338	total: 4m 39s	remaining: 2m 11s
306:	learn 0.6625476675	total: 4m 39s	remaining: 2m 10s
307:	learn 0.6626292457	total: 4m 40s	remaining: 2m 9s
308:	learn 0.6626864009	total: 4m 41s	remaining: 2m 8s
309:	learn 0.662878953	total: 4m 41s	remaining: 2m 

441:	learn 0.6715042359	total: 6m 45s	remaining: 7.34s
442:	learn 0.6715085518	total: 6m 46s	remaining: 6.42s
443:	learn 0.6715488667	total: 6m 46s	remaining: 5.5s
444:	learn 0.6715853464	total: 6m 47s	remaining: 4.58s
445:	learn 0.6716323689	total: 6m 48s	remaining: 3.66s
446:	learn 0.6716823602	total: 6m 49s	remaining: 2.75s
447:	learn 0.6717218128	total: 6m 50s	remaining: 1.83s
448:	learn 0.6717684577	total: 6m 51s	remaining: 915ms
449:	learn 0.6718109054	total: 6m 51s	remaining: 0us
Borders for float features generated
0:	learn 0.5761797828	total: 2.57s	remaining: 19m 13s
1:	learn 0.5956832908	total: 4.37s	remaining: 16m 19s
2:	learn 0.5999237845	total: 5.02s	remaining: 12m 28s
3:	learn 0.6010781133	total: 5.72s	remaining: 10m 38s
4:	learn 0.6059915704	total: 6.46s	remaining: 9m 35s
5:	learn 0.6088876362	total: 7.17s	remaining: 8m 51s
6:	learn 0.6129046177	total: 7.96s	remaining: 8m 24s
7:	learn 0.6171366659	total: 9.34s	remaining: 8m 36s
8:	learn 0.6209919284	total: 10s	remaining:

142:	learn 0.6492966	total: 2m 17s	remaining: 4m 55s
143:	learn 0.6497389712	total: 2m 18s	remaining: 4m 54s
144:	learn 0.6498330276	total: 2m 19s	remaining: 4m 52s
145:	learn 0.6498813242	total: 2m 19s	remaining: 4m 51s
146:	learn 0.6499359915	total: 2m 20s	remaining: 4m 50s
147:	learn 0.649971393	total: 2m 21s	remaining: 4m 49s
148:	learn 0.6500928833	total: 2m 22s	remaining: 4m 48s
149:	learn 0.6501897945	total: 2m 23s	remaining: 4m 47s
150:	learn 0.6503453984	total: 2m 24s	remaining: 4m 45s
151:	learn 0.6504243113	total: 2m 25s	remaining: 4m 44s
152:	learn 0.6505406206	total: 2m 26s	remaining: 4m 45s
153:	learn 0.6506631841	total: 2m 27s	remaining: 4m 43s
154:	learn 0.6507763363	total: 2m 28s	remaining: 4m 42s
155:	learn 0.6510000296	total: 2m 29s	remaining: 4m 41s
156:	learn 0.651080015	total: 2m 30s	remaining: 4m 40s
157:	learn 0.6511414977	total: 2m 31s	remaining: 4m 39s
158:	learn 0.6512539258	total: 2m 32s	remaining: 4m 38s
159:	learn 0.6513906196	total: 2m 32s	remaining: 4m 3

290:	learn 0.6623621557	total: 4m 31s	remaining: 2m 28s
291:	learn 0.6624316139	total: 4m 31s	remaining: 2m 27s
292:	learn 0.6624768073	total: 4m 32s	remaining: 2m 26s
293:	learn 0.662562985	total: 4m 33s	remaining: 2m 25s
294:	learn 0.6626007418	total: 4m 34s	remaining: 2m 24s
295:	learn 0.6627184799	total: 4m 36s	remaining: 2m 23s
296:	learn 0.6628317203	total: 4m 36s	remaining: 2m 22s
297:	learn 0.6628516117	total: 4m 37s	remaining: 2m 21s
298:	learn 0.662918982	total: 4m 38s	remaining: 2m 20s
299:	learn 0.6629746108	total: 4m 39s	remaining: 2m 19s
300:	learn 0.6630268071	total: 4m 40s	remaining: 2m 18s
301:	learn 0.6631250151	total: 4m 41s	remaining: 2m 17s
302:	learn 0.663148318	total: 4m 42s	remaining: 2m 16s
303:	learn 0.6631701631	total: 4m 42s	remaining: 2m 15s
304:	learn 0.6632163002	total: 4m 43s	remaining: 2m 14s
305:	learn 0.6632226738	total: 4m 44s	remaining: 2m 13s
306:	learn 0.6632623215	total: 4m 45s	remaining: 2m 12s
307:	learn 0.6633218295	total: 4m 46s	remaining: 2m

439:	learn 0.672082484	total: 6m 55s	remaining: 9.44s
440:	learn 0.6721311294	total: 6m 56s	remaining: 8.49s
441:	learn 0.6721935741	total: 6m 56s	remaining: 7.54s
442:	learn 0.6722617747	total: 6m 57s	remaining: 6.6s
443:	learn 0.6723351475	total: 6m 58s	remaining: 5.65s
444:	learn 0.6724074442	total: 6m 58s	remaining: 4.71s
445:	learn 0.6724803401	total: 7m	remaining: 3.77s
446:	learn 0.6725049347	total: 7m 2s	remaining: 2.83s
447:	learn 0.6725573666	total: 7m 2s	remaining: 1.89s
448:	learn 0.6726688342	total: 7m 3s	remaining: 944ms
449:	learn 0.6727126071	total: 7m 4s	remaining: 0us


Score: 0.279

In [43]:
# Parse the feature names: every feature whose name ends with "cat" is treated as categorical, and its column index is collected.

def getCatFeatures(featureList):
    '''
    Return the positions of the categorical features.

    featureList is the list of feature names (df.columns.tolist());
    a feature counts as categorical when its name ends with 'cat'.
    '''
    return [position
            for position, name in enumerate(featureList)
            if name[-3:] == 'cat']

In [40]:
# Seed ensemble: refit the same configuration on the full training frame with
# five different random seeds (550 iterations each), keep the positive-class
# probability of every test row per seed and submit the row-wise mean.
seedCount = 5
trainFeatures = df.drop('target', axis=1)
proba = np.empty((testDf.shape[0], seedCount))

for seed in range(seedCount):
    model = CatBoostClassifier(
        iterations=550,
        depth=params['depth'],
        learning_rate=params['rate'],
        l2_leaf_reg=params['l2'],
        bagging_temperature=params['T'],
        eval_metric="AUC",
        thread_count=4,
        random_seed=seed,
        verbose=True,
    )
    model.fit(trainFeatures, df.target)
    proba[:, seed] = model.predict_proba(testPool)[:, 1]

submit(proba.mean(axis=1), 'submission13.csv')

Borders for float features generated
0:	learn 0.5000934936	total: 499ms	remaining: 4m 34s
1:	learn 0.5672959221	total: 1.27s	remaining: 5m 47s
2:	learn 0.584546325	total: 1.96s	remaining: 5m 57s
3:	learn 0.5940151299	total: 3.2s	remaining: 7m 17s
4:	learn 0.5971203595	total: 3.85s	remaining: 6m 59s
5:	learn 0.5999253437	total: 4.54s	remaining: 6m 52s
6:	learn 0.6065022303	total: 5.4s	remaining: 6m 59s
7:	learn 0.6056495869	total: 6.15s	remaining: 6m 56s
8:	learn 0.6069375993	total: 6.91s	remaining: 6m 55s
9:	learn 0.6095271382	total: 8.07s	remaining: 7m 16s
10:	learn 0.6102613597	total: 8.72s	remaining: 7m 7s
11:	learn 0.6124226506	total: 9.45s	remaining: 7m 3s
12:	learn 0.6155577105	total: 10.1s	remaining: 6m 56s
13:	learn 0.6181297131	total: 11.5s	remaining: 7m 21s
14:	learn 0.61826191	total: 12.2s	remaining: 7m 15s
15:	learn 0.6206948568	total: 12.9s	remaining: 7m 10s
16:	learn 0.6216294446	total: 13.7s	remaining: 7m 8s
17:	learn 0.6217101168	total: 14.4s	remaining: 7m 5s
18:	learn 

151:	learn 0.648751842	total: 2m 15s	remaining: 5m 56s
152:	learn 0.6488272353	total: 2m 16s	remaining: 5m 54s
153:	learn 0.6488827557	total: 2m 17s	remaining: 5m 53s
154:	learn 0.6489581806	total: 2m 18s	remaining: 5m 53s
155:	learn 0.6491606731	total: 2m 19s	remaining: 5m 52s
156:	learn 0.6493036862	total: 2m 20s	remaining: 5m 51s
157:	learn 0.6494229425	total: 2m 21s	remaining: 5m 49s
158:	learn 0.6495846083	total: 2m 21s	remaining: 5m 48s
159:	learn 0.6496682639	total: 2m 22s	remaining: 5m 47s
160:	learn 0.6497186627	total: 2m 23s	remaining: 5m 46s
161:	learn 0.6498475302	total: 2m 23s	remaining: 5m 44s
162:	learn 0.6499170963	total: 2m 24s	remaining: 5m 43s
163:	learn 0.6499319463	total: 2m 26s	remaining: 5m 44s
164:	learn 0.6500113033	total: 2m 27s	remaining: 5m 43s
165:	learn 0.6500970842	total: 2m 27s	remaining: 5m 42s
166:	learn 0.6502062172	total: 2m 28s	remaining: 5m 41s
167:	learn 0.6502467013	total: 2m 29s	remaining: 5m 40s
168:	learn 0.6503561722	total: 2m 30s	remaining: 

299:	learn 0.6616243297	total: 4m 41s	remaining: 3m 54s
300:	learn 0.6617248708	total: 4m 43s	remaining: 3m 54s
301:	learn 0.6617393932	total: 4m 45s	remaining: 3m 54s
302:	learn 0.6618200026	total: 4m 45s	remaining: 3m 53s
303:	learn 0.6618831566	total: 4m 46s	remaining: 3m 51s
304:	learn 0.6619073996	total: 4m 47s	remaining: 3m 50s
305:	learn 0.6619973847	total: 4m 49s	remaining: 3m 50s
306:	learn 0.6620851615	total: 4m 51s	remaining: 3m 50s
307:	learn 0.6621286883	total: 4m 52s	remaining: 3m 49s
308:	learn 0.6621784788	total: 4m 52s	remaining: 3m 48s
309:	learn 0.6622671898	total: 4m 54s	remaining: 3m 47s
310:	learn 0.662319393	total: 4m 55s	remaining: 3m 46s
311:	learn 0.662418818	total: 4m 55s	remaining: 3m 45s
312:	learn 0.6624875106	total: 4m 57s	remaining: 3m 45s
313:	learn 0.66254871	total: 4m 58s	remaining: 3m 44s
314:	learn 0.6627021706	total: 4m 59s	remaining: 3m 43s
315:	learn 0.6627965901	total: 5m 1s	remaining: 3m 43s
316:	learn 0.6628368303	total: 5m 2s	remaining: 3m 42

447:	learn 0.6710030935	total: 7m 10s	remaining: 1m 37s
448:	learn 0.6710237151	total: 7m 11s	remaining: 1m 37s
449:	learn 0.6711100189	total: 7m 13s	remaining: 1m 36s
450:	learn 0.6711434809	total: 7m 14s	remaining: 1m 35s
451:	learn 0.671234552	total: 7m 15s	remaining: 1m 34s
452:	learn 0.6713008983	total: 7m 16s	remaining: 1m 33s
453:	learn 0.6713328707	total: 7m 17s	remaining: 1m 32s
454:	learn 0.671371758	total: 7m 17s	remaining: 1m 31s
455:	learn 0.6714363056	total: 7m 19s	remaining: 1m 30s
456:	learn 0.6715165581	total: 7m 20s	remaining: 1m 29s
457:	learn 0.6715367936	total: 7m 20s	remaining: 1m 28s
458:	learn 0.6715952602	total: 7m 21s	remaining: 1m 27s
459:	learn 0.6716474586	total: 7m 22s	remaining: 1m 26s
460:	learn 0.6716937021	total: 7m 23s	remaining: 1m 25s
461:	learn 0.6717530271	total: 7m 24s	remaining: 1m 24s
462:	learn 0.671810012	total: 7m 24s	remaining: 1m 23s
463:	learn 0.6718435003	total: 7m 25s	remaining: 1m 22s
464:	learn 0.6718772919	total: 7m 26s	remaining: 1m

47:	learn 0.632763899	total: 42.7s	remaining: 7m 26s
48:	learn 0.6328871381	total: 43.5s	remaining: 7m 24s
49:	learn 0.633284006	total: 44.2s	remaining: 7m 22s
50:	learn 0.6337813806	total: 45.4s	remaining: 7m 24s
51:	learn 0.6345411397	total: 46.2s	remaining: 7m 22s
52:	learn 0.634400131	total: 46.9s	remaining: 7m 19s
53:	learn 0.6349320469	total: 47.6s	remaining: 7m 17s
54:	learn 0.6354301896	total: 48.3s	remaining: 7m 14s
55:	learn 0.6354487173	total: 49.1s	remaining: 7m 12s
56:	learn 0.6356839314	total: 49.8s	remaining: 7m 10s
57:	learn 0.635812651	total: 50.9s	remaining: 7m 12s
58:	learn 0.636014589	total: 51.7s	remaining: 7m 10s
59:	learn 0.636047151	total: 52.4s	remaining: 7m 8s
60:	learn 0.6361479812	total: 53.2s	remaining: 7m 6s
61:	learn 0.6363588476	total: 54.1s	remaining: 7m 6s
62:	learn 0.6365020158	total: 55.6s	remaining: 7m 9s
63:	learn 0.6368576328	total: 57.3s	remaining: 7m 14s
64:	learn 0.6369321049	total: 58.4s	remaining: 7m 15s
65:	learn 0.6370780323	total: 59.2s	re

197:	learn 0.6538193817	total: 3m 6s	remaining: 5m 30s
198:	learn 0.6539067848	total: 3m 8s	remaining: 5m 31s
199:	learn 0.6539999219	total: 3m 9s	remaining: 5m 31s
200:	learn 0.6542961062	total: 3m 9s	remaining: 5m 29s
201:	learn 0.6544276258	total: 3m 11s	remaining: 5m 29s
202:	learn 0.6544596075	total: 3m 12s	remaining: 5m 28s
203:	learn 0.6545809689	total: 3m 13s	remaining: 5m 27s
204:	learn 0.6546890632	total: 3m 13s	remaining: 5m 26s
205:	learn 0.6547530656	total: 3m 14s	remaining: 5m 24s
206:	learn 0.6547889568	total: 3m 15s	remaining: 5m 23s
207:	learn 0.6548662078	total: 3m 16s	remaining: 5m 22s
208:	learn 0.6549151417	total: 3m 16s	remaining: 5m 21s
209:	learn 0.6549740132	total: 3m 17s	remaining: 5m 20s
210:	learn 0.6550779647	total: 3m 18s	remaining: 5m 18s
211:	learn 0.6552259174	total: 3m 19s	remaining: 5m 17s
212:	learn 0.6553439137	total: 3m 19s	remaining: 5m 16s
213:	learn 0.6553826958	total: 3m 20s	remaining: 5m 14s
214:	learn 0.6555011212	total: 3m 21s	remaining: 5m 

345:	learn 0.6656369532	total: 5m 30s	remaining: 3m 14s
346:	learn 0.6656697211	total: 5m 31s	remaining: 3m 13s
347:	learn 0.665687921	total: 5m 32s	remaining: 3m 12s
348:	learn 0.6657344886	total: 5m 33s	remaining: 3m 11s
349:	learn 0.6658471894	total: 5m 33s	remaining: 3m 10s
350:	learn 0.6659047899	total: 5m 35s	remaining: 3m 10s
351:	learn 0.6659280561	total: 5m 36s	remaining: 3m 9s
352:	learn 0.6659896641	total: 5m 37s	remaining: 3m 8s
353:	learn 0.6660601176	total: 5m 38s	remaining: 3m 7s
354:	learn 0.6661292681	total: 5m 39s	remaining: 3m 6s
355:	learn 0.6661548839	total: 5m 39s	remaining: 3m 5s
356:	learn 0.6662095593	total: 5m 40s	remaining: 3m 4s
357:	learn 0.6662503333	total: 5m 41s	remaining: 3m 3s
358:	learn 0.666354533	total: 5m 42s	remaining: 3m 2s
359:	learn 0.6663661518	total: 5m 43s	remaining: 3m 1s
360:	learn 0.6664482474	total: 5m 43s	remaining: 3m
361:	learn 0.666544322	total: 5m 44s	remaining: 2m 58s
362:	learn 0.6665871396	total: 5m 45s	remaining: 2m 57s
363:	lea

493:	learn 0.6746219252	total: 7m 45s	remaining: 52.7s
494:	learn 0.6746670445	total: 7m 46s	remaining: 51.8s
495:	learn 0.6746946094	total: 7m 47s	remaining: 50.8s
496:	learn 0.6747349438	total: 7m 47s	remaining: 49.9s
497:	learn 0.6748212242	total: 7m 48s	remaining: 48.9s
498:	learn 0.6748902631	total: 7m 50s	remaining: 48.1s
499:	learn 0.6749454628	total: 7m 51s	remaining: 47.2s
500:	learn 0.6749705366	total: 7m 52s	remaining: 46.2s
501:	learn 0.6750694772	total: 7m 53s	remaining: 45.2s
502:	learn 0.6751460818	total: 7m 53s	remaining: 44.3s
503:	learn 0.675244043	total: 7m 54s	remaining: 43.3s
504:	learn 0.6753078377	total: 7m 55s	remaining: 42.4s
505:	learn 0.6753488707	total: 7m 56s	remaining: 41.4s
506:	learn 0.6754182454	total: 7m 56s	remaining: 40.4s
507:	learn 0.6754614837	total: 7m 58s	remaining: 39.6s
508:	learn 0.6755274033	total: 7m 59s	remaining: 38.6s
509:	learn 0.6755402854	total: 8m	remaining: 37.7s
510:	learn 0.6756000452	total: 8m 2s	remaining: 36.8s
511:	learn 0.675

95:	learn 0.6426462423	total: 1m 28s	remaining: 6m 57s
96:	learn 0.6427870708	total: 1m 29s	remaining: 6m 57s
97:	learn 0.642829097	total: 1m 30s	remaining: 6m 55s
98:	learn 0.6429347392	total: 1m 31s	remaining: 6m 54s
99:	learn 0.6431285353	total: 1m 31s	remaining: 6m 53s
100:	learn 0.6433598134	total: 1m 32s	remaining: 6m 51s
101:	learn 0.643378735	total: 1m 33s	remaining: 6m 52s
102:	learn 0.6434375744	total: 1m 35s	remaining: 6m 55s
103:	learn 0.6435593633	total: 1m 36s	remaining: 6m 53s
104:	learn 0.643731375	total: 1m 37s	remaining: 6m 51s
105:	learn 0.6439048052	total: 1m 37s	remaining: 6m 49s
106:	learn 0.6439673243	total: 1m 38s	remaining: 6m 48s
107:	learn 0.6441490497	total: 1m 40s	remaining: 6m 49s
108:	learn 0.6442733643	total: 1m 41s	remaining: 6m 52s
109:	learn 0.6445545739	total: 1m 42s	remaining: 6m 50s
110:	learn 0.6446248443	total: 1m 43s	remaining: 6m 48s
111:	learn 0.6447113366	total: 1m 44s	remaining: 6m 47s
112:	learn 0.6448129978	total: 1m 44s	remaining: 6m 45s


243:	learn 0.6581614655	total: 3m 48s	remaining: 4m 47s
244:	learn 0.6582838218	total: 3m 49s	remaining: 4m 45s
245:	learn 0.658342705	total: 3m 50s	remaining: 4m 44s
246:	learn 0.6583942755	total: 3m 51s	remaining: 4m 43s
247:	learn 0.6585943675	total: 3m 52s	remaining: 4m 42s
248:	learn 0.6586590339	total: 3m 52s	remaining: 4m 41s
249:	learn 0.658725884	total: 3m 53s	remaining: 4m 40s
250:	learn 0.6588020248	total: 3m 54s	remaining: 4m 39s
251:	learn 0.6588819824	total: 3m 55s	remaining: 4m 38s
252:	learn 0.658963716	total: 3m 55s	remaining: 4m 36s
253:	learn 0.6591241676	total: 3m 56s	remaining: 4m 35s
254:	learn 0.6592247316	total: 3m 57s	remaining: 4m 34s
255:	learn 0.6593642174	total: 3m 57s	remaining: 4m 33s
256:	learn 0.6594305809	total: 3m 58s	remaining: 4m 31s
257:	learn 0.6594984867	total: 3m 59s	remaining: 4m 30s
258:	learn 0.6596166603	total: 3m 59s	remaining: 4m 29s
259:	learn 0.6597406738	total: 4m 1s	remaining: 4m 28s
260:	learn 0.6597860138	total: 4m 1s	remaining: 4m 2

391:	learn 0.6690702914	total: 6m 8s	remaining: 2m 28s
392:	learn 0.6691071865	total: 6m 9s	remaining: 2m 27s
393:	learn 0.6691510856	total: 6m 10s	remaining: 2m 26s
394:	learn 0.6692157231	total: 6m 12s	remaining: 2m 26s
395:	learn 0.6692887792	total: 6m 14s	remaining: 2m 25s
396:	learn 0.6693249707	total: 6m 15s	remaining: 2m 24s
397:	learn 0.6693826439	total: 6m 16s	remaining: 2m 23s
398:	learn 0.6694382963	total: 6m 16s	remaining: 2m 22s
399:	learn 0.6694911339	total: 6m 18s	remaining: 2m 21s
400:	learn 0.6695847201	total: 6m 19s	remaining: 2m 20s
401:	learn 0.6696422082	total: 6m 19s	remaining: 2m 19s
402:	learn 0.6696904632	total: 6m 20s	remaining: 2m 18s
403:	learn 0.6697417926	total: 6m 22s	remaining: 2m 18s
404:	learn 0.6698704105	total: 6m 23s	remaining: 2m 17s
405:	learn 0.6699262523	total: 6m 24s	remaining: 2m 16s
406:	learn 0.6699490921	total: 6m 26s	remaining: 2m 15s
407:	learn 0.6699667017	total: 6m 27s	remaining: 2m 14s
408:	learn 0.6700427715	total: 6m 29s	remaining: 2

540:	learn 0.6773098425	total: 8m 33s	remaining: 8.54s
541:	learn 0.6773443256	total: 8m 34s	remaining: 7.59s
542:	learn 0.677386957	total: 8m 34s	remaining: 6.64s
543:	learn 0.6774147296	total: 8m 35s	remaining: 5.69s
544:	learn 0.6775014029	total: 8m 36s	remaining: 4.74s
545:	learn 0.6775294458	total: 8m 37s	remaining: 3.79s
546:	learn 0.6775583096	total: 8m 38s	remaining: 2.84s
547:	learn 0.6776103661	total: 8m 39s	remaining: 1.9s
548:	learn 0.677679382	total: 8m 40s	remaining: 947ms
549:	learn 0.6777049538	total: 8m 40s	remaining: 0us
Borders for float features generated
0:	learn 0.5589580314	total: 1.62s	remaining: 14m 50s
1:	learn 0.5722770417	total: 2.33s	remaining: 10m 37s
2:	learn 0.5906500834	total: 3.01s	remaining: 9m 8s
3:	learn 0.5970101557	total: 5.24s	remaining: 11m 55s
4:	learn 0.5960474142	total: 7.87s	remaining: 14m 17s
5:	learn 0.5987490494	total: 8.66s	remaining: 13m 4s
6:	learn 0.6013351894	total: 9.65s	remaining: 12m 28s
7:	learn 0.6020734272	total: 11.6s	remainin

140:	learn 0.6473963708	total: 2m 19s	remaining: 6m 44s
141:	learn 0.6476413141	total: 2m 20s	remaining: 6m 42s
142:	learn 0.6477506946	total: 2m 21s	remaining: 6m 43s
143:	learn 0.6478214635	total: 2m 22s	remaining: 6m 42s
144:	learn 0.6478844519	total: 2m 23s	remaining: 6m 40s
145:	learn 0.6480066736	total: 2m 24s	remaining: 6m 38s
146:	learn 0.6480017512	total: 2m 24s	remaining: 6m 36s
147:	learn 0.6481350597	total: 2m 25s	remaining: 6m 34s
148:	learn 0.6483125876	total: 2m 26s	remaining: 6m 33s
149:	learn 0.6483734376	total: 2m 27s	remaining: 6m 33s
150:	learn 0.6484836805	total: 2m 28s	remaining: 6m 32s
151:	learn 0.6485341658	total: 2m 29s	remaining: 6m 30s
152:	learn 0.6486015566	total: 2m 30s	remaining: 6m 29s
153:	learn 0.6487035652	total: 2m 30s	remaining: 6m 28s
154:	learn 0.6488050525	total: 2m 32s	remaining: 6m 28s
155:	learn 0.6489190405	total: 2m 33s	remaining: 6m 27s
156:	learn 0.6490193178	total: 2m 34s	remaining: 6m 25s
157:	learn 0.6490502183	total: 2m 34s	remaining:

288:	learn 0.6615031622	total: 4m 34s	remaining: 4m 8s
289:	learn 0.6615714717	total: 4m 35s	remaining: 4m 6s
290:	learn 0.6616687119	total: 4m 37s	remaining: 4m 7s
291:	learn 0.6617202745	total: 4m 38s	remaining: 4m 5s
292:	learn 0.6617600613	total: 4m 39s	remaining: 4m 4s
293:	learn 0.6617842724	total: 4m 39s	remaining: 4m 3s
294:	learn 0.6618789083	total: 4m 40s	remaining: 4m 2s
295:	learn 0.6619311222	total: 4m 41s	remaining: 4m 1s
296:	learn 0.6619959348	total: 4m 42s	remaining: 4m
297:	learn 0.6620120118	total: 4m 43s	remaining: 3m 59s
298:	learn 0.6620833522	total: 4m 44s	remaining: 3m 58s
299:	learn 0.662182579	total: 4m 45s	remaining: 3m 58s
300:	learn 0.6622068822	total: 4m 46s	remaining: 3m 56s
301:	learn 0.6622600646	total: 4m 48s	remaining: 3m 56s
302:	learn 0.6623802145	total: 4m 48s	remaining: 3m 55s
303:	learn 0.6624062182	total: 4m 49s	remaining: 3m 54s
304:	learn 0.6624735309	total: 4m 50s	remaining: 3m 53s
305:	learn 0.6624917338	total: 4m 50s	remaining: 3m 51s
306:	

436:	learn 0.6711992156	total: 6m 48s	remaining: 1m 45s
437:	learn 0.671219803	total: 6m 49s	remaining: 1m 44s
438:	learn 0.6712727832	total: 6m 49s	remaining: 1m 43s
439:	learn 0.671363219	total: 6m 50s	remaining: 1m 42s
440:	learn 0.6714356952	total: 6m 51s	remaining: 1m 41s
441:	learn 0.6715042359	total: 6m 52s	remaining: 1m 40s
442:	learn 0.6715085518	total: 6m 54s	remaining: 1m 40s
443:	learn 0.6715488667	total: 6m 54s	remaining: 1m 39s
444:	learn 0.6715853464	total: 6m 55s	remaining: 1m 38s
445:	learn 0.6716323689	total: 6m 56s	remaining: 1m 37s
446:	learn 0.6716823602	total: 6m 57s	remaining: 1m 36s
447:	learn 0.6717218128	total: 6m 57s	remaining: 1m 35s
448:	learn 0.6717684577	total: 6m 59s	remaining: 1m 34s
449:	learn 0.6718109054	total: 6m 59s	remaining: 1m 33s
450:	learn 0.6718461725	total: 7m	remaining: 1m 32s
451:	learn 0.6718674475	total: 7m 1s	remaining: 1m 31s
452:	learn 0.671883096	total: 7m 1s	remaining: 1m 30s
453:	learn 0.671916027	total: 7m 2s	remaining: 1m 29s
454

36:	learn 0.6315572886	total: 34.4s	remaining: 7m 57s
37:	learn 0.6316631943	total: 36.2s	remaining: 8m 7s
38:	learn 0.6320168612	total: 37.9s	remaining: 8m 16s
39:	learn 0.6321526101	total: 38.6s	remaining: 8m 12s
40:	learn 0.6325636717	total: 39.3s	remaining: 8m 8s
41:	learn 0.6327617193	total: 40.1s	remaining: 8m 5s
42:	learn 0.6329237705	total: 40.8s	remaining: 8m 1s
43:	learn 0.6333234228	total: 41.6s	remaining: 7m 57s
44:	learn 0.6336231575	total: 42.3s	remaining: 7m 55s
45:	learn 0.6337576683	total: 43.4s	remaining: 7m 55s
46:	learn 0.6339525106	total: 44.1s	remaining: 7m 51s
47:	learn 0.6342449805	total: 44.8s	remaining: 7m 48s
48:	learn 0.6342909879	total: 45.5s	remaining: 7m 45s
49:	learn 0.634361989	total: 47.3s	remaining: 7m 52s
50:	learn 0.634329198	total: 48s	remaining: 7m 50s
51:	learn 0.6347124031	total: 48.8s	remaining: 7m 46s
52:	learn 0.6350362348	total: 49.5s	remaining: 7m 44s
53:	learn 0.6351842447	total: 50.2s	remaining: 7m 41s
54:	learn 0.6354034041	total: 51s	re

333:	learn 0.6651147305	total: 5m 10s	remaining: 3m 20s
334:	learn 0.6651603554	total: 5m 11s	remaining: 3m 19s
335:	learn 0.6652622262	total: 5m 11s	remaining: 3m 18s
336:	learn 0.66527217	total: 5m 12s	remaining: 3m 17s
337:	learn 0.665389557	total: 5m 13s	remaining: 3m 16s
338:	learn 0.6654371568	total: 5m 14s	remaining: 3m 15s
339:	learn 0.6654999174	total: 5m 15s	remaining: 3m 14s
340:	learn 0.6655250288	total: 5m 16s	remaining: 3m 13s
341:	learn 0.6656026102	total: 5m 16s	remaining: 3m 12s
342:	learn 0.6656696471	total: 5m 17s	remaining: 3m 11s
343:	learn 0.6657419066	total: 5m 18s	remaining: 3m 10s
344:	learn 0.665796701	total: 5m 18s	remaining: 3m 9s
345:	learn 0.6658564768	total: 5m 19s	remaining: 3m 8s
346:	learn 0.6659574142	total: 5m 20s	remaining: 3m 7s
347:	learn 0.6660061053	total: 5m 21s	remaining: 3m 6s
348:	learn 0.6661074678	total: 5m 21s	remaining: 3m 5s
349:	learn 0.6661342971	total: 5m 23s	remaining: 3m 4s
350:	learn 0.6661688606	total: 5m 24s	remaining: 3m 3s
351

481:	learn 0.6744259443	total: 7m 17s	remaining: 1m 1s
482:	learn 0.6744742615	total: 7m 18s	remaining: 1m
483:	learn 0.674483127	total: 7m 20s	remaining: 1m
484:	learn 0.6745661324	total: 7m 21s	remaining: 59.2s
485:	learn 0.6745865718	total: 7m 22s	remaining: 58.2s
486:	learn 0.6746184964	total: 7m 22s	remaining: 57.3s
487:	learn 0.6746699072	total: 7m 23s	remaining: 56.4s
488:	learn 0.6747659178	total: 7m 24s	remaining: 55.4s
489:	learn 0.6748861542	total: 7m 24s	remaining: 54.5s
490:	learn 0.6749216058	total: 7m 25s	remaining: 53.6s
491:	learn 0.6749957321	total: 7m 26s	remaining: 52.6s
492:	learn 0.675114924	total: 7m 27s	remaining: 51.7s
493:	learn 0.6751363951	total: 7m 27s	remaining: 50.8s
494:	learn 0.6751660008	total: 7m 28s	remaining: 49.9s
495:	learn 0.6752300368	total: 7m 29s	remaining: 48.9s
496:	learn 0.6752525142	total: 7m 30s	remaining: 48s
497:	learn 0.6753087215	total: 7m 30s	remaining: 47.1s
498:	learn 0.6753538069	total: 7m 31s	remaining: 46.2s
499:	learn 0.6753747

Скор 0.279

In [50]:
# Seed-averaged submission: fit one CatBoost model per random seed on the full
# training frame, predict the test frame with each, and submit the mean of the
# positive-class probabilities.
nSeeds = 5

# The pools do not depend on the seed, so they are built once up front instead
# of re-dropping 'target' and re-wrapping the frames on every iteration.
# feature_names has to describe the matrix actually handed to Pool: it is taken
# from the frame with 'target' removed (df.columns carries one extra name,
# 'target', and therefore does not match the columns of the data).
fullTrainFeatures = df.drop('target', axis=1)
fullTrainColumns = fullTrainFeatures.columns.tolist()
fullTrainPool = Pool(fullTrainFeatures, df.target,
                     feature_names=fullTrainColumns,
                     cat_features=getCatFeatures(fullTrainColumns))

submitTestColumns = testDf.columns.tolist()
submitTestPool = Pool(testDf,
                      feature_names=submitTestColumns,
                      cat_features=getCatFeatures(submitTestColumns))

# One column of test probabilities per seed; every column is filled below.
proba = np.zeros([testDf.shape[0], nSeeds])
for seed in range(nSeeds):
    # Single-argument print(...) emits the same text under Python 2 and 3.
    print('Iteration # %d' % seed)
    model = CatBoostClassifier(verbose=False, iterations=700, thread_count=4, eval_metric="AUC",
                               depth=params['depth'], learning_rate=params['rate'],
                               l2_leaf_reg=params['l2'], bagging_temperature=params['T'],
                               random_seed=seed)
    print('Learn')
    model.fit(fullTrainPool)
    print('Trees number is  %s' % model.tree_count_)
    # Column 1 of predict_proba is taken as the positive-class probability.
    proba[:, seed] = model.predict_proba(submitTestPool)[:, 1]

# Average across seeds and write the submission file.
submit(proba.mean(axis=1), 'submission15.csv')

Iteration # 0
Learn
Trees number is  700
Iteration # 1
Learn
Trees number is  700
Iteration # 2
Learn
Trees number is  700
Iteration # 3
Learn
Trees number is  700
Iteration # 4
Learn
Trees number is  700


Скор 0.278