# Libraries

In [1]:
import json
import pandas as pd

from nltk.tokenize import RegexpTokenizer

import gc
from thefuzz import fuzz
import numpy as np
from tqdm.auto import tqdm

from catboost import CatBoostClassifier, Pool

import warnings

In [2]:
# Notebook-wide settings.
# Render up to 256 columns when a DataFrame is displayed.
pd.set_option('display.max_columns', 256)
# Suppress every warning category for the rest of the session.
warnings.simplefilter('ignore')

# Data

In [3]:
# Labelled product pairs; the label column is stored as a plain integer.
train_pairs = pd.read_parquet('./datasets/train_pairs_w_target.parquet')
train_pairs = train_pairs.assign(target=train_pairs['target'].astype(int))
# Mirrored copy: same rows and column order, with the two variant ids exchanged.
rtrain_pairs = train_pairs.assign(
    variantid1=train_pairs['variantid2'],
    variantid2=train_pairs['variantid1'],
)
train_pairs

Unnamed: 0,target,variantid1,variantid2
0,0,51197862,51198054
1,1,53062686,536165289
2,1,53602615,587809782
3,1,53888651,89598677
4,0,56930698,551526166
...,...,...,...
306535,0,817327230,822083612
306536,0,817560551,818069912
306537,0,817854719,817857267
306538,0,820036017,820037019


In [4]:
# Unlabelled product pairs to be scored.
test_pairs = pd.read_parquet('./datasets/test_pairs_wo_target.parquet')
# Mirrored copy: same rows and column order, with the two variant ids exchanged.
rtest_pairs = test_pairs.assign(
    variantid1=test_pairs['variantid2'],
    variantid2=test_pairs['variantid1'],
)
test_pairs

Unnamed: 0,variantid1,variantid2
0,52076340,290590137
1,64525522,204128919
2,77243372,479860557
3,86065820,540678372
4,91566575,258840506
...,...,...
18079,666998614,667074522
18080,670036240,670048449
18081,670284509,684323809
18082,692172005,704805270


In [6]:
# Per-product attributes for the training split, indexed by variant id.
train_data = pd.read_parquet('./datasets/train_data.parquet').set_index('variantid')

# Decode the JSON-encoded columns; a missing attribute mapping becomes an empty dict.
train_data['characteristic_attributes_mapping'] = (
    train_data['characteristic_attributes_mapping'].fillna('{}').apply(json.loads)
)
train_data['categories'] = train_data['categories'].apply(json.loads)

# Keep only the first element of each main-picture embedding entry.
train_data['main_pic_embeddings_resnet_v1'] = (
    train_data['main_pic_embeddings_resnet_v1'].apply(lambda entry: entry[0])
)

# Append the extra embedding columns side by side (pd.concat aligns rows on the index).
train_data = pd.concat(
    [
        train_data,
        pd.read_parquet('./datasets/name_labse_embs_train.parquet').set_index('variantid'),
    ],
    axis=1,
)
# NOTE(review): unpickling can execute arbitrary code - only load files you trust.
# Presumably this pickle is indexed by variantid as well; verify.
train_data = pd.concat(
    [train_data, pd.read_pickle('./datasets/neuro_embeds_train.pickle')],
    axis=1,
)
train_data

Unnamed: 0_level_0,name,categories,color_parsed,pic_embeddings_resnet_v1,main_pic_embeddings_resnet_v1,name_bert_64,characteristic_attributes_mapping,name_labse_768,neuro_768
variantid,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1
51195767,"Удлинитель Партнер-Электро ПВС 2х0,75 ГОСТ,6A,...","{'1': 'EPG', '2': 'Электроника', '3': 'Сетевые...",[оранжевый],,"[0.04603629, 0.18839523, -0.09973055, -0.66368...","[-0.47045058, 0.67237014, 0.48984158, -0.54485...","{'Номинальный ток, А': ['10'], 'Цвет товара': ...","[-0.033874325, 0.03722446, 0.0029757991, 0.068...","[0.05308385, -0.035102457, 0.035711396, -0.003..."
53565809,Магнитный кабель USB 2.0 A (m) - USB Type-C (m...,"{'1': 'EPG', '2': 'Электроника', '3': 'Кабели ...",[красный],"[[0.26863545, -0.3130674, 0.29023397, 0.073978...","[1.1471839, -0.665361, 0.7745614, 0.26716197, ...","[-0.6575592, 0.6522429, 0.5426037, -0.54347897...",{'Конструктивные особенности': ['Магнитная кон...,"[0.015568526, -0.03899538, 0.064447366, 0.0383...","[0.019788187, 0.0360369, -0.05522197, 0.010044..."
56763357,"Набор микропрепаратов Konus 25: ""Клетки и ткан...","{'1': 'EPG', '2': 'Электроника', '3': 'Оптичес...",,"[[0.66954195, 1.0643557, 0.78324044, -0.338267...","[-0.90570974, 1.0296293, 1.0769907, 0.27746, -...","[-0.7384308, 0.70784587, 0.3012653, -0.3583719...","{'Тип аксессуара': ['Набор микропрепаратов'], ...","[-0.033072222, -0.04237577, 0.020771954, 0.065...",
56961772,"Мобильный телефон BQ 1848 Step, черный","{'1': 'EPG', '2': 'Электроника', '3': 'Смартфо...",[черный],"[[0.6580482, -0.35763323, -0.16939065, -0.4249...","[0.13133773, -0.5577079, 0.32498044, 0.1917174...","[-0.44812852, 0.5283565, 0.28981736, -0.506841...","{'Тип карты памяти': ['microSD'], 'Число SIM-к...","[0.014727573, -0.025661988, 0.023943473, -0.00...",
61054740,"Штатив трипод Tripod 330A для фотоаппаратов, в...","{'1': 'EPG', '2': 'Электроника', '3': 'Штативы...",[черный],"[[-0.10406649, 0.080646515, -0.28668788, 0.739...","[0.21696381, 0.10989461, -0.08012986, 0.691861...","[-0.72692573, 0.75206333, 0.37740713, -0.52502...","{'Материал': ['Металл'], 'Количество секций, ш...","[0.043145332, -0.052424084, 0.017260496, 0.045...","[-0.0063637993, 0.040778656, -0.018901959, 0.0..."
...,...,...,...,...,...,...,...,...,...
820128810,"Комплект 2 шт, Чернила Cactus CS-EPT6733B пурп...","{'1': 'EPG', '2': 'Электроника', '3': 'Расходн...",[пурпурный],,"[-1.4492652, -0.80129164, -0.12344764, 0.71945...","[-0.8253241, 0.6785133, 0.53978086, -0.4888316...","{'Тип': ['Чернила для принтера'], 'Бренд печат...","[-0.003678058, -0.031628493, 0.0065589263, 0.0...",
821135769,"Защитное стекло закаленное Xiaomi Redmi 7, Y3 ...","{'1': 'EPG', '2': 'Электроника', '3': 'Защитны...",[черный],"[[0.09564891, 0.27437285, -0.19054827, -0.7992...","[0.012127608, -0.8534423, 0.5415518, -0.449125...","[-0.7413257, 0.46105132, 0.5639801, -0.5462132...","{'Вид стекла': ['3D'], 'Тип': ['Защитное стекл...","[-0.06858361, 0.027011767, -0.016400583, -0.02...","[0.070231415, -0.012321442, -0.06056241, -0.02..."
822095690,Системный блок ЮКОМС 9400-268 (AMD A6-9400 (3....,"{'1': 'EPG', '2': 'Электроника', '3': 'Компьют...",[черный],,"[0.4248176, -0.15944786, -0.22844064, 0.427686...","[-0.49261805, 0.56726897, 0.7037877, -0.697246...","{'Общий объем HDD, ГБ': ['10000'], 'Видеокарта...","[-0.04474233, -0.034224413, 0.026076552, 0.026...",
822101044,Системный блок ЮКОМС 9400-9 (AMD A6-9400 (3.4 ...,"{'1': 'EPG', '2': 'Электроника', '3': 'Компьют...",[черный],,"[0.4248176, -0.15944786, -0.22844064, 0.427686...","[-0.44051006, 0.54029673, 0.63768685, -0.68040...","{'Общий объем HDD, ГБ': ['8000'], 'Видеокарта'...","[-0.05541598, 0.000863006, 0.01093415, 0.02208...",


In [7]:
# Per-product attributes for the test split, indexed by variant id.
test_data = pd.read_parquet('./datasets/test_data.parquet').set_index('variantid')

# Decode the JSON-encoded columns; a missing attribute mapping becomes an empty dict.
test_data['characteristic_attributes_mapping'] = (
    test_data['characteristic_attributes_mapping'].fillna('{}').apply(json.loads)
)
test_data['categories'] = test_data['categories'].apply(json.loads)

# Keep only the first element of each main-picture embedding entry.
test_data['main_pic_embeddings_resnet_v1'] = (
    test_data['main_pic_embeddings_resnet_v1'].apply(lambda entry: entry[0])
)

# Append the extra embedding columns side by side (pd.concat aligns rows on the index).
test_data = pd.concat(
    [
        test_data,
        pd.read_parquet('./datasets/name_labse_embs_test.parquet').set_index('variantid'),
    ],
    axis=1,
)
# NOTE(review): unpickling can execute arbitrary code - only load files you trust.
# Presumably this pickle is indexed by variantid as well; verify.
test_data = pd.concat(
    [test_data, pd.read_pickle('./datasets/neuro_embeds_test.pickle')],
    axis=1,
)
test_data

Unnamed: 0_level_0,name,categories,color_parsed,pic_embeddings_resnet_v1,main_pic_embeddings_resnet_v1,name_bert_64,characteristic_attributes_mapping,name_labse_768,neuro_768
variantid,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1
51201254,Колодка TDM Electric четырехместная без заземл...,"{'1': 'EPG', '2': 'Электроника', '3': 'Сетевые...",[белый],"[[0.34383398, -0.2962618, 0.07987049, -0.08257...","[0.38310742, -0.7876679, 0.5018278, 0.20900711...","[-0.5060825, 0.5773388, 0.59435517, -0.4958292...","{'Страна-изготовитель': ['Китай'], 'Бренд': ['...","[-0.0058242553, 0.0010011946, 0.015051351, 0.0...","[-0.037606854, 0.08384453, -0.04124399, 0.0028..."
77151532,Клавиатура черная с черной рамкой для 25-011879,"{'1': 'EPG', '2': 'Электроника', '3': 'Запчаст...",[черный],,"[0.50964713, 0.7958329, -1.4113188, 0.19993813...","[-0.43467724, 0.6614495, 0.48050267, -0.588880...","{'Страна-изготовитель': ['Китай'], 'Комплектац...","[0.0088402, -0.0050699823, 0.026550002, -0.015...","[-0.052735697, 0.00019977099, 0.015895747, -0...."
89664856,"15.6"" Игровой ноутбук Acer Predator Helios 300...","{'1': 'EPG', '2': 'Электроника', '3': 'Компьют...",[черный],"[[0.7804302, -0.245446, -0.67754817, -0.614691...","[0.9958085, -0.113175124, -0.7623152, -0.91648...","[-0.70010763, 0.48152006, 0.47597092, -0.51727...",{'Видеокарта': ['NVIDIA GeForce RTX 2070 (8 Гб...,"[-0.026623247, -0.018851712, 0.011397564, -0.0...","[-0.00044866692, -0.07461986, -0.017260032, -0..."
90701982,Портативная колонка Borofone BR7 Empyreal Spor...,"{'1': 'EPG', '2': 'Электроника', '3': 'Акустик...","[red, красный]","[[-0.24636984, -1.0719914, -0.49986655, 0.3423...","[-0.26596686, -1.143009, -0.5289628, 0.4285588...","[-0.73135185, -0.039796613, 0.38907066, -0.496...","{'Основной материал корпуса': ['Металл'], 'Мак...","[0.016539363, 0.03778109, 0.025718935, 0.08805...","[0.0173606, 0.039641324, -0.024564413, -0.0056..."
92484118,Аккумулятор для Meizu BA712 ( M6s ),"{'1': 'EPG', '2': 'Электроника', '3': 'Батарей...",,,"[0.42047608, 0.75828516, 0.5440093, -0.0068945...","[-0.600158, 0.13944691, 0.48706242, -0.5050975...","{'Рекомендовано для': ['Meizu'], 'Бренд': ['Me...","[-0.0024493372, 0.02346121, 0.068452105, 0.023...","[0.04657542, -0.027531484, -0.015035957, 0.059..."
...,...,...,...,...,...,...,...,...,...
702785891,Кабель USB - Lightning HOCO X21 PLUS (черно-бе...,"{'1': 'EPG', '2': 'Электроника', '3': 'Кабели ...",[черный],"[[1.1820095, -0.16312826, 1.4916217, 0.0288323...","[0.3297959, -0.16444838, 0.9350716, 0.34787956...","[-0.66597974, 0.7140731, 0.43572947, -0.445908...","{'Бренд': ['hoco'], 'Тип': ['Кабель'], 'Цвет т...","[-0.031527344, -0.06875799, 0.03187686, -0.004...","[0.015840497, 0.022141043, -0.03528703, -0.017..."
704096517,Блок питания для ноутбука Asus f5gl (19V 90W 4...,"{'1': 'EPG', '2': 'Электроника', '3': 'Зарядны...",[черный],"[[-0.013610864, -0.68512607, 0.77639246, -1.04...","[0.2785852, -0.16053033, 1.1653559, 1.0619084,...","[-0.7575411, 0.4196694, 0.46428213, -0.4916808...","{'Комплектация': ['Зарядное устройство, сетево...","[-0.023706086, -0.012301952, -0.014316322, -0....","[0.009541714, -0.029578354, -0.015135301, 0.03..."
705874953,Оперативная память HyperX FURY Black DDR4 2666...,"{'1': 'EPG', '2': 'Электроника', '3': 'Операти...",[black],"[[0.34073856, 0.65070343, 0.31146732, 1.261663...","[0.31382418, 0.60041714, 0.3067428, 1.1233345,...","[-0.60506856, 0.4477128, 0.62255704, -0.720129...","{'Тайминги': ['16-18-18-29'], 'Пропускная спос...","[-0.028754005, -0.025122717, 0.048854, -0.0297...","[-0.03909694, 0.040358614, 0.025154725, 0.0568..."
706965102,8 ТБ Внутренний жесткий диск Toshiba TOSHIBA N...,"{'1': 'EPG', '2': 'Электроника', '3': 'Жесткие...",,"[[-0.9360045, -0.43083164, -1.1651772, 1.23836...","[0.404035, -0.20071658, -0.44533533, 0.2038879...","[-0.62029105, 0.45747545, 0.6659858, -0.671704...","{'Комплектация': ['HDWG480UZSVA'], 'Форм-факто...","[-0.026827315, 0.032079216, 0.040149417, -0.01...","[-0.014153612, -0.02059295, -0.041512348, 0.04..."


In [8]:
# Previously saved feature frames. The "r" variants presumably hold the features
# of the mirrored pairs (rtrain_pairs / rtest_pairs) - confirm against the
# notebook that produced these pickles.
# NOTE(review): unpickling can execute arbitrary code - only load files you trust.
train_df, rtrain_df = (
    pd.read_pickle('./dataframes/train_df.pickle'),
    pd.read_pickle('./dataframes/rtrain_df.pickle'),
)
test_df, rtest_df = (
    pd.read_pickle('./dataframes/test_df.pickle'),
    pd.read_pickle('./dataframes/rtest_df.pickle'),
)

In [9]:
# Columns handed to CatBoost as categorical features: two category columns first ...
cat_features = ['cat3', 'cat4']
# ... followed by attribute columns that come in `_1` / `_2` pairs.
cat_features += [
    'Страна-изготовитель_1',
    'Страна-изготовитель_2',
    'Оперативная память_1',
    'Оперативная память_2',
    'Бренд процессора_1',
    'Бренд процессора_2',
    'Модуль связи Bluetooth_1',
    'Модуль связи Bluetooth_2',
    'Назначение_1',
    'Назначение_2',
]

# Columns handed to CatBoost as embedding features (or dropped when a model does not use them).
embedding_features = [
    'main_pic_1', 'main_pic_2',
    'name_bert_1', 'name_bert_2',
    'name_labse_1', 'name_labse_2',
]

In [10]:
# Pools without the raw embedding columns (no `embedding_features` argument is passed).
# The training frames additionally lose the `target` column.
train_pool, rtrain_pool = (
    Pool(
        data=frame.drop(columns=['target'] + embedding_features),
        cat_features=cat_features,
    )
    for frame in (train_df, rtrain_df)
)
test_pool, rtest_pool = (
    Pool(
        data=frame.drop(columns=embedding_features),
        cat_features=cat_features,
    )
    for frame in (test_df, rtest_df)
)

In [11]:
# Restore the CatBoost classifier stored in golden_model_cb_pseudo.cbm
# (load_model returns the classifier it was called on).
model_cb_pseudo = CatBoostClassifier().load_model(
    fname='./models/golden_model_cb_pseudo.cbm',
)

In [12]:
# Positive-class probability averaged over the regular pool and its "r" counterpart;
# the same averaged score is stored on both the pairs frame and its mirrored copy.
pseudo_train_avg = (
    model_cb_pseudo.predict_proba(train_pool)[:, 1]
    + model_cb_pseudo.predict_proba(rtrain_pool)[:, 1]
) / 2.
train_pairs['cb_pseudo_pred'] = pseudo_train_avg
rtrain_pairs['cb_pseudo_pred'] = pseudo_train_avg

pseudo_test_avg = (
    model_cb_pseudo.predict_proba(test_pool)[:, 1]
    + model_cb_pseudo.predict_proba(rtest_pool)[:, 1]
) / 2.
test_pairs['cb_pseudo_pred'] = pseudo_test_avg
rtest_pairs['cb_pseudo_pred'] = pseudo_test_avg

In [13]:
# Rebuild the four pools, this time keeping the embedding columns and declaring
# them via `embedding_features`. These rebind the pool names used above.
train_pool, rtrain_pool = (
    Pool(
        data=frame.drop(columns=['target']),
        cat_features=cat_features,
        embedding_features=embedding_features,
    )
    for frame in (train_df, rtrain_df)
)
test_pool, rtest_pool = (
    Pool(
        data=frame,
        cat_features=cat_features,
        embedding_features=embedding_features,
    )
    for frame in (test_df, rtest_df)
)

In [14]:
# Restore the CatBoost classifier stored in golden_model_cb.cbm
# (load_model returns the classifier it was called on).
model_cb = CatBoostClassifier().load_model(
    fname='./models/golden_model_cb.cbm',
)

In [15]:
# Positive-class probability averaged over the regular pool and its "r" counterpart;
# the same averaged score is stored on both the pairs frame and its mirrored copy.
cb_train_avg = (
    model_cb.predict_proba(train_pool)[:, 1]
    + model_cb.predict_proba(rtrain_pool)[:, 1]
) / 2.
train_pairs['cb_pred'] = cb_train_avg
rtrain_pairs['cb_pred'] = cb_train_avg

cb_test_avg = (
    model_cb.predict_proba(test_pool)[:, 1]
    + model_cb.predict_proba(rtest_pool)[:, 1]
) / 2.
test_pairs['cb_pred'] = cb_test_avg
rtest_pairs['cb_pred'] = cb_test_avg

In [16]:
# Row flags from hard_idx.csv, parsed once and reused for both frames
# (the original parsed the same file twice).
hard_flags = pd.read_csv('./datasets/hard_idx.csv', index_col=0).values
# `.values` of a DataFrame is 2-D; flatten it so the rows are selected with an
# ordinary 1-D boolean mask. Assumes the CSV holds a single boolean flag column
# next to the index - TODO confirm.
hard_rows = hard_flags.ravel()
if len(hard_rows) != len(train_pairs):
    # Typical cause: this cell was re-run after train_pairs had already been filtered.
    raise ValueError(
        f'hard_idx.csv yields {len(hard_rows)} flags but train_pairs has '
        f'{len(train_pairs)} rows; re-run the notebook from the data-loading cells.'
    )
val_pairs = train_pairs[hard_rows].copy()
rval_pairs = rtrain_pairs[hard_rows].copy()

In [17]:
# Keep the rows flagged in val_idx.csv that are NOT flagged in hard_idx.csv.
# NOTE(review): despite its name, val_idx.csv selects the rows kept in train_pairs
# here - confirm that this is the intended meaning of the file.
val_flags = pd.read_csv('./datasets/val_idx.csv', index_col=0).values
hard_flags = pd.read_csv('./datasets/hard_idx.csv', index_col=0).values
mask = val_flags & ~hard_flags  # same 2-D shape as the arrays read above

# Select rows with a flattened 1-D mask instead of the 2-D `.values` array.
row_mask = mask.ravel()
if len(row_mask) != len(train_pairs):
    # This cell overwrites train_pairs, so running it a second time ends up here.
    raise ValueError(
        f'mask has {len(row_mask)} flags but train_pairs has {len(train_pairs)} rows; '
        're-run the notebook from the data-loading cells.'
    )
train_pairs = train_pairs[row_mask].copy()
rtrain_pairs = rtrain_pairs[row_mask].copy()

In [18]:
# Training pairs kept by the mask above, now carrying the cb_pseudo_pred and cb_pred columns.
train_pairs

Unnamed: 0,target,variantid1,variantid2,cb_pseudo_pred,cb_pred
1,1,53062686,536165289,0.180415,0.175911
6,1,62485795,62487150,0.293636,0.396222
7,1,64634116,539055461,0.632096,0.656641
8,1,67137384,781488410,0.301474,0.385981
10,1,70799285,72938934,0.586648,0.562208
...,...,...,...,...,...
306502,0,795842312,795842564,0.032249,0.022872
306510,0,801461635,801461672,0.051367,0.044114
306520,0,810680230,820119986,0.062628,0.050127
306524,0,814169571,822101626,0.085002,0.093381


In [19]:
# Pairs selected via hard_idx.csv, taken before train_pairs was filtered.
val_pairs

Unnamed: 0,target,variantid1,variantid2,cb_pseudo_pred,cb_pred
16,0,78528663,551861879,0.031700,0.025394
48,1,89571302,590187339,0.879985,0.892545
65,1,90672972,355898383,0.985500,0.980606
66,1,90730073,736643943,0.845335,0.894928
77,1,91260321,422212895,0.906132,0.897436
...,...,...,...,...,...
306485,1,788619018,788623137,0.837735,0.851541
306492,0,794450037,816083556,0.047836,0.056798
306503,0,796354669,796354893,0.024209,0.026371
306511,0,801747460,801760537,0.022295,0.022546


In [20]:
# Test pairs with the two averaged CatBoost score columns attached.
test_pairs

Unnamed: 0,variantid1,variantid2,cb_pseudo_pred,cb_pred
0,52076340,290590137,0.085118,0.072876
1,64525522,204128919,0.065193,0.099754
2,77243372,479860557,0.321192,0.289299
3,86065820,540678372,0.521682,0.431156
4,91566575,258840506,0.221161,0.324661
...,...,...,...,...
18079,666998614,667074522,0.031549,0.030652
18080,670036240,670048449,0.284579,0.327252
18081,670284509,684323809,0.575465,0.632305
18082,692172005,704805270,0.828207,0.858653


# Features

In [21]:
def calc_dists(df, prefix, embs_1, embs_2):
    """Add three pairwise embedding metrics to ``df`` in place.

    ``embs_1`` and ``embs_2`` are iterated in lockstep; each item must support
    NumPy-style arithmetic (``-``, ``**``, ``@``, ``.sum()``). For every pair
    the following values are computed and written as new columns:

    * ``{prefix}_l1_dist``  - sum of absolute coordinate differences,
    * ``{prefix}_l2_dist``  - Euclidean distance,
    * ``{prefix}_cos_dist`` - dot product divided by both vector norms.
      Despite the column name this is the cosine *similarity*, not a distance.

    Nothing is returned; ``df`` is modified.
    """
    columns = {
        f'{prefix}_l1_dist': [],
        f'{prefix}_l2_dist': [],
        f'{prefix}_cos_dist': [],
    }
    l1_values, l2_values, cos_values = columns.values()

    for vec_a, vec_b in zip(embs_1, embs_2):
        norm_a = (vec_a**2).sum()**0.5
        norm_b = (vec_b**2).sum()**0.5
        l1_values.append(np.abs(vec_a - vec_b).sum())
        l2_values.append(((vec_a - vec_b)**2).sum()**0.5)
        cos_values.append((vec_a @ vec_b) / norm_a / norm_b)

    # Dict order is insertion order, so the columns are added as l1, l2, cos.
    for column_name, values in columns.items():
        df[column_name] = values

In [53]:
def make_features(pairs, data):
    """Build the model feature frame for a set of variant pairs.

    For every row of ``pairs`` the ``neuro_768`` embeddings of both variants
    are looked up in ``data``; distance features are added through
    ``calc_dists`` and each embedding is expanded into one column per
    component (``neuro_emb{i}_1`` for the first variant, ``neuro_emb{i}_2``
    for the second).

    Parameters
    ----------
    pairs : pandas.DataFrame
        Must contain ``variantid1`` and ``variantid2``; all other columns are
        carried over unchanged.  The frame itself is not modified.
    data : pandas.DataFrame
        Indexed by variant id, with a ``neuro_768`` column holding one 1-D
        array per variant.

    Returns
    -------
    pandas.DataFrame
        The remaining ``pairs`` columns, then the ``neuro_*_dist`` columns,
        then the expanded embedding columns, on the index of ``pairs``.
        Embedding columns keep the dtype of the stored vectors.

    Raises
    ------
    KeyError
        If a variant id from ``pairs`` is missing from ``data``.
    """
    gc.collect()
    emb_1 = data.loc[pairs['variantid1'], 'neuro_768'].values
    emb_2 = data.loc[pairs['variantid2'], 'neuro_768'].values

    # Dropping the ids first yields a new frame (``pairs`` stays intact) and
    # avoids copying the wide result again at the end.
    df = pairs.drop(['variantid1', 'variantid2'], axis=1)
    calc_dists(df, 'neuro', emb_1, emb_2)

    # One concat instead of 1536 single-column inserts: column-wise insertion
    # fragments the frame and needed an extra defragmenting copy.
    blocks = [df]
    for side, embs in ((1, emb_1), (2, emb_2)):
        # np.stack cannot infer a width from nothing; fall back to 768.
        matrix = np.stack(embs) if len(embs) else np.empty((0, 768))
        blocks.append(pd.DataFrame(
            matrix,
            index=df.index,
            columns=[f'neuro_emb{i}_{side}' for i in range(matrix.shape[1])],
        ))
    return pd.concat(blocks, axis=1)

In [54]:
%%time
# Build the feature frame for the training pairs; %%time reports how long the cell takes.
train_df = make_features(train_pairs, train_data)
# Show the resulting frame as the cell output.
train_df

CPU times: total: 1min 6s
Wall time: 1min 6s


Unnamed: 0,target,cb_pseudo_pred,cb_pred,neuro_l1_dist,neuro_l2_dist,neuro_cos_dist,neuro_emb0_1,neuro_emb1_1,neuro_emb2_1,neuro_emb3_1,neuro_emb4_1,neuro_emb5_1,neuro_emb6_1,neuro_emb7_1,neuro_emb8_1,neuro_emb9_1,neuro_emb10_1,neuro_emb11_1,neuro_emb12_1,neuro_emb13_1,neuro_emb14_1,neuro_emb15_1,neuro_emb16_1,neuro_emb17_1,neuro_emb18_1,neuro_emb19_1,neuro_emb20_1,neuro_emb21_1,neuro_emb22_1,neuro_emb23_1,neuro_emb24_1,neuro_emb25_1,neuro_emb26_1,neuro_emb27_1,neuro_emb28_1,neuro_emb29_1,neuro_emb30_1,neuro_emb31_1,neuro_emb32_1,neuro_emb33_1,neuro_emb34_1,neuro_emb35_1,neuro_emb36_1,neuro_emb37_1,neuro_emb38_1,neuro_emb39_1,neuro_emb40_1,neuro_emb41_1,neuro_emb42_1,neuro_emb43_1,neuro_emb44_1,neuro_emb45_1,neuro_emb46_1,neuro_emb47_1,neuro_emb48_1,neuro_emb49_1,neuro_emb50_1,neuro_emb51_1,neuro_emb52_1,neuro_emb53_1,neuro_emb54_1,neuro_emb55_1,neuro_emb56_1,neuro_emb57_1,neuro_emb58_1,neuro_emb59_1,neuro_emb60_1,neuro_emb61_1,neuro_emb62_1,neuro_emb63_1,neuro_emb64_1,neuro_emb65_1,neuro_emb66_1,neuro_emb67_1,neuro_emb68_1,neuro_emb69_1,neuro_emb70_1,neuro_emb71_1,neuro_emb72_1,neuro_emb73_1,neuro_emb74_1,neuro_emb75_1,neuro_emb76_1,neuro_emb77_1,neuro_emb78_1,neuro_emb79_1,neuro_emb80_1,neuro_emb81_1,neuro_emb82_1,neuro_emb83_1,neuro_emb84_1,neuro_emb85_1,neuro_emb86_1,neuro_emb87_1,neuro_emb88_1,neuro_emb89_1,neuro_emb90_1,neuro_emb91_1,neuro_emb92_1,neuro_emb93_1,neuro_emb94_1,neuro_emb95_1,neuro_emb96_1,neuro_emb97_1,neuro_emb98_1,neuro_emb99_1,neuro_emb100_1,neuro_emb101_1,neuro_emb102_1,neuro_emb103_1,neuro_emb104_1,neuro_emb105_1,neuro_emb106_1,neuro_emb107_1,neuro_emb108_1,neuro_emb109_1,neuro_emb110_1,neuro_emb111_1,neuro_emb112_1,neuro_emb113_1,neuro_emb114_1,neuro_emb115_1,neuro_emb116_1,neuro_emb117_1,neuro_emb118_1,neuro_emb119_1,neuro_emb120_1,neuro_emb121_1,...,neuro_emb640_2,neuro_emb641_2,neuro_emb642_2,neuro_emb643_2,neuro_emb644_2,neuro_emb645_2,neuro_emb646_2,neuro_emb647_2,neuro_emb648_2,neuro_emb649_2,neuro_emb650_2,neuro_emb651_2,neuro_emb652
_2,neuro_emb653_2,neuro_emb654_2,neuro_emb655_2,neuro_emb656_2,neuro_emb657_2,neuro_emb658_2,neuro_emb659_2,neuro_emb660_2,neuro_emb661_2,neuro_emb662_2,neuro_emb663_2,neuro_emb664_2,neuro_emb665_2,neuro_emb666_2,neuro_emb667_2,neuro_emb668_2,neuro_emb669_2,neuro_emb670_2,neuro_emb671_2,neuro_emb672_2,neuro_emb673_2,neuro_emb674_2,neuro_emb675_2,neuro_emb676_2,neuro_emb677_2,neuro_emb678_2,neuro_emb679_2,neuro_emb680_2,neuro_emb681_2,neuro_emb682_2,neuro_emb683_2,neuro_emb684_2,neuro_emb685_2,neuro_emb686_2,neuro_emb687_2,neuro_emb688_2,neuro_emb689_2,neuro_emb690_2,neuro_emb691_2,neuro_emb692_2,neuro_emb693_2,neuro_emb694_2,neuro_emb695_2,neuro_emb696_2,neuro_emb697_2,neuro_emb698_2,neuro_emb699_2,neuro_emb700_2,neuro_emb701_2,neuro_emb702_2,neuro_emb703_2,neuro_emb704_2,neuro_emb705_2,neuro_emb706_2,neuro_emb707_2,neuro_emb708_2,neuro_emb709_2,neuro_emb710_2,neuro_emb711_2,neuro_emb712_2,neuro_emb713_2,neuro_emb714_2,neuro_emb715_2,neuro_emb716_2,neuro_emb717_2,neuro_emb718_2,neuro_emb719_2,neuro_emb720_2,neuro_emb721_2,neuro_emb722_2,neuro_emb723_2,neuro_emb724_2,neuro_emb725_2,neuro_emb726_2,neuro_emb727_2,neuro_emb728_2,neuro_emb729_2,neuro_emb730_2,neuro_emb731_2,neuro_emb732_2,neuro_emb733_2,neuro_emb734_2,neuro_emb735_2,neuro_emb736_2,neuro_emb737_2,neuro_emb738_2,neuro_emb739_2,neuro_emb740_2,neuro_emb741_2,neuro_emb742_2,neuro_emb743_2,neuro_emb744_2,neuro_emb745_2,neuro_emb746_2,neuro_emb747_2,neuro_emb748_2,neuro_emb749_2,neuro_emb750_2,neuro_emb751_2,neuro_emb752_2,neuro_emb753_2,neuro_emb754_2,neuro_emb755_2,neuro_emb756_2,neuro_emb757_2,neuro_emb758_2,neuro_emb759_2,neuro_emb760_2,neuro_emb761_2,neuro_emb762_2,neuro_emb763_2,neuro_emb764_2,neuro_emb765_2,neuro_emb766_2,neuro_emb767_2
1,1,0.180415,0.175911,7.836064,0.349518,0.938919,-0.052533,-0.010321,-0.018409,0.019210,-0.035565,-0.021615,-0.007733,0.009223,-0.018848,-0.005369,0.048870,-0.036869,0.024449,-0.073497,0.051336,0.019532,0.027405,-0.020072,-0.051782,0.005662,0.033468,0.012370,-0.021671,0.032232,0.089572,-0.028749,-0.025404,-0.034889,-0.021541,0.013641,0.016660,-0.004992,0.046017,0.000753,-0.027249,-0.043440,0.005367,0.013667,-0.055865,0.005212,0.074097,-0.001832,-0.055264,-0.021586,-0.043754,-0.027593,0.062113,-0.018998,-0.042171,0.054622,0.007686,-0.006904,-0.059646,0.063061,0.000404,-0.061159,0.008407,0.038472,0.053030,-0.034579,0.014574,0.009309,0.009789,0.032344,-0.046324,0.091659,0.034418,-0.028864,-0.055046,0.062803,-0.040509,-0.000807,0.042615,0.006885,-0.055011,0.031836,0.052696,0.018935,0.003109,-0.049031,0.009331,-0.035544,-0.021560,0.074447,0.007626,0.024978,-0.010133,-0.022230,0.011347,-0.059181,0.007697,-0.028451,-0.026434,0.003373,-0.003054,0.001579,-0.006460,0.034971,0.045982,-0.031823,-0.025331,0.006353,0.035984,-0.009276,-0.019076,-0.046111,0.032565,-0.011219,-0.019230,-0.028431,0.055191,0.033232,-0.050771,0.007558,-0.009717,-0.002783,0.006632,0.070584,0.028159,0.028502,-0.026983,-0.046753,...,0.002060,-0.071942,0.026704,-0.041625,-0.033724,0.015036,0.051252,-0.100317,-0.053787,-0.001263,-0.047799,0.014483,-0.000151,0.010409,-0.029907,-0.022090,0.011604,-0.014732,-0.074514,-0.046521,0.068967,0.026727,-0.022415,0.031487,0.003055,-0.022728,-0.013704,0.059213,-0.018305,0.019263,0.001033,0.003389,-0.022522,-0.065247,-0.044647,0.008008,0.024158,-0.020667,0.053892,-0.050370,-0.036240,-0.027773,-0.045460,-0.025576,-0.011537,0.019915,0.002435,-0.049851,-0.009026,-0.069909,0.025779,0.085231,-0.047029,-0.067997,-0.082566,-0.036789,-0.009356,0.009873,0.024209,0.035280,-0.078903,-0.075137,0.045546,0.015556,0.072073,-0.023749,-0.019690,-0.026342,0.026552,-0.041214,0.003301,-0.025510,0.007107,0.016067,0.011676,-0.050904,0.025120,-0.033127,0.008473,0.021376,0.002927,0.040143,-0.006
498,-0.037550,0.017705,0.017550,-0.064080,0.013703,-0.012530,0.033072,0.046809,0.029771,0.027865,0.010540,0.038064,-0.040250,0.059977,-0.045145,0.054262,-0.001467,-0.033185,-0.004836,-0.025181,-0.021404,-0.024222,0.001178,-0.029864,0.035245,0.047853,-0.026213,0.092067,-0.052657,-0.042336,0.009588,-0.050639,-0.024883,-0.022802,-0.060374,0.003297,-0.002825,-0.020281,-0.005190,-0.009711,0.037417,-0.031178,-0.031756,-0.006167,0.019504
6,1,0.293636,0.396222,8.726835,0.390595,0.923718,-0.020976,-0.045143,-0.015406,0.027676,-0.013045,-0.031581,-0.019189,0.027724,-0.021688,0.008349,0.056971,-0.047110,0.037094,-0.066915,0.025603,-0.009370,0.037100,0.007092,-0.065193,-0.000369,0.048436,0.020622,-0.012416,-0.018536,0.090664,-0.052969,0.006225,-0.011249,-0.029764,-0.006306,0.013082,-0.012446,0.057457,0.018282,-0.005435,-0.043172,-0.002670,-0.006485,-0.035092,-0.001217,0.081923,-0.005742,-0.055043,-0.005100,0.004116,-0.036780,0.082820,-0.051808,-0.049457,0.041861,-0.022825,-0.020421,-0.015951,0.065513,-0.011435,-0.013488,0.015549,0.019761,0.036638,-0.033042,0.013407,0.043423,-0.002401,0.029330,-0.014199,0.063133,0.056086,-0.039708,-0.053123,0.042226,-0.053265,-0.011555,0.028991,0.030472,-0.024680,0.002057,0.053952,-0.023770,0.008690,-0.008591,0.013087,-0.048837,-0.019044,0.082215,0.036194,-0.005000,-0.014485,-0.014015,0.025808,-0.043905,-0.011318,-0.033110,0.007265,0.012769,-0.013347,-0.015627,-0.006732,0.013646,0.024895,-0.005335,-0.000792,0.018881,0.015973,0.021593,-0.026293,-0.031979,0.007483,0.010966,-0.017643,-0.061654,0.065567,0.028678,-0.052217,-0.017241,-0.017156,0.001858,0.011284,0.065141,0.025465,-0.004849,-0.000370,-0.050102,...,0.065166,-0.051192,0.052458,-0.024280,-0.037039,0.022340,-0.004344,-0.073962,0.009662,-0.001664,-0.061240,0.019931,0.034039,0.048029,0.007928,-0.031701,-0.008992,0.008169,-0.066881,-0.018686,0.052615,0.026980,-0.009707,0.030879,0.002979,-0.080940,0.015333,0.056873,-0.026314,0.027079,0.003797,0.040137,0.017797,-0.050680,0.007113,0.010978,0.008198,-0.045981,0.018300,-0.037948,-0.060555,-0.045118,-0.059001,-0.069647,-0.019625,0.028230,-0.036467,-0.056824,0.008952,-0.037240,0.036999,0.068956,-0.019549,-0.091632,-0.062723,0.022638,0.010875,0.019333,0.020982,0.053472,-0.050562,-0.055164,0.070730,-0.020098,0.047900,-0.053113,0.000449,-0.041500,0.024072,-0.093349,-0.003256,-0.016452,0.001403,0.030579,-0.001475,-0.058956,0.047326,0.006519,0.046678,0.000375,-0.043552,0.039270,-0.
003522,0.040301,-0.023439,0.014325,-0.061931,-0.024395,-0.047578,0.004786,0.042996,0.052893,-0.004406,0.037746,0.035445,-0.027968,0.025986,-0.036593,0.071582,0.009923,0.001354,-0.009852,-0.022267,-0.014937,0.007959,-0.038645,-0.015279,0.021998,0.053541,-0.020772,0.077268,-0.066834,-0.001928,-0.017571,-0.047611,-0.048989,-0.012301,-0.084132,-0.000934,-0.030706,0.002868,-0.040266,-0.027873,0.013982,0.006577,-0.006468,0.010451,0.020071
7,1,0.632096,0.656641,4.660522,0.208635,0.978236,-0.011690,0.016420,-0.019185,-0.001463,-0.039949,0.042183,-0.057112,-0.001151,-0.043595,0.000727,-0.001967,-0.041948,-0.032531,-0.082799,0.044880,0.039524,-0.007488,-0.022113,-0.007534,-0.039087,0.006332,-0.031952,-0.031511,0.013814,0.023864,0.011322,-0.017387,-0.036641,0.020899,0.022532,0.049954,-0.027428,0.052635,-0.032729,-0.037026,-0.070206,-0.049107,0.004149,-0.057716,0.038148,0.086895,0.012916,-0.025406,-0.030879,-0.012970,-0.038684,0.033464,-0.053146,-0.005108,0.038732,0.003365,0.063914,-0.069697,0.029248,-0.017822,-0.052696,-0.024931,0.017971,-0.008031,-0.022430,0.050103,-0.022678,-0.052919,0.029035,-0.024904,0.065577,0.032002,-0.056141,-0.043520,0.050324,-0.028467,-0.003729,0.040389,-0.049029,-0.046331,0.052340,0.003346,-0.007857,0.014447,-0.075554,-0.003925,-0.049070,-0.020818,0.066070,0.020148,0.028021,-0.035839,0.003484,-0.016326,-0.034317,0.030575,-0.018829,-0.066525,-0.030806,0.039832,0.022393,0.028605,0.033144,0.043933,-0.054465,-0.053464,-0.010045,0.007846,-0.040868,-0.012712,-0.049113,-0.014051,-0.054552,-0.061357,-0.026095,0.073528,0.023074,-0.010330,0.019795,-0.019843,0.009847,-0.004286,0.048401,0.013359,0.062496,-0.014359,-0.005028,...,-0.007854,-0.057589,-0.024000,-0.028029,-0.027277,0.018701,0.040219,-0.003525,-0.058816,0.016347,-0.011430,-0.001832,0.007887,-0.019873,-0.064467,-0.055866,0.030689,-0.014409,-0.076386,-0.016548,0.043225,0.055664,-0.010722,-0.036955,0.033414,0.008207,0.034421,-0.001540,-0.007785,-0.021185,0.060916,0.034752,-0.010058,-0.021870,-0.051634,-0.009901,0.069506,-0.004223,-0.003811,-0.056451,-0.043408,0.028865,-0.025481,0.015239,0.019833,-0.006340,-0.018354,-0.017782,-0.057321,-0.009987,-0.039721,0.015928,0.031345,-0.021334,-0.064813,0.025887,0.024719,0.049523,0.002906,0.046227,-0.033534,-0.007405,0.056287,0.025206,0.018513,-0.048567,-0.000666,-0.051615,0.024619,-0.051691,0.005294,-0.077366,-0.039473,0.017768,0.004634,-0.036341,-0.036211,0.026175,-0.016727,-0.056751,0.035328
,0.026289,0.031484,-0.067304,0.071313,0.029225,-0.002607,-0.032151,0.030263,0.014152,0.012423,-0.025677,-0.015321,-0.028327,0.007617,0.023130,-0.017840,-0.017746,0.034115,-0.020648,-0.000937,-0.047807,0.013477,0.061693,-0.047603,0.015075,0.010827,0.047254,0.042482,-0.092026,0.033523,-0.042655,-0.037029,0.001679,-0.042737,-0.012501,0.021701,-0.013352,0.041898,0.002531,0.011722,0.009779,-0.002148,0.047544,0.020900,0.023644,-0.033818,-0.048896
8,1,0.301474,0.385981,3.958456,0.176286,0.984462,0.017534,0.038868,-0.031238,-0.014903,-0.032741,0.044969,-0.052109,-0.041142,-0.042286,-0.017079,-0.020923,-0.024740,-0.038269,-0.054511,0.048125,0.042815,-0.011877,-0.010265,0.019790,-0.049883,-0.020210,-0.041165,-0.023996,0.027286,-0.010650,0.012868,-0.026229,-0.031508,0.020493,0.027138,0.032884,-0.039353,0.043868,-0.030057,-0.030554,-0.053415,-0.057927,0.037622,-0.057874,0.048813,0.058536,0.032826,0.002815,-0.009563,-0.010988,-0.026045,-0.007782,-0.049423,0.015433,-0.005623,0.005190,0.080633,-0.051485,0.004279,-0.023949,-0.032112,-0.045076,-0.003263,-0.040169,-0.000813,0.047106,-0.021343,-0.069601,0.034598,-0.000318,0.071843,0.016701,-0.044663,0.010672,0.021560,-0.002855,-0.014092,0.043024,-0.057132,-0.043119,0.051453,-0.037315,0.004560,0.027751,-0.058274,-0.014906,-0.014855,-0.013570,0.028348,0.027222,0.050414,-0.018891,-0.000750,-0.039222,-0.030401,0.055620,-0.013600,-0.060789,-0.051981,0.041069,0.018455,0.061154,-0.009841,0.044431,-0.066305,-0.045908,-0.039208,0.002916,-0.057867,-0.015346,-0.015224,0.003053,-0.067642,-0.042824,-0.004842,0.057780,0.001895,0.002533,0.048597,-0.012151,0.022675,0.015651,0.043279,0.017596,0.057024,-0.022009,0.027201,...,-0.008428,-0.024401,-0.039502,-0.009557,-0.008109,0.024552,0.038099,0.035796,-0.037012,-0.017732,-0.007429,-0.001069,0.003595,-0.036941,-0.018137,-0.046503,0.017706,-0.003957,-0.066829,0.006648,0.010921,0.034615,0.028828,-0.045540,0.042557,0.020990,0.043798,-0.003862,0.003099,-0.015781,0.063749,0.000720,0.001920,-0.005164,-0.038341,-0.034480,0.038344,0.003700,-0.044490,-0.047315,-0.034226,0.029379,0.005234,0.032745,0.015239,-0.004715,-0.023521,-0.011705,-0.033745,0.018377,-0.075331,-0.034321,0.061852,0.001379,-0.029625,0.006074,0.022871,0.043592,-0.025232,0.026252,-0.016807,0.026511,0.028789,0.032878,-0.019982,-0.033732,-0.009207,-0.040880,0.012441,-0.025849,0.001041,-0.071529,-0.038895,0.027840,0.017326,-0.019277,-0.013809,0.028488,-0.037895,-0.064594,0.044065,-0.004
190,0.025750,-0.074227,0.062246,0.015896,0.039011,-0.028284,0.044052,-0.007482,0.022898,-0.023076,-0.017118,-0.028610,-0.001833,0.034315,-0.053856,-0.017201,0.024917,-0.007657,-0.005138,-0.048995,0.028143,0.071245,-0.058475,0.031046,0.018292,0.040979,0.038795,-0.072059,0.015030,-0.024691,0.002755,0.018355,-0.020832,-0.004146,0.040031,-0.023122,0.006431,-0.004156,0.005641,0.017926,0.014959,0.041494,0.007740,0.036360,-0.038262,-0.057144
10,1,0.586648,0.562208,5.713414,0.255754,0.967295,-0.002543,0.029435,-0.007112,-0.043198,-0.023454,0.055567,-0.054406,0.015760,-0.046751,-0.008061,0.006914,-0.052569,-0.043407,-0.067387,0.037723,0.027766,-0.021145,0.000477,-0.013110,-0.056720,-0.035549,-0.022939,-0.025830,0.006101,0.001025,-0.010006,-0.008366,-0.028805,0.028508,0.010671,0.069422,-0.032081,0.021326,-0.059415,-0.041644,-0.046885,-0.068311,0.019375,-0.034709,0.020202,0.050740,0.016928,0.016345,-0.050038,0.014628,-0.022435,0.048175,-0.042369,-0.005621,0.011106,0.003171,0.080137,-0.062015,0.007644,-0.021215,-0.015075,-0.043192,-0.025854,-0.065235,-0.036629,0.040842,-0.023396,-0.050122,0.035380,0.027300,0.038739,0.064067,-0.033546,-0.034161,0.021614,-0.008504,-0.010217,0.023857,-0.020777,-0.008793,0.009624,-0.025385,0.010251,0.043669,-0.067134,0.000823,-0.006416,0.021069,0.038485,0.044857,0.026796,-0.058787,0.009123,0.022193,-0.007141,0.011485,0.005094,-0.063696,-0.031754,0.005702,0.002071,0.053142,-0.019981,0.025147,-0.040297,-0.058816,0.003888,-0.014271,-0.080474,-0.015057,-0.028321,-0.020863,-0.059217,-0.057723,-0.014121,0.046605,-0.049674,0.021837,0.033657,-0.040089,0.007360,-0.018662,0.022660,-0.000441,0.054951,0.023002,0.048733,...,-0.007086,-0.023420,0.008290,-0.020389,-0.032184,0.037010,0.049639,-0.012227,-0.060380,-0.005412,-0.023502,-0.012993,0.024636,-0.043780,-0.040901,-0.046006,0.044008,-0.012752,-0.068788,-0.030503,0.021307,0.048893,-0.017309,-0.018679,0.046388,-0.008700,0.036012,-0.011081,-0.038047,0.013688,0.064949,0.019558,-0.010367,-0.048382,-0.045805,-0.012113,0.047064,-0.014196,-0.010971,-0.043521,-0.048339,0.003000,-0.024299,0.001460,0.007800,0.017746,0.018435,-0.022465,-0.037267,0.021822,-0.078214,0.011793,0.055339,-0.024378,-0.053230,0.027740,-0.011357,0.060745,-0.012426,0.017595,-0.021998,-0.018652,0.071969,0.000742,0.027730,-0.037777,0.002225,-0.041560,0.026584,-0.043538,0.035339,-0.082260,-0.023910,0.004409,0.004803,-0.048353,0.000611,-0.002892,-0.026486,-0.049979,0.028916,0.0020
04,0.016706,-0.055852,0.063516,-0.002726,0.008624,-0.011100,0.025753,0.012176,0.010749,-0.031395,-0.049210,-0.017452,0.015796,0.021483,-0.029008,-0.039586,0.030173,-0.020549,0.023414,-0.024824,0.017403,0.060763,-0.062675,0.028367,0.014419,0.077169,0.018907,-0.053798,0.012386,-0.021474,-0.004572,0.030028,-0.018819,0.001568,0.031103,-0.020210,0.030866,0.022564,0.017403,0.029281,-0.021216,0.023711,0.019702,0.036239,-0.024460,-0.060940
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
306502,0,0.032249,0.022872,10.005867,0.447627,0.899815,0.057678,-0.067868,0.027262,0.042625,0.006632,-0.064349,0.022881,0.041245,0.032972,-0.052116,-0.006003,0.012777,0.046803,0.026277,0.000470,-0.064079,0.020504,0.056748,-0.004356,0.072267,0.024385,-0.006167,-0.029805,0.008067,-0.039962,-0.048232,-0.060275,0.031734,-0.047960,-0.042727,0.005528,0.047633,-0.002589,0.044173,0.032406,0.082181,0.048217,0.007299,-0.001079,-0.005540,-0.019588,0.028787,-0.064283,0.072155,-0.004929,-0.038013,0.017243,-0.016619,-0.033201,-0.005996,0.031414,-0.064573,0.026227,0.032759,0.000363,0.049814,-0.017320,0.008856,-0.027982,0.044566,-0.058185,0.050924,-0.013265,0.024954,0.055973,0.023921,-0.009354,-0.006909,-0.025507,-0.068305,-0.001439,-0.024025,0.039904,0.091662,0.012552,-0.069369,0.032235,-0.001469,0.020045,0.058433,-0.003842,-0.026228,-0.003447,0.005891,-0.001047,-0.030730,0.002906,-0.017312,-0.014612,0.003419,0.017311,0.003261,0.068996,0.040447,-0.046450,0.005444,-0.036133,-0.036897,0.005214,0.020890,0.055545,-0.007661,-0.003567,0.057954,-0.000819,0.037644,0.014546,-0.004032,0.034138,0.035025,0.012544,0.045345,0.023633,-0.013026,-0.001217,-0.025275,-0.041008,0.002961,0.013502,-0.086297,0.021167,-0.025377,...,0.021375,0.029645,0.034072,-0.011682,-0.007620,0.047773,-0.019385,-0.050662,0.004019,0.050495,-0.051353,0.043788,0.082205,0.063761,0.064374,-0.044711,0.004285,0.046391,-0.012563,-0.035565,-0.005032,-0.079581,-0.014132,0.000979,-0.029766,-0.014317,0.018611,-0.034817,-0.013880,0.059203,-0.040985,0.022248,0.006623,-0.049916,0.008981,0.005817,-0.086377,-0.027044,-0.022004,-0.041924,0.003735,0.026988,0.014956,-0.054515,-0.023806,0.076897,0.018930,-0.044506,0.023950,-0.013024,-0.005625,0.020394,-0.037230,-0.049585,0.057643,-0.020659,0.022708,-0.065571,0.055926,0.000486,0.029367,-0.030892,-0.029559,-0.053900,0.028332,0.017416,0.036783,0.034005,0.029007,-0.026226,0.007520,0.025881,0.035534,-0.018206,-0.021071,-0.021585,0.072909,-0.039366,0.016316,0.022997,-0.094718,-0.059538,0.030377,
0.019400,-0.025187,-0.030419,-0.033075,0.016798,-0.037463,0.057246,0.057234,0.050248,-0.031039,-0.053337,-0.036440,0.031605,-0.005919,0.046931,-0.014440,0.039704,0.016877,0.000866,0.071014,-0.011408,-0.002970,-0.015479,-0.027060,0.010524,-0.014597,0.048063,0.007965,-0.069661,0.007903,-0.001499,-0.011031,-0.015903,0.014645,-0.038083,0.015657,-0.013656,-0.019992,-0.010109,0.029973,-0.002756,-0.029173,0.032712,0.004944,-0.010951
306510,0,0.051367,0.044114,0.000023,0.000001,1.000000,-0.050865,-0.031015,0.018722,-0.013247,-0.007015,-0.001438,0.060876,0.008595,-0.000086,0.040194,0.045565,0.047729,0.066559,0.046900,-0.020905,-0.043895,0.021700,0.024734,-0.040810,0.048190,0.003155,0.032079,-0.007533,0.016612,-0.001901,-0.054207,0.047343,0.046870,-0.000010,-0.033504,-0.017791,0.023973,-0.032101,0.022877,0.008989,0.043942,0.044372,0.014075,0.047008,-0.011343,-0.022079,0.014303,0.057892,0.003959,0.068086,0.053398,0.010167,0.039353,-0.002445,0.020719,-0.033600,-0.044579,0.046746,-0.033660,0.006592,-0.022818,0.007504,0.033685,0.008406,-0.001022,-0.023820,0.038327,0.117806,-0.045111,-0.013626,-0.033596,0.006685,0.043201,0.010074,-0.055090,-0.000378,0.018014,0.005221,0.047580,0.054870,-0.080007,0.083942,0.000338,-0.014775,0.041413,-0.071506,-0.004589,0.003834,-0.018464,0.001319,-0.023922,-0.037112,0.015199,0.046244,0.070171,-0.020856,-0.038096,0.025565,-0.003845,-0.052621,0.014548,-0.066795,0.008206,-0.018747,-0.023714,0.025467,-0.012503,0.005283,0.069343,-0.005021,-0.005340,0.051992,0.023872,0.047948,-0.018372,-0.003062,0.012295,-0.024357,-0.002582,0.032028,-0.053571,-0.000584,-0.039673,0.029550,-0.059735,-0.015826,-0.020681,...,0.025092,0.033160,0.047982,-0.015328,0.013715,-0.072829,-0.067806,-0.012878,0.054996,0.019737,0.019778,0.026244,0.027084,-0.020200,0.050818,0.062497,-0.023755,0.031330,0.035394,0.011601,-0.027001,-0.066501,-0.010888,0.058965,0.000056,-0.045450,-0.026417,0.062099,-0.021291,0.020274,-0.048092,0.000469,0.028278,-0.008373,0.005604,-0.004870,-0.020536,-0.012359,-0.009372,0.079740,0.017159,-0.043916,-0.040549,-0.074100,-0.007627,0.027010,0.023364,0.017991,0.043084,-0.018178,-0.000096,-0.000925,0.002998,-0.010338,-0.002319,-0.028172,-0.038863,-0.007062,-0.012265,-0.050037,-0.007206,0.000824,0.012480,0.029110,-0.003362,0.009295,0.008680,0.032560,0.031583,-0.013468,0.047678,0.067149,0.022276,-0.004656,0.021134,0.005502,0.050163,0.001281,0.003921,-0.040420,-0.044105,-0.012305,-0.054858,
0.002961,-0.042299,-0.008397,-0.020843,0.004527,-0.065203,-0.003076,-0.028711,0.069539,-0.019592,0.037724,0.000710,-0.046421,0.014620,0.030005,0.024736,-0.012060,0.038359,0.047357,-0.021529,-0.047348,0.028538,-0.051781,-0.010254,0.033528,-0.047558,0.062810,0.015283,0.009075,0.073817,0.012827,0.024458,0.006560,-0.054531,0.042832,0.021957,-0.010263,-0.003666,-0.052402,-0.044925,-0.045718,0.022304,-0.008545,0.032012,0.092396
306520,0,0.062628,0.050127,16.342211,0.731040,0.732790,-0.033469,0.021019,-0.015605,0.069191,-0.026031,-0.030137,0.003087,0.001085,-0.004620,0.016377,-0.026186,0.039304,0.046956,0.040034,-0.032414,-0.033167,0.035272,0.010412,-0.006761,0.051701,0.039436,0.015426,-0.017248,0.011682,0.027129,-0.021373,0.020781,0.055132,-0.027626,-0.030336,0.012440,0.030315,0.025169,0.020368,-0.002786,0.006148,0.082936,-0.004920,-0.037308,0.038054,0.036525,-0.027097,-0.060623,0.020549,-0.007246,-0.042898,-0.019740,0.033321,-0.003022,0.063541,0.002805,-0.081900,0.027897,0.018741,-0.011365,-0.055080,-0.014536,0.082372,0.056535,0.014120,0.027795,0.035093,0.017867,-0.011996,-0.077461,-0.017177,-0.065055,0.001060,0.003666,-0.032027,-0.059272,-0.005647,0.035037,0.012656,0.007539,0.023744,0.094065,-0.018075,-0.014024,0.034705,-0.013486,-0.080558,-0.069979,0.021368,-0.039954,-0.006954,0.003933,-0.007512,-0.030100,0.011352,0.043047,-0.048082,0.039134,0.004175,0.035502,0.066442,-0.084292,0.040853,0.026190,-0.041865,-0.018257,-0.048349,0.041095,0.067966,0.041399,-0.003171,-0.000308,0.018596,0.012040,-0.001529,0.018505,0.097976,-0.071478,-0.005445,0.035393,-0.016640,-0.049102,0.080064,0.007855,-0.006957,-0.046524,-0.047202,...,0.057976,-0.017412,-0.011267,-0.032801,-0.005831,-0.080857,-0.061376,0.054479,0.058956,0.044526,0.019566,0.020218,-0.020132,0.018746,-0.003312,-0.007975,-0.052875,0.046637,0.002218,0.038901,0.034704,0.035475,0.001563,-0.001057,0.024844,-0.078675,0.017894,0.036103,0.015135,-0.001932,0.007057,0.052964,0.039704,0.015178,0.008556,0.009089,0.026575,-0.035556,0.002478,-0.003490,-0.039534,0.009333,-0.047552,-0.045938,-0.000682,-0.023235,-0.077062,0.001852,-0.022048,-0.045034,0.039577,0.015769,0.001251,-0.031566,-0.046622,0.048046,0.071499,0.039323,0.005848,0.048805,-0.010178,0.008823,0.038495,0.034769,-0.018738,-0.058553,0.020942,-0.090770,-0.003706,-0.110750,-0.011405,-0.029868,-0.031981,0.027825,0.035016,-0.026835,-0.002113,0.067736,0.047635,-0.068754,-0.016312,-0.003825,0.042038,
0.026823,-0.031010,0.038360,-0.000165,-0.089227,-0.038983,-0.018560,-0.006572,0.034889,-0.006639,0.054377,-0.020978,0.000047,-0.030819,0.049270,0.046030,0.009344,0.025100,-0.003488,0.016210,0.000991,0.043704,-0.056235,-0.023832,-0.006171,0.013305,-0.063134,0.040878,-0.032570,0.005423,-0.039519,-0.033565,-0.024695,-0.029208,-0.024336,0.015720,-0.034078,0.014501,-0.067129,-0.007332,0.027043,0.056418,0.026652,0.004735,0.029643
306524,0,0.085002,0.093381,13.459804,0.608179,0.815059,-0.015614,0.010031,-0.002631,-0.041415,-0.025834,0.002455,-0.040742,-0.001509,-0.068643,0.001327,0.019093,0.008542,0.035834,-0.005710,0.027202,0.080408,0.005802,-0.016807,0.029287,-0.021411,-0.005520,-0.007791,0.022791,0.011229,0.026709,0.018486,-0.025013,0.042968,-0.004813,-0.015037,-0.069034,0.019542,0.011712,-0.034980,0.053099,0.039510,-0.045370,-0.046076,0.024033,-0.036387,0.038008,0.032016,-0.008532,-0.027047,-0.025878,-0.005936,-0.000644,0.001001,0.003191,-0.023426,-0.022524,0.019506,0.033449,-0.032545,0.018979,0.023951,-0.004856,0.028570,0.013938,-0.029570,0.001656,-0.020628,-0.042969,0.014581,0.039418,-0.021037,-0.004414,-0.082044,-0.037037,-0.004727,0.031077,-0.019023,-0.003892,0.004678,-0.018814,-0.031377,-0.060253,-0.032450,-0.154843,-0.025159,-0.042023,0.021917,0.064936,-0.047701,-0.052784,-0.028578,0.029861,0.026401,-0.068003,-0.028094,0.022905,0.040676,-0.038418,0.092887,0.012204,-0.067819,-0.010524,0.042715,-0.034496,-0.026124,-0.019169,0.008224,0.017592,0.005533,0.049259,-0.052507,-0.045810,0.046238,0.018769,0.076147,0.018516,-0.048189,0.040899,-0.041509,0.036284,0.018047,0.043259,0.001968,-0.011695,0.041496,-0.010896,0.017213,...,0.016729,0.017981,0.006989,0.013629,-0.040623,0.011293,0.014565,0.045841,0.030820,-0.046904,0.036461,-0.066181,-0.031706,-0.020219,-0.004099,0.011813,-0.082676,-0.019328,0.015533,0.045243,-0.018856,0.021542,-0.021605,-0.046268,-0.032560,0.001310,-0.040883,0.017897,-0.030662,0.017896,-0.040442,-0.025753,-0.050281,0.038428,0.022341,0.015897,0.033328,0.017364,0.001506,0.023823,0.051581,-0.043418,-0.018980,0.038885,0.007126,-0.039285,0.036219,0.004631,-0.030237,0.044623,0.032122,0.013535,-0.042550,0.110228,-0.017526,-0.002727,0.029659,0.049145,0.047345,-0.002753,0.007668,0.058460,-0.015800,0.040605,-0.006792,-0.012554,0.019546,-0.064958,0.002769,0.002616,0.032382,0.006081,0.045040,-0.014685,-0.044518,0.085477,-0.025007,0.003455,-0.010735,0.039196,0.024614,0.036536,-0.041097
,0.037661,-0.029181,-0.013793,0.027134,0.023298,-0.047169,-0.018990,-0.060982,-0.035232,-0.022197,0.017991,-0.031974,-0.000017,0.030142,-0.030862,-0.010998,-0.064693,-0.030903,-0.007228,-0.021223,0.017980,0.069470,0.014818,0.032276,0.011386,-0.039572,0.020848,-0.003988,0.090472,0.018408,-0.011151,0.021722,0.001635,0.042238,0.005464,0.006168,0.022049,-0.006072,0.049216,0.008521,0.027402,0.016390,-0.010263,-0.011260,0.033748


In [55]:
# Run the same feature pipeline over the remaining pair sets; each one reads
# its embeddings from train_data.
rtrain_df, val_df, rval_df = (
    make_features(pair_set, train_data)
    for pair_set in (rtrain_pairs, val_pairs, rval_pairs)
)

# Model

In [56]:
# Stack each split row-wise with the frame built from its "r" pair set
# (pd.concat joins along axis 0 by default), then preview the training stack.
all_train = pd.concat((train_df, rtrain_df))
all_val = pd.concat((val_df, rval_df))
all_train

Unnamed: 0,target,cb_pseudo_pred,cb_pred,neuro_l1_dist,neuro_l2_dist,neuro_cos_dist,neuro_emb0_1,neuro_emb1_1,neuro_emb2_1,neuro_emb3_1,neuro_emb4_1,neuro_emb5_1,neuro_emb6_1,neuro_emb7_1,neuro_emb8_1,neuro_emb9_1,neuro_emb10_1,neuro_emb11_1,neuro_emb12_1,neuro_emb13_1,neuro_emb14_1,neuro_emb15_1,neuro_emb16_1,neuro_emb17_1,neuro_emb18_1,neuro_emb19_1,neuro_emb20_1,neuro_emb21_1,neuro_emb22_1,neuro_emb23_1,neuro_emb24_1,neuro_emb25_1,neuro_emb26_1,neuro_emb27_1,neuro_emb28_1,neuro_emb29_1,neuro_emb30_1,neuro_emb31_1,neuro_emb32_1,neuro_emb33_1,neuro_emb34_1,neuro_emb35_1,neuro_emb36_1,neuro_emb37_1,neuro_emb38_1,neuro_emb39_1,neuro_emb40_1,neuro_emb41_1,neuro_emb42_1,neuro_emb43_1,neuro_emb44_1,neuro_emb45_1,neuro_emb46_1,neuro_emb47_1,neuro_emb48_1,neuro_emb49_1,neuro_emb50_1,neuro_emb51_1,neuro_emb52_1,neuro_emb53_1,neuro_emb54_1,neuro_emb55_1,neuro_emb56_1,neuro_emb57_1,neuro_emb58_1,neuro_emb59_1,neuro_emb60_1,neuro_emb61_1,neuro_emb62_1,neuro_emb63_1,neuro_emb64_1,neuro_emb65_1,neuro_emb66_1,neuro_emb67_1,neuro_emb68_1,neuro_emb69_1,neuro_emb70_1,neuro_emb71_1,neuro_emb72_1,neuro_emb73_1,neuro_emb74_1,neuro_emb75_1,neuro_emb76_1,neuro_emb77_1,neuro_emb78_1,neuro_emb79_1,neuro_emb80_1,neuro_emb81_1,neuro_emb82_1,neuro_emb83_1,neuro_emb84_1,neuro_emb85_1,neuro_emb86_1,neuro_emb87_1,neuro_emb88_1,neuro_emb89_1,neuro_emb90_1,neuro_emb91_1,neuro_emb92_1,neuro_emb93_1,neuro_emb94_1,neuro_emb95_1,neuro_emb96_1,neuro_emb97_1,neuro_emb98_1,neuro_emb99_1,neuro_emb100_1,neuro_emb101_1,neuro_emb102_1,neuro_emb103_1,neuro_emb104_1,neuro_emb105_1,neuro_emb106_1,neuro_emb107_1,neuro_emb108_1,neuro_emb109_1,neuro_emb110_1,neuro_emb111_1,neuro_emb112_1,neuro_emb113_1,neuro_emb114_1,neuro_emb115_1,neuro_emb116_1,neuro_emb117_1,neuro_emb118_1,neuro_emb119_1,neuro_emb120_1,neuro_emb121_1,...,neuro_emb640_2,neuro_emb641_2,neuro_emb642_2,neuro_emb643_2,neuro_emb644_2,neuro_emb645_2,neuro_emb646_2,neuro_emb647_2,neuro_emb648_2,neuro_emb649_2,neuro_emb650_2,neuro_emb651_2,neuro_emb652
_2,neuro_emb653_2,neuro_emb654_2,neuro_emb655_2,neuro_emb656_2,neuro_emb657_2,neuro_emb658_2,neuro_emb659_2,neuro_emb660_2,neuro_emb661_2,neuro_emb662_2,neuro_emb663_2,neuro_emb664_2,neuro_emb665_2,neuro_emb666_2,neuro_emb667_2,neuro_emb668_2,neuro_emb669_2,neuro_emb670_2,neuro_emb671_2,neuro_emb672_2,neuro_emb673_2,neuro_emb674_2,neuro_emb675_2,neuro_emb676_2,neuro_emb677_2,neuro_emb678_2,neuro_emb679_2,neuro_emb680_2,neuro_emb681_2,neuro_emb682_2,neuro_emb683_2,neuro_emb684_2,neuro_emb685_2,neuro_emb686_2,neuro_emb687_2,neuro_emb688_2,neuro_emb689_2,neuro_emb690_2,neuro_emb691_2,neuro_emb692_2,neuro_emb693_2,neuro_emb694_2,neuro_emb695_2,neuro_emb696_2,neuro_emb697_2,neuro_emb698_2,neuro_emb699_2,neuro_emb700_2,neuro_emb701_2,neuro_emb702_2,neuro_emb703_2,neuro_emb704_2,neuro_emb705_2,neuro_emb706_2,neuro_emb707_2,neuro_emb708_2,neuro_emb709_2,neuro_emb710_2,neuro_emb711_2,neuro_emb712_2,neuro_emb713_2,neuro_emb714_2,neuro_emb715_2,neuro_emb716_2,neuro_emb717_2,neuro_emb718_2,neuro_emb719_2,neuro_emb720_2,neuro_emb721_2,neuro_emb722_2,neuro_emb723_2,neuro_emb724_2,neuro_emb725_2,neuro_emb726_2,neuro_emb727_2,neuro_emb728_2,neuro_emb729_2,neuro_emb730_2,neuro_emb731_2,neuro_emb732_2,neuro_emb733_2,neuro_emb734_2,neuro_emb735_2,neuro_emb736_2,neuro_emb737_2,neuro_emb738_2,neuro_emb739_2,neuro_emb740_2,neuro_emb741_2,neuro_emb742_2,neuro_emb743_2,neuro_emb744_2,neuro_emb745_2,neuro_emb746_2,neuro_emb747_2,neuro_emb748_2,neuro_emb749_2,neuro_emb750_2,neuro_emb751_2,neuro_emb752_2,neuro_emb753_2,neuro_emb754_2,neuro_emb755_2,neuro_emb756_2,neuro_emb757_2,neuro_emb758_2,neuro_emb759_2,neuro_emb760_2,neuro_emb761_2,neuro_emb762_2,neuro_emb763_2,neuro_emb764_2,neuro_emb765_2,neuro_emb766_2,neuro_emb767_2
1,1,0.180415,0.175911,7.836064,0.349518,0.938919,-0.052533,-0.010321,-0.018409,0.019210,-0.035565,-0.021615,-0.007733,0.009223,-0.018848,-0.005369,0.048870,-0.036869,0.024449,-0.073497,0.051336,0.019532,0.027405,-0.020072,-0.051782,0.005662,0.033468,0.012370,-0.021671,0.032232,0.089572,-0.028749,-0.025404,-0.034889,-0.021541,0.013641,0.016660,-0.004992,0.046017,0.000753,-0.027249,-0.043440,0.005367,0.013667,-0.055865,0.005212,0.074097,-0.001832,-0.055264,-0.021586,-0.043754,-0.027593,0.062113,-0.018998,-0.042171,0.054622,0.007686,-0.006904,-0.059646,0.063061,0.000404,-0.061159,0.008407,0.038472,0.053030,-0.034579,0.014574,0.009309,0.009789,0.032344,-0.046324,0.091659,0.034418,-0.028864,-0.055046,0.062803,-0.040509,-0.000807,0.042615,0.006885,-0.055011,0.031836,0.052696,0.018935,0.003109,-0.049031,0.009331,-0.035544,-0.021560,0.074447,0.007626,0.024978,-0.010133,-0.022230,0.011347,-0.059181,0.007697,-0.028451,-0.026434,0.003373,-0.003054,0.001579,-0.006460,0.034971,0.045982,-0.031823,-0.025331,0.006353,0.035984,-0.009276,-0.019076,-0.046111,0.032565,-0.011219,-0.019230,-0.028431,0.055191,0.033232,-0.050771,0.007558,-0.009717,-0.002783,0.006632,0.070584,0.028159,0.028502,-0.026983,-0.046753,...,0.002060,-0.071942,0.026704,-0.041625,-0.033724,0.015036,0.051252,-0.100317,-0.053787,-0.001263,-0.047799,0.014483,-0.000151,0.010409,-0.029907,-0.022090,0.011604,-0.014732,-0.074514,-0.046521,0.068967,0.026727,-0.022415,0.031487,0.003055,-0.022728,-0.013704,0.059213,-0.018305,0.019263,0.001033,0.003389,-0.022522,-0.065247,-0.044647,0.008008,0.024158,-0.020667,0.053892,-0.050370,-0.036240,-0.027773,-0.045460,-0.025576,-0.011537,0.019915,0.002435,-0.049851,-0.009026,-0.069909,0.025779,0.085231,-0.047029,-0.067997,-0.082566,-0.036789,-0.009356,0.009873,0.024209,0.035280,-0.078903,-0.075137,0.045546,0.015556,0.072073,-0.023749,-0.019690,-0.026342,0.026552,-0.041214,0.003301,-0.025510,0.007107,0.016067,0.011676,-0.050904,0.025120,-0.033127,0.008473,0.021376,0.002927,0.040143,-0.006
498,-0.037550,0.017705,0.017550,-0.064080,0.013703,-0.012530,0.033072,0.046809,0.029771,0.027865,0.010540,0.038064,-0.040250,0.059977,-0.045145,0.054262,-0.001467,-0.033185,-0.004836,-0.025181,-0.021404,-0.024222,0.001178,-0.029864,0.035245,0.047853,-0.026213,0.092067,-0.052657,-0.042336,0.009588,-0.050639,-0.024883,-0.022802,-0.060374,0.003297,-0.002825,-0.020281,-0.005190,-0.009711,0.037417,-0.031178,-0.031756,-0.006167,0.019504
6,1,0.293636,0.396222,8.726835,0.390595,0.923718,-0.020976,-0.045143,-0.015406,0.027676,-0.013045,-0.031581,-0.019189,0.027724,-0.021688,0.008349,0.056971,-0.047110,0.037094,-0.066915,0.025603,-0.009370,0.037100,0.007092,-0.065193,-0.000369,0.048436,0.020622,-0.012416,-0.018536,0.090664,-0.052969,0.006225,-0.011249,-0.029764,-0.006306,0.013082,-0.012446,0.057457,0.018282,-0.005435,-0.043172,-0.002670,-0.006485,-0.035092,-0.001217,0.081923,-0.005742,-0.055043,-0.005100,0.004116,-0.036780,0.082820,-0.051808,-0.049457,0.041861,-0.022825,-0.020421,-0.015951,0.065513,-0.011435,-0.013488,0.015549,0.019761,0.036638,-0.033042,0.013407,0.043423,-0.002401,0.029330,-0.014199,0.063133,0.056086,-0.039708,-0.053123,0.042226,-0.053265,-0.011555,0.028991,0.030472,-0.024680,0.002057,0.053952,-0.023770,0.008690,-0.008591,0.013087,-0.048837,-0.019044,0.082215,0.036194,-0.005000,-0.014485,-0.014015,0.025808,-0.043905,-0.011318,-0.033110,0.007265,0.012769,-0.013347,-0.015627,-0.006732,0.013646,0.024895,-0.005335,-0.000792,0.018881,0.015973,0.021593,-0.026293,-0.031979,0.007483,0.010966,-0.017643,-0.061654,0.065567,0.028678,-0.052217,-0.017241,-0.017156,0.001858,0.011284,0.065141,0.025465,-0.004849,-0.000370,-0.050102,...,0.065166,-0.051192,0.052458,-0.024280,-0.037039,0.022340,-0.004344,-0.073962,0.009662,-0.001664,-0.061240,0.019931,0.034039,0.048029,0.007928,-0.031701,-0.008992,0.008169,-0.066881,-0.018686,0.052615,0.026980,-0.009707,0.030879,0.002979,-0.080940,0.015333,0.056873,-0.026314,0.027079,0.003797,0.040137,0.017797,-0.050680,0.007113,0.010978,0.008198,-0.045981,0.018300,-0.037948,-0.060555,-0.045118,-0.059001,-0.069647,-0.019625,0.028230,-0.036467,-0.056824,0.008952,-0.037240,0.036999,0.068956,-0.019549,-0.091632,-0.062723,0.022638,0.010875,0.019333,0.020982,0.053472,-0.050562,-0.055164,0.070730,-0.020098,0.047900,-0.053113,0.000449,-0.041500,0.024072,-0.093349,-0.003256,-0.016452,0.001403,0.030579,-0.001475,-0.058956,0.047326,0.006519,0.046678,0.000375,-0.043552,0.039270,-0.
003522,0.040301,-0.023439,0.014325,-0.061931,-0.024395,-0.047578,0.004786,0.042996,0.052893,-0.004406,0.037746,0.035445,-0.027968,0.025986,-0.036593,0.071582,0.009923,0.001354,-0.009852,-0.022267,-0.014937,0.007959,-0.038645,-0.015279,0.021998,0.053541,-0.020772,0.077268,-0.066834,-0.001928,-0.017571,-0.047611,-0.048989,-0.012301,-0.084132,-0.000934,-0.030706,0.002868,-0.040266,-0.027873,0.013982,0.006577,-0.006468,0.010451,0.020071
7,1,0.632096,0.656641,4.660522,0.208635,0.978236,-0.011690,0.016420,-0.019185,-0.001463,-0.039949,0.042183,-0.057112,-0.001151,-0.043595,0.000727,-0.001967,-0.041948,-0.032531,-0.082799,0.044880,0.039524,-0.007488,-0.022113,-0.007534,-0.039087,0.006332,-0.031952,-0.031511,0.013814,0.023864,0.011322,-0.017387,-0.036641,0.020899,0.022532,0.049954,-0.027428,0.052635,-0.032729,-0.037026,-0.070206,-0.049107,0.004149,-0.057716,0.038148,0.086895,0.012916,-0.025406,-0.030879,-0.012970,-0.038684,0.033464,-0.053146,-0.005108,0.038732,0.003365,0.063914,-0.069697,0.029248,-0.017822,-0.052696,-0.024931,0.017971,-0.008031,-0.022430,0.050103,-0.022678,-0.052919,0.029035,-0.024904,0.065577,0.032002,-0.056141,-0.043520,0.050324,-0.028467,-0.003729,0.040389,-0.049029,-0.046331,0.052340,0.003346,-0.007857,0.014447,-0.075554,-0.003925,-0.049070,-0.020818,0.066070,0.020148,0.028021,-0.035839,0.003484,-0.016326,-0.034317,0.030575,-0.018829,-0.066525,-0.030806,0.039832,0.022393,0.028605,0.033144,0.043933,-0.054465,-0.053464,-0.010045,0.007846,-0.040868,-0.012712,-0.049113,-0.014051,-0.054552,-0.061357,-0.026095,0.073528,0.023074,-0.010330,0.019795,-0.019843,0.009847,-0.004286,0.048401,0.013359,0.062496,-0.014359,-0.005028,...,-0.007854,-0.057589,-0.024000,-0.028029,-0.027277,0.018701,0.040219,-0.003525,-0.058816,0.016347,-0.011430,-0.001832,0.007887,-0.019873,-0.064467,-0.055866,0.030689,-0.014409,-0.076386,-0.016548,0.043225,0.055664,-0.010722,-0.036955,0.033414,0.008207,0.034421,-0.001540,-0.007785,-0.021185,0.060916,0.034752,-0.010058,-0.021870,-0.051634,-0.009901,0.069506,-0.004223,-0.003811,-0.056451,-0.043408,0.028865,-0.025481,0.015239,0.019833,-0.006340,-0.018354,-0.017782,-0.057321,-0.009987,-0.039721,0.015928,0.031345,-0.021334,-0.064813,0.025887,0.024719,0.049523,0.002906,0.046227,-0.033534,-0.007405,0.056287,0.025206,0.018513,-0.048567,-0.000666,-0.051615,0.024619,-0.051691,0.005294,-0.077366,-0.039473,0.017768,0.004634,-0.036341,-0.036211,0.026175,-0.016727,-0.056751,0.035328
,0.026289,0.031484,-0.067304,0.071313,0.029225,-0.002607,-0.032151,0.030263,0.014152,0.012423,-0.025677,-0.015321,-0.028327,0.007617,0.023130,-0.017840,-0.017746,0.034115,-0.020648,-0.000937,-0.047807,0.013477,0.061693,-0.047603,0.015075,0.010827,0.047254,0.042482,-0.092026,0.033523,-0.042655,-0.037029,0.001679,-0.042737,-0.012501,0.021701,-0.013352,0.041898,0.002531,0.011722,0.009779,-0.002148,0.047544,0.020900,0.023644,-0.033818,-0.048896
8,1,0.301474,0.385981,3.958456,0.176286,0.984462,0.017534,0.038868,-0.031238,-0.014903,-0.032741,0.044969,-0.052109,-0.041142,-0.042286,-0.017079,-0.020923,-0.024740,-0.038269,-0.054511,0.048125,0.042815,-0.011877,-0.010265,0.019790,-0.049883,-0.020210,-0.041165,-0.023996,0.027286,-0.010650,0.012868,-0.026229,-0.031508,0.020493,0.027138,0.032884,-0.039353,0.043868,-0.030057,-0.030554,-0.053415,-0.057927,0.037622,-0.057874,0.048813,0.058536,0.032826,0.002815,-0.009563,-0.010988,-0.026045,-0.007782,-0.049423,0.015433,-0.005623,0.005190,0.080633,-0.051485,0.004279,-0.023949,-0.032112,-0.045076,-0.003263,-0.040169,-0.000813,0.047106,-0.021343,-0.069601,0.034598,-0.000318,0.071843,0.016701,-0.044663,0.010672,0.021560,-0.002855,-0.014092,0.043024,-0.057132,-0.043119,0.051453,-0.037315,0.004560,0.027751,-0.058274,-0.014906,-0.014855,-0.013570,0.028348,0.027222,0.050414,-0.018891,-0.000750,-0.039222,-0.030401,0.055620,-0.013600,-0.060789,-0.051981,0.041069,0.018455,0.061154,-0.009841,0.044431,-0.066305,-0.045908,-0.039208,0.002916,-0.057867,-0.015346,-0.015224,0.003053,-0.067642,-0.042824,-0.004842,0.057780,0.001895,0.002533,0.048597,-0.012151,0.022675,0.015651,0.043279,0.017596,0.057024,-0.022009,0.027201,...,-0.008428,-0.024401,-0.039502,-0.009557,-0.008109,0.024552,0.038099,0.035796,-0.037012,-0.017732,-0.007429,-0.001069,0.003595,-0.036941,-0.018137,-0.046503,0.017706,-0.003957,-0.066829,0.006648,0.010921,0.034615,0.028828,-0.045540,0.042557,0.020990,0.043798,-0.003862,0.003099,-0.015781,0.063749,0.000720,0.001920,-0.005164,-0.038341,-0.034480,0.038344,0.003700,-0.044490,-0.047315,-0.034226,0.029379,0.005234,0.032745,0.015239,-0.004715,-0.023521,-0.011705,-0.033745,0.018377,-0.075331,-0.034321,0.061852,0.001379,-0.029625,0.006074,0.022871,0.043592,-0.025232,0.026252,-0.016807,0.026511,0.028789,0.032878,-0.019982,-0.033732,-0.009207,-0.040880,0.012441,-0.025849,0.001041,-0.071529,-0.038895,0.027840,0.017326,-0.019277,-0.013809,0.028488,-0.037895,-0.064594,0.044065,-0.004
190,0.025750,-0.074227,0.062246,0.015896,0.039011,-0.028284,0.044052,-0.007482,0.022898,-0.023076,-0.017118,-0.028610,-0.001833,0.034315,-0.053856,-0.017201,0.024917,-0.007657,-0.005138,-0.048995,0.028143,0.071245,-0.058475,0.031046,0.018292,0.040979,0.038795,-0.072059,0.015030,-0.024691,0.002755,0.018355,-0.020832,-0.004146,0.040031,-0.023122,0.006431,-0.004156,0.005641,0.017926,0.014959,0.041494,0.007740,0.036360,-0.038262,-0.057144
10,1,0.586648,0.562208,5.713414,0.255754,0.967295,-0.002543,0.029435,-0.007112,-0.043198,-0.023454,0.055567,-0.054406,0.015760,-0.046751,-0.008061,0.006914,-0.052569,-0.043407,-0.067387,0.037723,0.027766,-0.021145,0.000477,-0.013110,-0.056720,-0.035549,-0.022939,-0.025830,0.006101,0.001025,-0.010006,-0.008366,-0.028805,0.028508,0.010671,0.069422,-0.032081,0.021326,-0.059415,-0.041644,-0.046885,-0.068311,0.019375,-0.034709,0.020202,0.050740,0.016928,0.016345,-0.050038,0.014628,-0.022435,0.048175,-0.042369,-0.005621,0.011106,0.003171,0.080137,-0.062015,0.007644,-0.021215,-0.015075,-0.043192,-0.025854,-0.065235,-0.036629,0.040842,-0.023396,-0.050122,0.035380,0.027300,0.038739,0.064067,-0.033546,-0.034161,0.021614,-0.008504,-0.010217,0.023857,-0.020777,-0.008793,0.009624,-0.025385,0.010251,0.043669,-0.067134,0.000823,-0.006416,0.021069,0.038485,0.044857,0.026796,-0.058787,0.009123,0.022193,-0.007141,0.011485,0.005094,-0.063696,-0.031754,0.005702,0.002071,0.053142,-0.019981,0.025147,-0.040297,-0.058816,0.003888,-0.014271,-0.080474,-0.015057,-0.028321,-0.020863,-0.059217,-0.057723,-0.014121,0.046605,-0.049674,0.021837,0.033657,-0.040089,0.007360,-0.018662,0.022660,-0.000441,0.054951,0.023002,0.048733,...,-0.007086,-0.023420,0.008290,-0.020389,-0.032184,0.037010,0.049639,-0.012227,-0.060380,-0.005412,-0.023502,-0.012993,0.024636,-0.043780,-0.040901,-0.046006,0.044008,-0.012752,-0.068788,-0.030503,0.021307,0.048893,-0.017309,-0.018679,0.046388,-0.008700,0.036012,-0.011081,-0.038047,0.013688,0.064949,0.019558,-0.010367,-0.048382,-0.045805,-0.012113,0.047064,-0.014196,-0.010971,-0.043521,-0.048339,0.003000,-0.024299,0.001460,0.007800,0.017746,0.018435,-0.022465,-0.037267,0.021822,-0.078214,0.011793,0.055339,-0.024378,-0.053230,0.027740,-0.011357,0.060745,-0.012426,0.017595,-0.021998,-0.018652,0.071969,0.000742,0.027730,-0.037777,0.002225,-0.041560,0.026584,-0.043538,0.035339,-0.082260,-0.023910,0.004409,0.004803,-0.048353,0.000611,-0.002892,-0.026486,-0.049979,0.028916,0.0020
04,0.016706,-0.055852,0.063516,-0.002726,0.008624,-0.011100,0.025753,0.012176,0.010749,-0.031395,-0.049210,-0.017452,0.015796,0.021483,-0.029008,-0.039586,0.030173,-0.020549,0.023414,-0.024824,0.017403,0.060763,-0.062675,0.028367,0.014419,0.077169,0.018907,-0.053798,0.012386,-0.021474,-0.004572,0.030028,-0.018819,0.001568,0.031103,-0.020210,0.030866,0.022564,0.017403,0.029281,-0.021216,0.023711,0.019702,0.036239,-0.024460,-0.060940
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
306502,0,0.032249,0.022872,10.005867,0.447627,0.899815,0.056010,-0.076804,0.034580,0.025928,0.015691,-0.045512,0.032092,0.055506,0.036125,-0.050101,-0.011603,-0.011965,0.033964,0.001101,0.001397,-0.061245,0.014872,0.055374,-0.018247,0.070343,0.018241,0.009317,-0.032143,0.005847,-0.044296,-0.038245,-0.065260,0.000845,-0.044209,-0.053529,0.009558,0.056149,-0.010890,0.027366,0.025147,0.075185,0.041711,0.006748,0.017398,-0.015506,-0.044454,0.013579,-0.061247,0.063105,0.013958,-0.033996,0.045261,-0.003141,-0.049755,-0.011941,0.027828,-0.048506,0.020867,0.027695,0.003206,0.056903,-0.012797,-0.013339,-0.055300,0.040607,-0.062908,0.039063,-0.012097,0.027010,0.063172,0.022218,0.016318,-0.014944,-0.052275,-0.067452,0.014341,-0.003088,0.037448,0.092536,0.042769,-0.075309,0.027624,0.016710,0.029261,0.044668,0.018819,-0.028249,0.013294,0.019548,0.020976,-0.048731,-0.016818,-0.000817,0.022183,0.006495,0.001821,0.029473,0.044181,0.038410,-0.071627,-0.008846,-0.032057,-0.049664,0.003877,0.026820,0.054650,0.017063,-0.011557,0.045048,-0.018316,0.039139,-0.000940,-0.013164,0.034580,0.025877,0.004244,0.022246,0.040629,-0.023281,-0.013011,-0.024902,-0.044386,-0.018627,0.008529,-0.095881,0.025622,-0.006018,...,0.012744,0.010589,0.031754,-0.015384,-0.011318,0.011058,-0.033265,-0.042228,-0.007674,0.064002,-0.028255,0.048576,0.061077,0.063979,0.067575,-0.038208,0.003590,0.056113,-0.014470,-0.002290,0.014968,-0.078435,-0.009391,-0.001168,-0.041099,-0.017087,0.002853,-0.021604,0.010439,0.048851,-0.066803,0.009105,-0.015904,-0.021848,0.026196,0.009121,-0.101052,-0.025574,-0.025756,-0.011799,0.004435,0.037698,0.014782,-0.031761,-0.008820,0.068907,0.011035,-0.027293,0.035298,-0.045057,0.024590,0.034547,-0.056387,-0.054063,0.054254,-0.033329,0.035549,-0.093303,0.048542,0.006589,0.017421,-0.032151,-0.052271,-0.034202,0.014711,0.017900,0.038449,0.044164,0.030039,-0.026226,-0.000259,0.043949,0.041400,-0.007707,-0.011316,-0.014924,0.064976,-0.031895,0.025140,0.044708,-0.121946,-0.064670,0.033630,0.00
4864,-0.042619,-0.005033,-0.026241,0.023714,-0.042184,0.035559,0.048592,0.062731,-0.005488,-0.031287,-0.054078,0.020325,0.020917,0.061583,0.012419,0.038925,-0.002914,-0.009602,0.039648,-0.015208,0.010587,-0.034065,-0.041424,0.014251,-0.006455,0.040153,0.010028,-0.056752,-0.013475,-0.017837,-0.029297,-0.015036,0.022737,-0.031724,0.020371,-0.030408,-0.026954,-0.026964,0.043172,0.022116,-0.022970,0.020375,-0.008660,0.025996
306510,0,0.051367,0.044114,0.000023,0.000001,1.000000,-0.050865,-0.031015,0.018722,-0.013247,-0.007015,-0.001438,0.060876,0.008595,-0.000086,0.040194,0.045565,0.047728,0.066559,0.046900,-0.020905,-0.043894,0.021700,0.024734,-0.040810,0.048190,0.003155,0.032079,-0.007533,0.016612,-0.001901,-0.054207,0.047343,0.046870,-0.000010,-0.033504,-0.017791,0.023973,-0.032101,0.022877,0.008989,0.043942,0.044372,0.014075,0.047008,-0.011343,-0.022079,0.014303,0.057892,0.003959,0.068087,0.053398,0.010167,0.039353,-0.002445,0.020719,-0.033600,-0.044579,0.046746,-0.033660,0.006592,-0.022818,0.007504,0.033685,0.008406,-0.001022,-0.023820,0.038327,0.117806,-0.045111,-0.013626,-0.033596,0.006685,0.043201,0.010073,-0.055090,-0.000378,0.018014,0.005221,0.047580,0.054870,-0.080007,0.083941,0.000338,-0.014775,0.041413,-0.071506,-0.004589,0.003834,-0.018464,0.001319,-0.023922,-0.037112,0.015199,0.046244,0.070171,-0.020856,-0.038096,0.025565,-0.003845,-0.052621,0.014548,-0.066795,0.008206,-0.018747,-0.023714,0.025467,-0.012503,0.005283,0.069343,-0.005022,-0.005340,0.051992,0.023872,0.047948,-0.018372,-0.003062,0.012295,-0.024357,-0.002582,0.032028,-0.053571,-0.000584,-0.039673,0.029550,-0.059736,-0.015826,-0.020681,...,0.025092,0.033160,0.047982,-0.015328,0.013715,-0.072829,-0.067806,-0.012878,0.054996,0.019737,0.019778,0.026244,0.027084,-0.020200,0.050818,0.062497,-0.023755,0.031330,0.035394,0.011601,-0.027001,-0.066501,-0.010888,0.058965,0.000056,-0.045450,-0.026417,0.062099,-0.021291,0.020274,-0.048092,0.000469,0.028278,-0.008373,0.005604,-0.004870,-0.020536,-0.012359,-0.009372,0.079740,0.017159,-0.043916,-0.040549,-0.074100,-0.007627,0.027010,0.023364,0.017991,0.043084,-0.018178,-0.000096,-0.000925,0.002998,-0.010338,-0.002319,-0.028172,-0.038863,-0.007062,-0.012265,-0.050037,-0.007206,0.000824,0.012480,0.029110,-0.003362,0.009295,0.008680,0.032560,0.031583,-0.013468,0.047678,0.067149,0.022276,-0.004656,0.021134,0.005502,0.050163,0.001281,0.003921,-0.040420,-0.044105,-0.012305,-0.054858,
0.002961,-0.042299,-0.008397,-0.020843,0.004527,-0.065203,-0.003076,-0.028711,0.069539,-0.019592,0.037724,0.000710,-0.046421,0.014620,0.030005,0.024736,-0.012060,0.038359,0.047357,-0.021529,-0.047348,0.028538,-0.051781,-0.010254,0.033528,-0.047558,0.062810,0.015283,0.009075,0.073817,0.012827,0.024458,0.006560,-0.054531,0.042832,0.021957,-0.010263,-0.003666,-0.052402,-0.044925,-0.045718,0.022304,-0.008546,0.032012,0.092396
306520,0,0.062628,0.050127,16.342211,0.731040,0.732790,0.005242,0.003479,-0.029729,0.039885,-0.004161,0.011517,-0.036403,-0.023161,-0.008929,-0.005896,-0.049205,0.015080,0.024623,-0.008088,-0.026518,-0.032968,0.040427,0.000908,0.007424,0.028720,0.062598,0.018748,0.020850,-0.035674,-0.012852,0.015354,0.029186,0.057610,-0.009595,-0.036153,-0.021760,0.028161,0.082542,0.015812,-0.014176,-0.029899,0.047409,-0.009764,-0.023901,0.086529,0.046957,-0.015014,-0.048800,0.030829,0.056233,-0.047996,-0.011856,0.007050,0.015007,0.027452,-0.037279,-0.052915,0.050831,0.021617,-0.031456,-0.025826,-0.025818,0.077926,0.021417,0.020376,0.055978,0.030775,-0.021502,0.001490,-0.062736,-0.013193,-0.060176,-0.036361,-0.001054,-0.036641,-0.042430,0.004310,0.044375,-0.030906,0.004094,0.028288,0.056508,-0.046493,-0.021365,0.040438,-0.020752,-0.095224,-0.062473,0.046843,-0.023215,0.005932,-0.014012,0.051034,-0.021183,0.006723,0.039353,-0.046128,0.017607,-0.058510,0.055644,0.078878,-0.048061,0.048270,0.010016,-0.055553,-0.032911,-0.043749,0.041022,0.075643,0.013501,0.002665,-0.023079,-0.001909,-0.010572,-0.057082,0.066056,0.100568,-0.041528,0.009566,0.038183,0.030685,0.005142,0.083886,0.007426,-0.007342,-0.043767,-0.019559,...,0.032073,-0.035867,0.017396,-0.055666,-0.003130,-0.094425,-0.057774,-0.003855,0.023185,0.089148,0.046222,0.034560,-0.030199,0.028059,-0.044640,0.008399,-0.013250,0.027017,0.009804,0.014189,0.047866,0.013160,-0.050283,0.022308,-0.020350,-0.032947,-0.002492,0.004575,0.012563,-0.010907,-0.020392,0.050547,-0.003233,0.013721,-0.000020,0.013318,0.010568,-0.028832,0.027966,0.014573,0.012100,0.022051,-0.032261,-0.026299,0.006704,-0.007572,-0.028757,0.031579,-0.023333,-0.104640,0.083893,0.058410,-0.051329,0.000338,-0.050883,-0.001439,0.041686,-0.020540,0.030508,0.013177,-0.015097,-0.030099,0.008000,0.024189,0.006307,-0.028177,0.026084,-0.025788,0.003592,-0.060611,-0.015756,0.015834,-0.011007,0.014228,0.033220,-0.014331,-0.010414,0.049656,0.039461,-0.014885,-0.020319,-0.025968,0.0471
54,-0.008120,-0.024034,0.038269,-0.034791,-0.046836,-0.048211,0.026159,-0.021349,0.034937,0.013592,0.009698,-0.021846,-0.012593,0.037986,0.089972,0.013925,0.004572,0.012262,0.029979,-0.003855,-0.043531,0.053273,-0.048587,-0.031057,-0.001021,-0.017115,-0.040246,0.035350,-0.021602,-0.050158,-0.049827,-0.030609,-0.027055,-0.066178,0.029000,0.057126,-0.023520,0.000863,-0.073448,-0.006929,0.012777,0.040339,-0.008867,-0.007924,0.045233
306524,0,0.085002,0.093381,13.459804,0.608179,0.815059,-0.008221,0.028781,-0.010265,-0.020548,0.004149,-0.039278,-0.033965,0.001442,-0.053117,0.000598,0.018433,0.014121,0.028930,0.028394,-0.010294,0.075339,-0.000376,-0.011648,0.041625,-0.003823,-0.004727,0.057036,0.067126,-0.021684,0.011994,0.030005,0.029314,0.044573,0.000091,-0.022247,-0.083943,0.022116,0.009667,-0.002522,0.045564,0.018317,-0.019917,-0.065640,0.046894,-0.001146,0.007392,-0.002764,-0.001841,-0.002508,-0.027677,-0.031856,-0.058305,0.023477,0.011714,-0.052623,-0.029041,0.004399,0.057382,-0.018191,-0.001771,0.023023,0.035488,0.045824,0.065526,-0.015425,0.029938,-0.011087,-0.047069,0.003081,0.001288,-0.064369,-0.029600,-0.083276,0.006656,0.013526,0.008740,-0.015723,-0.017357,-0.022938,-0.017357,0.011087,-0.075785,-0.036738,-0.117086,-0.005090,0.002627,0.004670,0.029854,-0.041048,-0.083283,-0.023112,0.056804,0.026565,-0.090755,-0.036275,0.007387,0.012658,-0.041975,0.095837,0.058722,-0.041985,-0.013796,0.038582,-0.059647,-0.028382,-0.023951,0.009361,0.028158,0.007045,0.048027,-0.025231,-0.031200,0.045548,0.021749,0.060186,0.004319,-0.039430,0.005055,-0.027388,0.056316,0.008466,0.066707,0.018477,-0.024866,0.055596,-0.006027,-0.000603,...,0.004082,0.062264,0.036715,0.013085,-0.061663,0.029231,0.026968,0.021985,0.009625,-0.036877,0.029948,-0.069046,-0.027174,-0.042737,0.000055,0.025274,-0.050671,-0.002161,-0.016153,0.027921,0.002322,0.009055,-0.019230,-0.053688,-0.013461,-0.011055,-0.019328,0.028780,-0.050839,0.057377,-0.009775,-0.027973,-0.067194,0.030454,0.019675,-0.007767,-0.003744,0.013415,-0.033516,0.010190,0.031751,-0.030995,-0.001198,0.042985,-0.028401,-0.000107,0.094621,0.034011,-0.010192,0.072673,-0.021434,0.003145,-0.004851,0.096263,-0.009279,-0.034404,0.010476,0.034907,0.047816,-0.020647,-0.001464,0.062482,-0.019521,0.024890,0.000822,-0.016405,0.041670,-0.043872,-0.004842,0.013114,0.020054,-0.003643,0.041445,-0.024140,-0.065033,0.076540,0.012762,-0.045842,-0.021350,0.035831,0.017240,0.002637,-0.01
1350,0.016579,-0.019019,-0.030286,0.030423,0.025078,-0.024305,-0.010502,-0.036411,0.013124,-0.030506,0.012118,-0.025669,0.005461,0.034463,-0.047225,0.004577,-0.066440,-0.001043,0.004656,-0.022448,0.046616,0.041505,0.003014,0.030455,0.033872,-0.070139,0.032361,0.031625,0.087255,0.028183,0.017979,0.016638,-0.006752,0.069967,-0.022660,0.018940,0.048998,-0.016503,0.058430,0.023628,0.060003,0.031661,0.013914,-0.030393,0.058795


In [57]:
# Both lists are left empty: no column is declared categorical or as an embedding.
# They are forwarded unchanged to every Pool and to the classifier constructor.
cat_features, embedding_features = [], []

In [58]:
# Build the training and validation pools the same way: every column except
# `target` is a feature, `target` is the label, and `cb_pseudo_pred` is supplied
# as the starting baseline. Note that `cb_pseudo_pred` is not dropped from `data`,
# so it is used both as a feature and as the baseline.
# NOTE(review): CatBoost documents the baseline as raw formula values — confirm
# that `cb_pseudo_pred` is on that scale rather than a probability.
train_pool, val_pool = (
    Pool(
        data=frame.drop(columns='target'),
        label=frame['target'].values,
        cat_features=cat_features,
        embedding_features=embedding_features,
        baseline=frame['cb_pseudo_pred'],
    )
    for frame in (all_train, all_val)
)

In [77]:
# CatBoost hyper-parameters unpacked into the classifier constructor; the random
# seed and the feature lists are passed separately at construction time.
params = dict(
    loss_function='CrossEntropy',
    eval_metric='PRAUC',
    task_type='CPU',
    max_depth=5,
    learning_rate=0.05,
)

In [78]:
%%time
model_cb = CatBoostClassifier(**params, random_seed=56, cat_features=cat_features, embedding_features=embedding_features)
model_cb.fit(train_pool, eval_set=val_pool, verbose=250, plot=True, use_best_model=True, early_stopping_rounds=300)

MetricVisualizer(layout=Layout(align_self='stretch', height='500px'))

0:	learn: 0.9064039	test: 0.8999562	best: 0.8999562 (0)	total: 242ms	remaining: 4m 1s
250:	learn: 0.9121093	test: 0.9034555	best: 0.9034676 (232)	total: 26.2s	remaining: 1m 18s
500:	learn: 0.9162647	test: 0.9039775	best: 0.9039800 (484)	total: 51.4s	remaining: 51.1s
750:	learn: 0.9197125	test: 0.9040148	best: 0.9040510 (618)	total: 1m 16s	remaining: 25.4s
999:	learn: 0.9228259	test: 0.9040280	best: 0.9041264 (898)	total: 1m 41s	remaining: 0us

bestTest = 0.904126355
bestIteration = 898

Shrink model to first 899 iterations.
CPU times: total: 51min 46s
Wall time: 1min 43s


<catboost.core.CatBoostClassifier at 0x1ab9b596500>

In [79]:
# Highest PRAUC recorded on the validation set over all boosting iterations.
np.asarray(model_cb.get_evals_result()['validation']['PRAUC']).max()

0.9041263550318052

In [70]:
# Per-feature importances of the fitted model, returned as a table
# (`Feature Id`, `Importances`) because prettified=True.
# NOTE(review): this cell's saved execution count (70) is lower than the fit
# cell's (78), so the table shown below may belong to an earlier fit — re-run it.
model_cb.get_feature_importance(prettified=True)

Unnamed: 0,Feature Id,Importances
0,cb_pred,25.682825
1,cb_pseudo_pred,19.574883
2,neuro_l2_dist,3.803229
3,neuro_cos_dist,3.585549
4,neuro_l1_dist,2.026479
...,...,...
1536,neuro_emb747_2,0.000000
1537,neuro_emb748_2,0.000000
1538,neuro_emb754_2,0.000000
1539,neuro_emb758_2,0.000000


# Inference

In [47]:
# Build the feature frame twice from the same item data: once for the pairs as
# given and once for the copy with variantid1/variantid2 exchanged.
test_df, rtest_df = (
    make_features(pairs, test_data)
    for pairs in (test_pairs, rtest_pairs)
)

In [48]:
# Unlabelled pools for inference, one per pair ordering. As in training, the
# `cb_pseudo_pred` column stays among the features and is also set as baseline.
# NOTE(review): confirm that CatBoost applies a Pool baseline at predict time;
# if it does not, predictions from a model trained with a baseline would be
# missing that offset and it has to be added back to the raw scores manually.
test_pool, rtest_pool = (
    Pool(
        data=frame,
        cat_features=cat_features,
        embedding_features=embedding_features,
        baseline=frame['cb_pseudo_pred'],
    )
    for frame in (test_df, rtest_df)
)

In [49]:
# Scores for the pairs in their original order: column 1 of predict_proba
# (presumably the probability of target == 1 — verify against model_cb.classes_).
# NOTE(review): the inference cells carry execution counts 47-52, lower than the
# training cell (78), so the saved output may come from an earlier model —
# re-run the notebook top to bottom before trusting these numbers.
preds = model_cb.predict_proba(test_pool)[..., 1]
preds

array([0.06408981, 0.0779099 , 0.18736944, ..., 0.43052199, 0.87717535,
       0.45431952])

In [50]:
# Same scoring as for `preds`, but on the pool built from the swapped-id pairs.
rpreds = model_cb.predict_proba(rtest_pool)[..., 1]
rpreds

array([0.06408981, 0.0779099 , 0.18736944, ..., 0.43052199, 0.87717535,
       0.45431952])

In [51]:
# Element-wise mean of the two orderings' scores.
# NOTE(review): the saved outputs of preds, rpreds and final_preds are identical
# in every displayed element, which would mean the swapped pass contributes
# nothing — verify that rtest_pairs really has variantid1/variantid2 exchanged.
final_preds = 0.5 * np.add(preds, rpreds)
final_preds

array([0.06408981, 0.0779099 , 0.18736944, ..., 0.43052199, 0.87717535,
       0.45431952])

In [52]:
# Write the submission file: the pair ids plus the averaged score as `target`.
# assign() returns a temporary frame with the extra column, so test_pairs itself
# is never modified. This replaces the previous add-column / write / drop-inplace
# sequence, which left test_pairs with a stray `target` column if to_csv raised.
test_pairs.assign(target=final_preds).to_csv('./golden_submit_ens.csv', index=False)