In [61]:
import pandas as pd
import numpy as np
from sklearn.feature_extraction.text import CountVectorizer
from sklearn.model_selection import train_test_split
from sklearn.naive_bayes import MultinomialNB
from sklearn.pipeline import Pipeline
from sklearn.linear_model import LogisticRegression
from sklearn.metrics import roc_auc_score

from catboost import CatBoostClassifier

In [3]:
train = pd.read_csv('train_spam.csv')

In [4]:
train.head()

Unnamed: 0,text_type,text
0,ham,make sure alex knows his birthday is over in f...
1,ham,a resume for john lavorato thanks vince i will...
2,spam,plzz visit my website moviesgodml to get all m...
3,spam,urgent your mobile number has been awarded wit...
4,ham,overview of hr associates analyst project per ...


In [8]:
train.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 16278 entries, 0 to 16277
Data columns (total 2 columns):
 #   Column     Non-Null Count  Dtype 
---  ------     --------------  ----- 
 0   text_type  16278 non-null  object
 1   text       16278 non-null  object
dtypes: object(2)
memory usage: 254.5+ KB


In [10]:
train.isna().sum()

text_type    0
text         0
dtype: int64

In [13]:
train['spam'] = train['text_type'].apply(lambda x: 1 if x == 'spam' else 0)

In [15]:
train.head()

Unnamed: 0,text_type,text,spam
0,ham,make sure alex knows his birthday is over in f...,0
1,ham,a resume for john lavorato thanks vince i will...,0
2,spam,plzz visit my website moviesgodml to get all m...,1
3,spam,urgent your mobile number has been awarded wit...,1
4,ham,overview of hr associates analyst project per ...,0


In [85]:
X_train, X_test, y_train, y_test = train_test_split(train.text, train.spam, test_size=0.2, random_state=55)

In [146]:
vectorizer = CountVectorizer(binary=True, lowercase=False)
vectorizer.fit(X_train.to_list() + X_test.to_list() + test.text.to_list())

In [131]:
X_train_vectorized = vectorizer.transform(X_train)
X_test_vectorized = vectorizer.transform(X_test)

### Naive Bias

In [132]:
clf1 = MultinomialNB()

In [133]:
clf1.fit(X_train_vectorized, y_train)

In [134]:
roc_auc_score(y_test, clf1.predict(X_test_vectorized))

0.9004257552755183

### Gradient Boosting

In [150]:
clf2 = CatBoostClassifier(iterations=5000, learning_rate=0.1, depth=6, early_stopping_rounds=70)

In [151]:
clf2.fit(X_train_vectorized, y_train)

0:	learn: 0.6486968	total: 144ms	remaining: 12m 1s
1:	learn: 0.5920663	total: 286ms	remaining: 11m 54s
2:	learn: 0.5707758	total: 430ms	remaining: 11m 57s
3:	learn: 0.5493052	total: 562ms	remaining: 11m 42s
4:	learn: 0.5174074	total: 697ms	remaining: 11m 36s
5:	learn: 0.5038550	total: 829ms	remaining: 11m 29s
6:	learn: 0.4930506	total: 965ms	remaining: 11m 28s
7:	learn: 0.4825602	total: 1.1s	remaining: 11m 29s
8:	learn: 0.4744707	total: 1.26s	remaining: 11m 39s
9:	learn: 0.4657589	total: 1.42s	remaining: 11m 46s
10:	learn: 0.4583483	total: 1.59s	remaining: 12m 2s
11:	learn: 0.4520013	total: 1.75s	remaining: 12m 7s
12:	learn: 0.4462098	total: 1.9s	remaining: 12m 8s
13:	learn: 0.4397069	total: 2.04s	remaining: 12m 5s
14:	learn: 0.4288503	total: 2.23s	remaining: 12m 20s
15:	learn: 0.4218294	total: 2.4s	remaining: 12m 29s
16:	learn: 0.4167040	total: 2.55s	remaining: 12m 28s
17:	learn: 0.4085417	total: 2.69s	remaining: 12m 24s
18:	learn: 0.4044586	total: 2.83s	remaining: 12m 21s
19:	learn: 

156:	learn: 0.2144863	total: 21.9s	remaining: 11m 16s
157:	learn: 0.2136203	total: 22s	remaining: 11m 15s
158:	learn: 0.2129070	total: 22.2s	remaining: 11m 15s
159:	learn: 0.2116362	total: 22.4s	remaining: 11m 16s
160:	learn: 0.2109580	total: 22.5s	remaining: 11m 16s
161:	learn: 0.2101389	total: 22.6s	remaining: 11m 15s
162:	learn: 0.2099101	total: 22.8s	remaining: 11m 15s
163:	learn: 0.2093929	total: 22.9s	remaining: 11m 14s
164:	learn: 0.2089516	total: 23s	remaining: 11m 14s
165:	learn: 0.2085909	total: 23.1s	remaining: 11m 13s
166:	learn: 0.2080423	total: 23.3s	remaining: 11m 13s
167:	learn: 0.2078520	total: 23.4s	remaining: 11m 13s
168:	learn: 0.2073072	total: 23.5s	remaining: 11m 13s
169:	learn: 0.2070436	total: 23.7s	remaining: 11m 12s
170:	learn: 0.2066185	total: 23.8s	remaining: 11m 12s
171:	learn: 0.2059472	total: 23.9s	remaining: 11m 11s
172:	learn: 0.2052204	total: 24.1s	remaining: 11m 11s
173:	learn: 0.2045306	total: 24.2s	remaining: 11m 11s
174:	learn: 0.2043293	total: 24.

310:	learn: 0.1649214	total: 42.8s	remaining: 10m 44s
311:	learn: 0.1648478	total: 42.9s	remaining: 10m 44s
312:	learn: 0.1647743	total: 43s	remaining: 10m 44s
313:	learn: 0.1643414	total: 43.2s	remaining: 10m 44s
314:	learn: 0.1642358	total: 43.3s	remaining: 10m 44s
315:	learn: 0.1641653	total: 43.5s	remaining: 10m 44s
316:	learn: 0.1640920	total: 43.6s	remaining: 10m 43s
317:	learn: 0.1634830	total: 43.7s	remaining: 10m 43s
318:	learn: 0.1634103	total: 43.9s	remaining: 10m 43s
319:	learn: 0.1630543	total: 44s	remaining: 10m 43s
320:	learn: 0.1629586	total: 44.1s	remaining: 10m 43s
321:	learn: 0.1628868	total: 44.3s	remaining: 10m 42s
322:	learn: 0.1625740	total: 44.4s	remaining: 10m 42s
323:	learn: 0.1625021	total: 44.5s	remaining: 10m 42s
324:	learn: 0.1623604	total: 44.7s	remaining: 10m 42s
325:	learn: 0.1619510	total: 44.8s	remaining: 10m 42s
326:	learn: 0.1618803	total: 44.9s	remaining: 10m 41s
327:	learn: 0.1615495	total: 45.1s	remaining: 10m 41s
328:	learn: 0.1612585	total: 45.

464:	learn: 0.1398772	total: 1m 3s	remaining: 10m 19s
465:	learn: 0.1397995	total: 1m 3s	remaining: 10m 19s
466:	learn: 0.1397497	total: 1m 3s	remaining: 10m 19s
467:	learn: 0.1397010	total: 1m 3s	remaining: 10m 19s
468:	learn: 0.1394410	total: 1m 4s	remaining: 10m 19s
469:	learn: 0.1393917	total: 1m 4s	remaining: 10m 19s
470:	learn: 0.1391965	total: 1m 4s	remaining: 10m 18s
471:	learn: 0.1391469	total: 1m 4s	remaining: 10m 18s
472:	learn: 0.1389037	total: 1m 4s	remaining: 10m 18s
473:	learn: 0.1386290	total: 1m 4s	remaining: 10m 18s
474:	learn: 0.1382789	total: 1m 4s	remaining: 10m 18s
475:	learn: 0.1382295	total: 1m 5s	remaining: 10m 18s
476:	learn: 0.1377735	total: 1m 5s	remaining: 10m 17s
477:	learn: 0.1375912	total: 1m 5s	remaining: 10m 17s
478:	learn: 0.1372198	total: 1m 5s	remaining: 10m 17s
479:	learn: 0.1371701	total: 1m 5s	remaining: 10m 17s
480:	learn: 0.1370935	total: 1m 5s	remaining: 10m 17s
481:	learn: 0.1367210	total: 1m 5s	remaining: 10m 17s
482:	learn: 0.1366715	total:

616:	learn: 0.1221305	total: 1m 24s	remaining: 9m 58s
617:	learn: 0.1219856	total: 1m 24s	remaining: 9m 58s
618:	learn: 0.1218860	total: 1m 24s	remaining: 9m 58s
619:	learn: 0.1218273	total: 1m 24s	remaining: 9m 57s
620:	learn: 0.1217898	total: 1m 24s	remaining: 9m 57s
621:	learn: 0.1217529	total: 1m 24s	remaining: 9m 57s
622:	learn: 0.1214243	total: 1m 25s	remaining: 9m 57s
623:	learn: 0.1213872	total: 1m 25s	remaining: 9m 57s
624:	learn: 0.1213505	total: 1m 25s	remaining: 9m 57s
625:	learn: 0.1213137	total: 1m 25s	remaining: 9m 56s
626:	learn: 0.1212365	total: 1m 25s	remaining: 9m 56s
627:	learn: 0.1210961	total: 1m 25s	remaining: 9m 56s
628:	learn: 0.1208703	total: 1m 25s	remaining: 9m 56s
629:	learn: 0.1205873	total: 1m 25s	remaining: 9m 56s
630:	learn: 0.1205507	total: 1m 26s	remaining: 9m 56s
631:	learn: 0.1203440	total: 1m 26s	remaining: 9m 56s
632:	learn: 0.1201147	total: 1m 26s	remaining: 9m 55s
633:	learn: 0.1200190	total: 1m 26s	remaining: 9m 55s
634:	learn: 0.1199588	total:

768:	learn: 0.1080461	total: 1m 45s	remaining: 9m 40s
769:	learn: 0.1080164	total: 1m 45s	remaining: 9m 40s
770:	learn: 0.1079867	total: 1m 45s	remaining: 9m 40s
771:	learn: 0.1077170	total: 1m 45s	remaining: 9m 40s
772:	learn: 0.1074448	total: 1m 46s	remaining: 9m 40s
773:	learn: 0.1074150	total: 1m 46s	remaining: 9m 39s
774:	learn: 0.1073389	total: 1m 46s	remaining: 9m 39s
775:	learn: 0.1073105	total: 1m 46s	remaining: 9m 39s
776:	learn: 0.1072809	total: 1m 46s	remaining: 9m 39s
777:	learn: 0.1072516	total: 1m 46s	remaining: 9m 39s
778:	learn: 0.1072218	total: 1m 46s	remaining: 9m 39s
779:	learn: 0.1071761	total: 1m 47s	remaining: 9m 39s
780:	learn: 0.1071470	total: 1m 47s	remaining: 9m 39s
781:	learn: 0.1070866	total: 1m 47s	remaining: 9m 39s
782:	learn: 0.1070576	total: 1m 47s	remaining: 9m 39s
783:	learn: 0.1069903	total: 1m 47s	remaining: 9m 38s
784:	learn: 0.1069616	total: 1m 47s	remaining: 9m 38s
785:	learn: 0.1066253	total: 1m 47s	remaining: 9m 38s
786:	learn: 0.1065756	total:

922:	learn: 0.0965778	total: 2m 6s	remaining: 9m 20s
923:	learn: 0.0965540	total: 2m 7s	remaining: 9m 20s
924:	learn: 0.0965151	total: 2m 7s	remaining: 9m 20s
925:	learn: 0.0963284	total: 2m 7s	remaining: 9m 19s
926:	learn: 0.0963038	total: 2m 7s	remaining: 9m 19s
927:	learn: 0.0962198	total: 2m 7s	remaining: 9m 19s
928:	learn: 0.0961964	total: 2m 7s	remaining: 9m 19s
929:	learn: 0.0961726	total: 2m 7s	remaining: 9m 19s
930:	learn: 0.0960416	total: 2m 7s	remaining: 9m 19s
931:	learn: 0.0960047	total: 2m 8s	remaining: 9m 19s
932:	learn: 0.0959811	total: 2m 8s	remaining: 9m 18s
933:	learn: 0.0959178	total: 2m 8s	remaining: 9m 18s
934:	learn: 0.0958943	total: 2m 8s	remaining: 9m 18s
935:	learn: 0.0958709	total: 2m 8s	remaining: 9m 18s
936:	learn: 0.0957169	total: 2m 8s	remaining: 9m 18s
937:	learn: 0.0956936	total: 2m 8s	remaining: 9m 18s
938:	learn: 0.0956703	total: 2m 9s	remaining: 9m 18s
939:	learn: 0.0956326	total: 2m 9s	remaining: 9m 18s
940:	learn: 0.0956093	total: 2m 9s	remaining: 

1076:	learn: 0.0866841	total: 2m 27s	remaining: 8m 58s
1077:	learn: 0.0866649	total: 2m 28s	remaining: 8m 58s
1078:	learn: 0.0866456	total: 2m 28s	remaining: 8m 58s
1079:	learn: 0.0865673	total: 2m 28s	remaining: 8m 58s
1080:	learn: 0.0865063	total: 2m 28s	remaining: 8m 58s
1081:	learn: 0.0864879	total: 2m 28s	remaining: 8m 58s
1082:	learn: 0.0863874	total: 2m 28s	remaining: 8m 58s
1083:	learn: 0.0863678	total: 2m 28s	remaining: 8m 57s
1084:	learn: 0.0863365	total: 2m 29s	remaining: 8m 57s
1085:	learn: 0.0863175	total: 2m 29s	remaining: 8m 57s
1086:	learn: 0.0862985	total: 2m 29s	remaining: 8m 57s
1087:	learn: 0.0862796	total: 2m 29s	remaining: 8m 57s
1088:	learn: 0.0862430	total: 2m 29s	remaining: 8m 57s
1089:	learn: 0.0862244	total: 2m 29s	remaining: 8m 57s
1090:	learn: 0.0861912	total: 2m 29s	remaining: 8m 57s
1091:	learn: 0.0860954	total: 2m 30s	remaining: 8m 56s
1092:	learn: 0.0860653	total: 2m 30s	remaining: 8m 56s
1093:	learn: 0.0860466	total: 2m 30s	remaining: 8m 56s
1094:	lear

1226:	learn: 0.0787804	total: 2m 48s	remaining: 8m 39s
1227:	learn: 0.0787638	total: 2m 49s	remaining: 8m 39s
1228:	learn: 0.0787474	total: 2m 49s	remaining: 8m 39s
1229:	learn: 0.0786223	total: 2m 49s	remaining: 8m 39s
1230:	learn: 0.0785660	total: 2m 49s	remaining: 8m 38s
1231:	learn: 0.0785499	total: 2m 49s	remaining: 8m 38s
1232:	learn: 0.0784606	total: 2m 49s	remaining: 8m 38s
1233:	learn: 0.0784441	total: 2m 49s	remaining: 8m 38s
1234:	learn: 0.0783971	total: 2m 50s	remaining: 8m 38s
1235:	learn: 0.0783201	total: 2m 50s	remaining: 8m 38s
1236:	learn: 0.0782693	total: 2m 50s	remaining: 8m 38s
1237:	learn: 0.0782531	total: 2m 50s	remaining: 8m 38s
1238:	learn: 0.0782070	total: 2m 50s	remaining: 8m 38s
1239:	learn: 0.0781908	total: 2m 50s	remaining: 8m 37s
1240:	learn: 0.0781646	total: 2m 50s	remaining: 8m 37s
1241:	learn: 0.0781376	total: 2m 51s	remaining: 8m 37s
1242:	learn: 0.0780540	total: 2m 51s	remaining: 8m 37s
1243:	learn: 0.0780378	total: 2m 51s	remaining: 8m 37s
1244:	lear

1378:	learn: 0.0727295	total: 3m 9s	remaining: 8m 18s
1379:	learn: 0.0727156	total: 3m 10s	remaining: 8m 18s
1380:	learn: 0.0727019	total: 3m 10s	remaining: 8m 18s
1381:	learn: 0.0725318	total: 3m 10s	remaining: 8m 18s
1382:	learn: 0.0724587	total: 3m 10s	remaining: 8m 18s
1383:	learn: 0.0724448	total: 3m 10s	remaining: 8m 18s
1384:	learn: 0.0722644	total: 3m 10s	remaining: 8m 17s
1385:	learn: 0.0722148	total: 3m 10s	remaining: 8m 17s
1386:	learn: 0.0722011	total: 3m 11s	remaining: 8m 17s
1387:	learn: 0.0721873	total: 3m 11s	remaining: 8m 17s
1388:	learn: 0.0720223	total: 3m 11s	remaining: 8m 17s
1389:	learn: 0.0719983	total: 3m 11s	remaining: 8m 17s
1390:	learn: 0.0718955	total: 3m 11s	remaining: 8m 17s
1391:	learn: 0.0718821	total: 3m 11s	remaining: 8m 16s
1392:	learn: 0.0718681	total: 3m 11s	remaining: 8m 16s
1393:	learn: 0.0717306	total: 3m 12s	remaining: 8m 16s
1394:	learn: 0.0717106	total: 3m 12s	remaining: 8m 16s
1395:	learn: 0.0716969	total: 3m 12s	remaining: 8m 16s
1396:	learn

1530:	learn: 0.0667599	total: 3m 30s	remaining: 7m 57s
1531:	learn: 0.0667482	total: 3m 31s	remaining: 7m 57s
1532:	learn: 0.0667366	total: 3m 31s	remaining: 7m 57s
1533:	learn: 0.0666408	total: 3m 31s	remaining: 7m 57s
1534:	learn: 0.0666290	total: 3m 31s	remaining: 7m 57s
1535:	learn: 0.0664595	total: 3m 31s	remaining: 7m 57s
1536:	learn: 0.0664346	total: 3m 31s	remaining: 7m 57s
1537:	learn: 0.0664126	total: 3m 31s	remaining: 7m 56s
1538:	learn: 0.0664009	total: 3m 32s	remaining: 7m 56s
1539:	learn: 0.0663893	total: 3m 32s	remaining: 7m 56s
1540:	learn: 0.0663777	total: 3m 32s	remaining: 7m 56s
1541:	learn: 0.0663661	total: 3m 32s	remaining: 7m 56s
1542:	learn: 0.0663449	total: 3m 32s	remaining: 7m 56s
1543:	learn: 0.0663258	total: 3m 32s	remaining: 7m 56s
1544:	learn: 0.0662253	total: 3m 32s	remaining: 7m 55s
1545:	learn: 0.0661283	total: 3m 32s	remaining: 7m 55s
1546:	learn: 0.0661166	total: 3m 33s	remaining: 7m 55s
1547:	learn: 0.0661051	total: 3m 33s	remaining: 7m 55s
1548:	lear

1680:	learn: 0.0618634	total: 3m 51s	remaining: 7m 37s
1681:	learn: 0.0618533	total: 3m 51s	remaining: 7m 36s
1682:	learn: 0.0617446	total: 3m 51s	remaining: 7m 36s
1683:	learn: 0.0617276	total: 3m 51s	remaining: 7m 36s
1684:	learn: 0.0617174	total: 3m 52s	remaining: 7m 36s
1685:	learn: 0.0617070	total: 3m 52s	remaining: 7m 36s
1686:	learn: 0.0616260	total: 3m 52s	remaining: 7m 36s
1687:	learn: 0.0616004	total: 3m 52s	remaining: 7m 36s
1688:	learn: 0.0615902	total: 3m 52s	remaining: 7m 35s
1689:	learn: 0.0615745	total: 3m 52s	remaining: 7m 35s
1690:	learn: 0.0614973	total: 3m 52s	remaining: 7m 35s
1691:	learn: 0.0614870	total: 3m 53s	remaining: 7m 35s
1692:	learn: 0.0614768	total: 3m 53s	remaining: 7m 35s
1693:	learn: 0.0614666	total: 3m 53s	remaining: 7m 35s
1694:	learn: 0.0613928	total: 3m 53s	remaining: 7m 35s
1695:	learn: 0.0613825	total: 3m 53s	remaining: 7m 35s
1696:	learn: 0.0613725	total: 3m 53s	remaining: 7m 35s
1697:	learn: 0.0613625	total: 3m 53s	remaining: 7m 34s
1698:	lear

1832:	learn: 0.0574070	total: 4m 12s	remaining: 7m 16s
1833:	learn: 0.0573982	total: 4m 12s	remaining: 7m 15s
1834:	learn: 0.0573819	total: 4m 12s	remaining: 7m 15s
1835:	learn: 0.0573273	total: 4m 12s	remaining: 7m 15s
1836:	learn: 0.0573060	total: 4m 12s	remaining: 7m 15s
1837:	learn: 0.0572972	total: 4m 13s	remaining: 7m 15s
1838:	learn: 0.0572358	total: 4m 13s	remaining: 7m 15s
1839:	learn: 0.0572276	total: 4m 13s	remaining: 7m 15s
1840:	learn: 0.0572188	total: 4m 13s	remaining: 7m 14s
1841:	learn: 0.0572105	total: 4m 13s	remaining: 7m 14s
1842:	learn: 0.0572019	total: 4m 13s	remaining: 7m 14s
1843:	learn: 0.0571315	total: 4m 13s	remaining: 7m 14s
1844:	learn: 0.0571024	total: 4m 13s	remaining: 7m 14s
1845:	learn: 0.0569994	total: 4m 14s	remaining: 7m 14s
1846:	learn: 0.0569670	total: 4m 14s	remaining: 7m 14s
1847:	learn: 0.0569582	total: 4m 14s	remaining: 7m 13s
1848:	learn: 0.0569494	total: 4m 14s	remaining: 7m 13s
1849:	learn: 0.0569205	total: 4m 14s	remaining: 7m 13s
1850:	lear

1984:	learn: 0.0535539	total: 4m 33s	remaining: 6m 55s
1985:	learn: 0.0535462	total: 4m 33s	remaining: 6m 55s
1986:	learn: 0.0534768	total: 4m 33s	remaining: 6m 55s
1987:	learn: 0.0534511	total: 4m 33s	remaining: 6m 55s
1988:	learn: 0.0534433	total: 4m 34s	remaining: 6m 54s
1989:	learn: 0.0533841	total: 4m 34s	remaining: 6m 54s
1990:	learn: 0.0533763	total: 4m 34s	remaining: 6m 54s
1991:	learn: 0.0533685	total: 4m 34s	remaining: 6m 54s
1992:	learn: 0.0533607	total: 4m 34s	remaining: 6m 54s
1993:	learn: 0.0533532	total: 4m 34s	remaining: 6m 54s
1994:	learn: 0.0533454	total: 4m 34s	remaining: 6m 54s
1995:	learn: 0.0532483	total: 4m 35s	remaining: 6m 53s
1996:	learn: 0.0532284	total: 4m 35s	remaining: 6m 53s
1997:	learn: 0.0532207	total: 4m 35s	remaining: 6m 53s
1998:	learn: 0.0532049	total: 4m 35s	remaining: 6m 53s
1999:	learn: 0.0531971	total: 4m 35s	remaining: 6m 53s
2000:	learn: 0.0531895	total: 4m 35s	remaining: 6m 53s
2001:	learn: 0.0531818	total: 4m 35s	remaining: 6m 53s
2002:	lear

2134:	learn: 0.0502124	total: 4m 54s	remaining: 6m 35s
2135:	learn: 0.0502054	total: 4m 54s	remaining: 6m 35s
2136:	learn: 0.0501624	total: 4m 55s	remaining: 6m 35s
2137:	learn: 0.0501557	total: 4m 55s	remaining: 6m 35s
2138:	learn: 0.0501417	total: 4m 55s	remaining: 6m 35s
2139:	learn: 0.0501239	total: 4m 55s	remaining: 6m 35s
2140:	learn: 0.0501172	total: 4m 55s	remaining: 6m 34s
2141:	learn: 0.0501005	total: 4m 55s	remaining: 6m 34s
2142:	learn: 0.0500935	total: 4m 56s	remaining: 6m 34s
2143:	learn: 0.0500727	total: 4m 56s	remaining: 6m 34s
2144:	learn: 0.0500662	total: 4m 56s	remaining: 6m 34s
2145:	learn: 0.0500597	total: 4m 56s	remaining: 6m 34s
2146:	learn: 0.0499848	total: 4m 56s	remaining: 6m 34s
2147:	learn: 0.0499728	total: 4m 56s	remaining: 6m 34s
2148:	learn: 0.0499661	total: 4m 56s	remaining: 6m 33s
2149:	learn: 0.0499547	total: 4m 57s	remaining: 6m 33s
2150:	learn: 0.0499308	total: 4m 57s	remaining: 6m 33s
2151:	learn: 0.0498849	total: 4m 57s	remaining: 6m 33s
2152:	lear

2286:	learn: 0.0472310	total: 5m 16s	remaining: 6m 14s
2287:	learn: 0.0471891	total: 5m 16s	remaining: 6m 14s
2288:	learn: 0.0471831	total: 5m 16s	remaining: 6m 14s
2289:	learn: 0.0471703	total: 5m 16s	remaining: 6m 14s
2290:	learn: 0.0471597	total: 5m 16s	remaining: 6m 14s
2291:	learn: 0.0471226	total: 5m 16s	remaining: 6m 14s
2292:	learn: 0.0471166	total: 5m 16s	remaining: 6m 14s
2293:	learn: 0.0470505	total: 5m 16s	remaining: 6m 13s
2294:	learn: 0.0470444	total: 5m 17s	remaining: 6m 13s
2295:	learn: 0.0469875	total: 5m 17s	remaining: 6m 13s
2296:	learn: 0.0469813	total: 5m 17s	remaining: 6m 13s
2297:	learn: 0.0469104	total: 5m 17s	remaining: 6m 13s
2298:	learn: 0.0468958	total: 5m 17s	remaining: 6m 13s
2299:	learn: 0.0468898	total: 5m 17s	remaining: 6m 13s
2300:	learn: 0.0468837	total: 5m 17s	remaining: 6m 12s
2301:	learn: 0.0467829	total: 5m 18s	remaining: 6m 12s
2302:	learn: 0.0467684	total: 5m 18s	remaining: 6m 12s
2303:	learn: 0.0467622	total: 5m 18s	remaining: 6m 12s
2304:	lear

2438:	learn: 0.0445236	total: 5m 36s	remaining: 5m 53s
2439:	learn: 0.0445183	total: 5m 36s	remaining: 5m 53s
2440:	learn: 0.0445070	total: 5m 36s	remaining: 5m 53s
2441:	learn: 0.0445015	total: 5m 37s	remaining: 5m 53s
2442:	learn: 0.0444489	total: 5m 37s	remaining: 5m 52s
2443:	learn: 0.0444436	total: 5m 37s	remaining: 5m 52s
2444:	learn: 0.0444341	total: 5m 37s	remaining: 5m 52s
2445:	learn: 0.0444198	total: 5m 37s	remaining: 5m 52s
2446:	learn: 0.0444143	total: 5m 37s	remaining: 5m 52s
2447:	learn: 0.0443400	total: 5m 37s	remaining: 5m 52s
2448:	learn: 0.0443295	total: 5m 38s	remaining: 5m 52s
2449:	learn: 0.0443239	total: 5m 38s	remaining: 5m 51s
2450:	learn: 0.0442913	total: 5m 38s	remaining: 5m 51s
2451:	learn: 0.0442855	total: 5m 38s	remaining: 5m 51s
2452:	learn: 0.0442803	total: 5m 38s	remaining: 5m 51s
2453:	learn: 0.0442749	total: 5m 38s	remaining: 5m 51s
2454:	learn: 0.0442695	total: 5m 38s	remaining: 5m 51s
2455:	learn: 0.0442641	total: 5m 38s	remaining: 5m 51s
2456:	lear

2588:	learn: 0.0420843	total: 5m 57s	remaining: 5m 32s
2589:	learn: 0.0420790	total: 5m 57s	remaining: 5m 32s
2590:	learn: 0.0420741	total: 5m 57s	remaining: 5m 32s
2591:	learn: 0.0420640	total: 5m 57s	remaining: 5m 32s
2592:	learn: 0.0420591	total: 5m 57s	remaining: 5m 31s
2593:	learn: 0.0420542	total: 5m 57s	remaining: 5m 31s
2594:	learn: 0.0420493	total: 5m 57s	remaining: 5m 31s
2595:	learn: 0.0420444	total: 5m 58s	remaining: 5m 31s
2596:	learn: 0.0420281	total: 5m 58s	remaining: 5m 31s
2597:	learn: 0.0420234	total: 5m 58s	remaining: 5m 31s
2598:	learn: 0.0420128	total: 5m 58s	remaining: 5m 31s
2599:	learn: 0.0420027	total: 5m 58s	remaining: 5m 30s
2600:	learn: 0.0419522	total: 5m 58s	remaining: 5m 30s
2601:	learn: 0.0419428	total: 5m 58s	remaining: 5m 30s
2602:	learn: 0.0419380	total: 5m 58s	remaining: 5m 30s
2603:	learn: 0.0419331	total: 5m 59s	remaining: 5m 30s
2604:	learn: 0.0419284	total: 5m 59s	remaining: 5m 30s
2605:	learn: 0.0419235	total: 5m 59s	remaining: 5m 30s
2606:	lear

2740:	learn: 0.0399409	total: 6m 17s	remaining: 5m 11s
2741:	learn: 0.0399365	total: 6m 18s	remaining: 5m 11s
2742:	learn: 0.0399320	total: 6m 18s	remaining: 5m 11s
2743:	learn: 0.0399277	total: 6m 18s	remaining: 5m 11s
2744:	learn: 0.0398984	total: 6m 18s	remaining: 5m 10s
2745:	learn: 0.0398906	total: 6m 18s	remaining: 5m 10s
2746:	learn: 0.0398844	total: 6m 18s	remaining: 5m 10s
2747:	learn: 0.0398517	total: 6m 18s	remaining: 5m 10s
2748:	learn: 0.0398474	total: 6m 19s	remaining: 5m 10s
2749:	learn: 0.0398429	total: 6m 19s	remaining: 5m 10s
2750:	learn: 0.0398386	total: 6m 19s	remaining: 5m 10s
2751:	learn: 0.0397854	total: 6m 19s	remaining: 5m 10s
2752:	learn: 0.0397808	total: 6m 19s	remaining: 5m 9s
2753:	learn: 0.0397765	total: 6m 19s	remaining: 5m 9s
2754:	learn: 0.0397720	total: 6m 19s	remaining: 5m 9s
2755:	learn: 0.0397255	total: 6m 20s	remaining: 5m 9s
2756:	learn: 0.0397209	total: 6m 20s	remaining: 5m 9s
2757:	learn: 0.0397020	total: 6m 20s	remaining: 5m 9s
2758:	learn: 0.0

2892:	learn: 0.0379419	total: 6m 39s	remaining: 4m 50s
2893:	learn: 0.0379092	total: 6m 39s	remaining: 4m 50s
2894:	learn: 0.0378883	total: 6m 39s	remaining: 4m 50s
2895:	learn: 0.0378844	total: 6m 39s	remaining: 4m 50s
2896:	learn: 0.0378803	total: 6m 39s	remaining: 4m 50s
2897:	learn: 0.0378763	total: 6m 39s	remaining: 4m 50s
2898:	learn: 0.0378605	total: 6m 40s	remaining: 4m 49s
2899:	learn: 0.0378472	total: 6m 40s	remaining: 4m 49s
2900:	learn: 0.0378052	total: 6m 40s	remaining: 4m 49s
2901:	learn: 0.0377982	total: 6m 40s	remaining: 4m 49s
2902:	learn: 0.0377942	total: 6m 40s	remaining: 4m 49s
2903:	learn: 0.0377902	total: 6m 40s	remaining: 4m 49s
2904:	learn: 0.0377796	total: 6m 40s	remaining: 4m 49s
2905:	learn: 0.0377757	total: 6m 41s	remaining: 4m 48s
2906:	learn: 0.0377717	total: 6m 41s	remaining: 4m 48s
2907:	learn: 0.0377621	total: 6m 41s	remaining: 4m 48s
2908:	learn: 0.0377549	total: 6m 41s	remaining: 4m 48s
2909:	learn: 0.0377439	total: 6m 41s	remaining: 4m 48s
2910:	lear

3042:	learn: 0.0360758	total: 7m 2s	remaining: 4m 31s
3043:	learn: 0.0360722	total: 7m 2s	remaining: 4m 31s
3044:	learn: 0.0359760	total: 7m 2s	remaining: 4m 31s
3045:	learn: 0.0359654	total: 7m 2s	remaining: 4m 31s
3046:	learn: 0.0359266	total: 7m 2s	remaining: 4m 30s
3047:	learn: 0.0359228	total: 7m 2s	remaining: 4m 30s
3048:	learn: 0.0359191	total: 7m 2s	remaining: 4m 30s
3049:	learn: 0.0359155	total: 7m 3s	remaining: 4m 30s
3050:	learn: 0.0359118	total: 7m 3s	remaining: 4m 30s
3051:	learn: 0.0359082	total: 7m 3s	remaining: 4m 30s
3052:	learn: 0.0359045	total: 7m 3s	remaining: 4m 30s
3053:	learn: 0.0358870	total: 7m 3s	remaining: 4m 29s
3054:	learn: 0.0358540	total: 7m 3s	remaining: 4m 29s
3055:	learn: 0.0358461	total: 7m 3s	remaining: 4m 29s
3056:	learn: 0.0358147	total: 7m 4s	remaining: 4m 29s
3057:	learn: 0.0358109	total: 7m 4s	remaining: 4m 29s
3058:	learn: 0.0358073	total: 7m 4s	remaining: 4m 29s
3059:	learn: 0.0358037	total: 7m 4s	remaining: 4m 29s
3060:	learn: 0.0357766	total

3193:	learn: 0.0342225	total: 7m 26s	remaining: 4m 12s
3194:	learn: 0.0342163	total: 7m 26s	remaining: 4m 12s
3195:	learn: 0.0341725	total: 7m 26s	remaining: 4m 12s
3196:	learn: 0.0341636	total: 7m 26s	remaining: 4m 11s
3197:	learn: 0.0341603	total: 7m 26s	remaining: 4m 11s
3198:	learn: 0.0341568	total: 7m 26s	remaining: 4m 11s
3199:	learn: 0.0341536	total: 7m 27s	remaining: 4m 11s
3200:	learn: 0.0341501	total: 7m 27s	remaining: 4m 11s
3201:	learn: 0.0341052	total: 7m 27s	remaining: 4m 11s
3202:	learn: 0.0341012	total: 7m 27s	remaining: 4m 11s
3203:	learn: 0.0340952	total: 7m 27s	remaining: 4m 10s
3204:	learn: 0.0340918	total: 7m 27s	remaining: 4m 10s
3205:	learn: 0.0340886	total: 7m 28s	remaining: 4m 10s
3206:	learn: 0.0340853	total: 7m 28s	remaining: 4m 10s
3207:	learn: 0.0340820	total: 7m 28s	remaining: 4m 10s
3208:	learn: 0.0340732	total: 7m 28s	remaining: 4m 10s
3209:	learn: 0.0340697	total: 7m 28s	remaining: 4m 10s
3210:	learn: 0.0340665	total: 7m 28s	remaining: 4m 10s
3211:	lear

3344:	learn: 0.0327483	total: 7m 48s	remaining: 3m 51s
3345:	learn: 0.0327174	total: 7m 48s	remaining: 3m 51s
3346:	learn: 0.0327116	total: 7m 48s	remaining: 3m 51s
3347:	learn: 0.0327086	total: 7m 48s	remaining: 3m 51s
3348:	learn: 0.0326854	total: 7m 48s	remaining: 3m 51s
3349:	learn: 0.0326823	total: 7m 48s	remaining: 3m 50s
3350:	learn: 0.0325947	total: 7m 49s	remaining: 3m 50s
3351:	learn: 0.0325910	total: 7m 49s	remaining: 3m 50s
3352:	learn: 0.0325880	total: 7m 49s	remaining: 3m 50s
3353:	learn: 0.0325849	total: 7m 49s	remaining: 3m 50s
3354:	learn: 0.0325764	total: 7m 49s	remaining: 3m 50s
3355:	learn: 0.0325734	total: 7m 49s	remaining: 3m 50s
3356:	learn: 0.0325664	total: 7m 49s	remaining: 3m 49s
3357:	learn: 0.0325634	total: 7m 49s	remaining: 3m 49s
3358:	learn: 0.0325563	total: 7m 50s	remaining: 3m 49s
3359:	learn: 0.0325531	total: 7m 50s	remaining: 3m 49s
3360:	learn: 0.0325384	total: 7m 50s	remaining: 3m 49s
3361:	learn: 0.0325187	total: 7m 50s	remaining: 3m 49s
3362:	lear

3496:	learn: 0.0311293	total: 8m 10s	remaining: 3m 30s
3497:	learn: 0.0311098	total: 8m 10s	remaining: 3m 30s
3498:	learn: 0.0311049	total: 8m 10s	remaining: 3m 30s
3499:	learn: 0.0311020	total: 8m 11s	remaining: 3m 30s
3500:	learn: 0.0310993	total: 8m 11s	remaining: 3m 30s
3501:	learn: 0.0310869	total: 8m 11s	remaining: 3m 30s
3502:	learn: 0.0310842	total: 8m 11s	remaining: 3m 30s
3503:	learn: 0.0310204	total: 8m 11s	remaining: 3m 29s
3504:	learn: 0.0310095	total: 8m 11s	remaining: 3m 29s
3505:	learn: 0.0310066	total: 8m 12s	remaining: 3m 29s
3506:	learn: 0.0310038	total: 8m 12s	remaining: 3m 29s
3507:	learn: 0.0309874	total: 8m 12s	remaining: 3m 29s
3508:	learn: 0.0309845	total: 8m 12s	remaining: 3m 29s
3509:	learn: 0.0309541	total: 8m 12s	remaining: 3m 29s
3510:	learn: 0.0309512	total: 8m 12s	remaining: 3m 28s
3511:	learn: 0.0309484	total: 8m 12s	remaining: 3m 28s
3512:	learn: 0.0309415	total: 8m 13s	remaining: 3m 28s
3513:	learn: 0.0309257	total: 8m 13s	remaining: 3m 28s
3514:	lear

3646:	learn: 0.0298490	total: 8m 32s	remaining: 3m 10s
3647:	learn: 0.0298463	total: 8m 32s	remaining: 3m 9s
3648:	learn: 0.0298418	total: 8m 32s	remaining: 3m 9s
3649:	learn: 0.0298391	total: 8m 32s	remaining: 3m 9s
3650:	learn: 0.0298366	total: 8m 32s	remaining: 3m 9s
3651:	learn: 0.0298341	total: 8m 33s	remaining: 3m 9s
3652:	learn: 0.0298181	total: 8m 33s	remaining: 3m 9s
3653:	learn: 0.0298107	total: 8m 33s	remaining: 3m 9s
3654:	learn: 0.0297977	total: 8m 33s	remaining: 3m 8s
3655:	learn: 0.0297952	total: 8m 33s	remaining: 3m 8s
3656:	learn: 0.0297868	total: 8m 33s	remaining: 3m 8s
3657:	learn: 0.0297824	total: 8m 33s	remaining: 3m 8s
3658:	learn: 0.0297791	total: 8m 34s	remaining: 3m 8s
3659:	learn: 0.0297765	total: 8m 34s	remaining: 3m 8s
3660:	learn: 0.0297740	total: 8m 34s	remaining: 3m 8s
3661:	learn: 0.0297714	total: 8m 34s	remaining: 3m 7s
3662:	learn: 0.0297599	total: 8m 34s	remaining: 3m 7s
3663:	learn: 0.0297574	total: 8m 34s	remaining: 3m 7s
3664:	learn: 0.0297549	tota

3798:	learn: 0.0286524	total: 8m 53s	remaining: 2m 48s
3799:	learn: 0.0286478	total: 8m 53s	remaining: 2m 48s
3800:	learn: 0.0286455	total: 8m 53s	remaining: 2m 48s
3801:	learn: 0.0286415	total: 8m 53s	remaining: 2m 48s
3802:	learn: 0.0286391	total: 8m 54s	remaining: 2m 48s
3803:	learn: 0.0286323	total: 8m 54s	remaining: 2m 47s
3804:	learn: 0.0286298	total: 8m 54s	remaining: 2m 47s
3805:	learn: 0.0286133	total: 8m 54s	remaining: 2m 47s
3806:	learn: 0.0286111	total: 8m 54s	remaining: 2m 47s
3807:	learn: 0.0285999	total: 8m 54s	remaining: 2m 47s
3808:	learn: 0.0285976	total: 8m 54s	remaining: 2m 47s
3809:	learn: 0.0285953	total: 8m 54s	remaining: 2m 47s
3810:	learn: 0.0285832	total: 8m 55s	remaining: 2m 46s
3811:	learn: 0.0285809	total: 8m 55s	remaining: 2m 46s
3812:	learn: 0.0285760	total: 8m 55s	remaining: 2m 46s
3813:	learn: 0.0285556	total: 8m 55s	remaining: 2m 46s
3814:	learn: 0.0285532	total: 8m 55s	remaining: 2m 46s
3815:	learn: 0.0285488	total: 8m 55s	remaining: 2m 46s
3816:	lear

3949:	learn: 0.0274741	total: 9m 16s	remaining: 2m 27s
3950:	learn: 0.0274680	total: 9m 16s	remaining: 2m 27s
3951:	learn: 0.0274576	total: 9m 16s	remaining: 2m 27s
3952:	learn: 0.0274555	total: 9m 16s	remaining: 2m 27s
3953:	learn: 0.0274533	total: 9m 16s	remaining: 2m 27s
3954:	learn: 0.0274502	total: 9m 17s	remaining: 2m 27s
3955:	learn: 0.0274460	total: 9m 17s	remaining: 2m 27s
3956:	learn: 0.0274417	total: 9m 17s	remaining: 2m 26s
3957:	learn: 0.0274395	total: 9m 17s	remaining: 2m 26s
3958:	learn: 0.0274216	total: 9m 17s	remaining: 2m 26s
3959:	learn: 0.0274020	total: 9m 17s	remaining: 2m 26s
3960:	learn: 0.0273997	total: 9m 17s	remaining: 2m 26s
3961:	learn: 0.0273976	total: 9m 18s	remaining: 2m 26s
3962:	learn: 0.0273841	total: 9m 18s	remaining: 2m 26s
3963:	learn: 0.0273801	total: 9m 18s	remaining: 2m 25s
3964:	learn: 0.0273780	total: 9m 18s	remaining: 2m 25s
3965:	learn: 0.0273731	total: 9m 18s	remaining: 2m 25s
3966:	learn: 0.0273651	total: 9m 18s	remaining: 2m 25s
3967:	lear

4099:	learn: 0.0264545	total: 9m 38s	remaining: 2m 7s
4100:	learn: 0.0264484	total: 9m 39s	remaining: 2m 6s
4101:	learn: 0.0264399	total: 9m 39s	remaining: 2m 6s
4102:	learn: 0.0264379	total: 9m 39s	remaining: 2m 6s
4103:	learn: 0.0264360	total: 9m 39s	remaining: 2m 6s
4104:	learn: 0.0264339	total: 9m 39s	remaining: 2m 6s
4105:	learn: 0.0264087	total: 9m 39s	remaining: 2m 6s
4106:	learn: 0.0264065	total: 9m 40s	remaining: 2m 6s
4107:	learn: 0.0264045	total: 9m 40s	remaining: 2m 5s
4108:	learn: 0.0264025	total: 9m 40s	remaining: 2m 5s
4109:	learn: 0.0264005	total: 9m 40s	remaining: 2m 5s
4110:	learn: 0.0263985	total: 9m 40s	remaining: 2m 5s
4111:	learn: 0.0263964	total: 9m 40s	remaining: 2m 5s
4112:	learn: 0.0263674	total: 9m 41s	remaining: 2m 5s
4113:	learn: 0.0263639	total: 9m 41s	remaining: 2m 5s
4114:	learn: 0.0263618	total: 9m 41s	remaining: 2m 5s
4115:	learn: 0.0263598	total: 9m 41s	remaining: 2m 4s
4116:	learn: 0.0263496	total: 9m 41s	remaining: 2m 4s
4117:	learn: 0.0263336	total

4251:	learn: 0.0254565	total: 10m 4s	remaining: 1m 46s
4252:	learn: 0.0254545	total: 10m 4s	remaining: 1m 46s
4253:	learn: 0.0254512	total: 10m 4s	remaining: 1m 46s
4254:	learn: 0.0254490	total: 10m 5s	remaining: 1m 45s
4255:	learn: 0.0254471	total: 10m 5s	remaining: 1m 45s
4256:	learn: 0.0254431	total: 10m 5s	remaining: 1m 45s
4257:	learn: 0.0254412	total: 10m 5s	remaining: 1m 45s
4258:	learn: 0.0254185	total: 10m 5s	remaining: 1m 45s
4259:	learn: 0.0254133	total: 10m 5s	remaining: 1m 45s
4260:	learn: 0.0254113	total: 10m 5s	remaining: 1m 45s
4261:	learn: 0.0254095	total: 10m 6s	remaining: 1m 44s
4262:	learn: 0.0254015	total: 10m 6s	remaining: 1m 44s
4263:	learn: 0.0253909	total: 10m 6s	remaining: 1m 44s
4264:	learn: 0.0253890	total: 10m 6s	remaining: 1m 44s
4265:	learn: 0.0253856	total: 10m 6s	remaining: 1m 44s
4266:	learn: 0.0253773	total: 10m 6s	remaining: 1m 44s
4267:	learn: 0.0253754	total: 10m 6s	remaining: 1m 44s
4268:	learn: 0.0253519	total: 10m 7s	remaining: 1m 43s
4269:	lear

4399:	learn: 0.0245229	total: 10m 26s	remaining: 1m 25s
4400:	learn: 0.0245211	total: 10m 26s	remaining: 1m 25s
4401:	learn: 0.0245194	total: 10m 26s	remaining: 1m 25s
4402:	learn: 0.0244815	total: 10m 26s	remaining: 1m 24s
4403:	learn: 0.0244766	total: 10m 26s	remaining: 1m 24s
4404:	learn: 0.0244749	total: 10m 26s	remaining: 1m 24s
4405:	learn: 0.0244730	total: 10m 27s	remaining: 1m 24s
4406:	learn: 0.0244713	total: 10m 27s	remaining: 1m 24s
4407:	learn: 0.0244695	total: 10m 27s	remaining: 1m 24s
4408:	learn: 0.0244678	total: 10m 27s	remaining: 1m 24s
4409:	learn: 0.0244661	total: 10m 27s	remaining: 1m 23s
4410:	learn: 0.0244630	total: 10m 27s	remaining: 1m 23s
4411:	learn: 0.0244524	total: 10m 27s	remaining: 1m 23s
4412:	learn: 0.0244502	total: 10m 28s	remaining: 1m 23s
4413:	learn: 0.0244485	total: 10m 28s	remaining: 1m 23s
4414:	learn: 0.0244439	total: 10m 28s	remaining: 1m 23s
4415:	learn: 0.0244406	total: 10m 28s	remaining: 1m 23s
4416:	learn: 0.0244354	total: 10m 28s	remaining:

4546:	learn: 0.0236973	total: 10m 48s	remaining: 1m 4s
4547:	learn: 0.0236958	total: 10m 48s	remaining: 1m 4s
4548:	learn: 0.0236942	total: 10m 48s	remaining: 1m 4s
4549:	learn: 0.0236845	total: 10m 48s	remaining: 1m 4s
4550:	learn: 0.0236829	total: 10m 48s	remaining: 1m 4s
4551:	learn: 0.0236814	total: 10m 49s	remaining: 1m 3s
4552:	learn: 0.0236705	total: 10m 49s	remaining: 1m 3s
4553:	learn: 0.0236600	total: 10m 49s	remaining: 1m 3s
4554:	learn: 0.0236569	total: 10m 49s	remaining: 1m 3s
4555:	learn: 0.0236553	total: 10m 49s	remaining: 1m 3s
4556:	learn: 0.0236536	total: 10m 49s	remaining: 1m 3s
4557:	learn: 0.0236521	total: 10m 50s	remaining: 1m 3s
4558:	learn: 0.0236477	total: 10m 50s	remaining: 1m 2s
4559:	learn: 0.0236462	total: 10m 50s	remaining: 1m 2s
4560:	learn: 0.0236447	total: 10m 50s	remaining: 1m 2s
4561:	learn: 0.0236397	total: 10m 50s	remaining: 1m 2s
4562:	learn: 0.0236316	total: 10m 50s	remaining: 1m 2s
4563:	learn: 0.0236186	total: 10m 50s	remaining: 1m 2s
4564:	lear

4698:	learn: 0.0228594	total: 11m 10s	remaining: 43s
4699:	learn: 0.0228578	total: 11m 10s	remaining: 42.8s
4700:	learn: 0.0228563	total: 11m 11s	remaining: 42.7s
4701:	learn: 0.0228548	total: 11m 11s	remaining: 42.5s
4702:	learn: 0.0228471	total: 11m 11s	remaining: 42.4s
4703:	learn: 0.0228457	total: 11m 11s	remaining: 42.3s
4704:	learn: 0.0228356	total: 11m 11s	remaining: 42.1s
4705:	learn: 0.0228151	total: 11m 11s	remaining: 42s
4706:	learn: 0.0228119	total: 11m 12s	remaining: 41.8s
4707:	learn: 0.0228103	total: 11m 12s	remaining: 41.7s
4708:	learn: 0.0228088	total: 11m 12s	remaining: 41.6s
4709:	learn: 0.0228073	total: 11m 12s	remaining: 41.4s
4710:	learn: 0.0227807	total: 11m 12s	remaining: 41.3s
4711:	learn: 0.0227777	total: 11m 12s	remaining: 41.1s
4712:	learn: 0.0227761	total: 11m 12s	remaining: 41s
4713:	learn: 0.0227746	total: 11m 13s	remaining: 40.8s
4714:	learn: 0.0227704	total: 11m 13s	remaining: 40.7s
4715:	learn: 0.0227363	total: 11m 13s	remaining: 40.6s
4716:	learn: 0.0

4848:	learn: 0.0221193	total: 11m 32s	remaining: 21.6s
4849:	learn: 0.0221166	total: 11m 32s	remaining: 21.4s
4850:	learn: 0.0221069	total: 11m 32s	remaining: 21.3s
4851:	learn: 0.0221055	total: 11m 33s	remaining: 21.1s
4852:	learn: 0.0221017	total: 11m 33s	remaining: 21s
4853:	learn: 0.0221003	total: 11m 33s	remaining: 20.9s
4854:	learn: 0.0220989	total: 11m 33s	remaining: 20.7s
4855:	learn: 0.0220975	total: 11m 33s	remaining: 20.6s
4856:	learn: 0.0220906	total: 11m 33s	remaining: 20.4s
4857:	learn: 0.0220853	total: 11m 34s	remaining: 20.3s
4858:	learn: 0.0220711	total: 11m 34s	remaining: 20.1s
4859:	learn: 0.0220697	total: 11m 34s	remaining: 20s
4860:	learn: 0.0220526	total: 11m 34s	remaining: 19.9s
4861:	learn: 0.0220466	total: 11m 34s	remaining: 19.7s
4862:	learn: 0.0220452	total: 11m 34s	remaining: 19.6s
4863:	learn: 0.0220438	total: 11m 34s	remaining: 19.4s
4864:	learn: 0.0220425	total: 11m 35s	remaining: 19.3s
4865:	learn: 0.0220249	total: 11m 35s	remaining: 19.1s
4866:	learn: 0

4998:	learn: 0.0214478	total: 11m 55s	remaining: 143ms
4999:	learn: 0.0214465	total: 11m 55s	remaining: 0us


<catboost.core.CatBoostClassifier at 0x2986f83b790>

In [152]:
roc_auc_score(y_test, clf2.predict(X_test_vectorized))

0.9183173129294381

### LogisticRegression

In [141]:
clf3 = LogisticRegression()

In [142]:
clf3.fit(X_train_vectorized, y_train)

In [143]:
roc_auc_score(y_test, clf3.predict(X_test_vectorized))

0.9245921817855064

### Логистическая регрессия показала лучший результат, поэтому будем использовать ее для скоринга тестовых данных

In [147]:
test_vectorized = vectorizer.transform(test.text.to_list())

In [148]:
predictions = clf3.predict(test_vectorized)

In [154]:
score = pd.Series(predictions)

In [162]:
ans = pd.DataFrame(data = {'score': score, 'text': test.text}).to_csv('prediction.csv')