<h1>Table of Contents<span class="tocSkip"></span></h1>
<div class="toc"><ul class="toc-item"></ul></div>

In [1]:
import os
import json
import numpy as np
import pandas as pd
import random
import gymnasium as gym
import matplotlib.pyplot as plt
from matplotlib import animation
from catboost import CatBoostClassifier
from sklearn.model_selection import train_test_split
from IPython import display

In [2]:
data_directory = 'states'

In [4]:
X, y = [], []
for filename in os.listdir(data_directory):
    if not filename.startswith('expert') or not filename.endswith('.txt'):
        continue
    with open(f'{data_directory}/{filename}', 'r') as file:
        content = json.load(file)
        memory, action = zip(*content)
        X.extend(memory)
        y.extend(action)
X, y = pd.DataFrame(X), pd.DataFrame(y)

In [6]:
X_train, X_test, y_train, y_test = train_test_split(X, y, 
                                                    test_size=0.2, 
                                                    shuffle=True, 
                                                    stratify=y)

In [7]:
model = CatBoostClassifier(iterations=3500,
                           depth=8, 
                           verbose=True, 
                           loss_function='MultiClass',
                           learning_rate=4e-2)
model.fit(X_train, y_train, eval_set=(X_test, y_test), plot=True)

MetricVisualizer(layout=Layout(align_self='stretch', height='500px'))

0:	learn: 1.5535315	test: 1.5535604	best: 1.5535604 (0)	total: 297ms	remaining: 17m 19s
1:	learn: 1.5051943	test: 1.5051559	best: 1.5051559 (1)	total: 438ms	remaining: 12m 46s
2:	learn: 1.4624494	test: 1.4624346	best: 1.4624346 (2)	total: 570ms	remaining: 11m 4s
3:	learn: 1.4260472	test: 1.4262671	best: 1.4262671 (3)	total: 685ms	remaining: 9m 58s
4:	learn: 1.3916946	test: 1.3919706	best: 1.3919706 (4)	total: 803ms	remaining: 9m 21s
5:	learn: 1.3620930	test: 1.3626728	best: 1.3626728 (5)	total: 932ms	remaining: 9m 3s
6:	learn: 1.3347767	test: 1.3357992	best: 1.3357992 (6)	total: 1.14s	remaining: 9m 28s
7:	learn: 1.3095742	test: 1.3109374	best: 1.3109374 (7)	total: 1.27s	remaining: 9m 16s
8:	learn: 1.2861096	test: 1.2874044	best: 1.2874044 (8)	total: 1.43s	remaining: 9m 13s
9:	learn: 1.2653133	test: 1.2666526	best: 1.2666526 (9)	total: 1.57s	remaining: 9m 8s
10:	learn: 1.2450563	test: 1.2464744	best: 1.2464744 (10)	total: 1.72s	remaining: 9m 5s
11:	learn: 1.2258158	test: 1.2273298	best:

94:	learn: 0.8484372	test: 0.8719999	best: 0.8719999 (94)	total: 12.3s	remaining: 7m 19s
95:	learn: 0.8470711	test: 0.8708180	best: 0.8708180 (95)	total: 12.4s	remaining: 7m 19s
96:	learn: 0.8455711	test: 0.8697814	best: 0.8697814 (96)	total: 12.5s	remaining: 7m 19s
97:	learn: 0.8443054	test: 0.8687603	best: 0.8687603 (97)	total: 12.6s	remaining: 7m 18s
98:	learn: 0.8427933	test: 0.8676243	best: 0.8676243 (98)	total: 12.8s	remaining: 7m 18s
99:	learn: 0.8406203	test: 0.8658587	best: 0.8658587 (99)	total: 12.9s	remaining: 7m 17s
100:	learn: 0.8390231	test: 0.8646142	best: 0.8646142 (100)	total: 13s	remaining: 7m 17s
101:	learn: 0.8370993	test: 0.8630254	best: 0.8630254 (101)	total: 13.1s	remaining: 7m 16s
102:	learn: 0.8354825	test: 0.8616990	best: 0.8616990 (102)	total: 13.2s	remaining: 7m 16s
103:	learn: 0.8336436	test: 0.8601868	best: 0.8601868 (103)	total: 13.4s	remaining: 7m 16s
104:	learn: 0.8326561	test: 0.8594587	best: 0.8594587 (104)	total: 13.5s	remaining: 7m 16s
105:	learn: 0

186:	learn: 0.7385472	test: 0.7879351	best: 0.7879351 (186)	total: 23.7s	remaining: 7m
187:	learn: 0.7380967	test: 0.7876134	best: 0.7876134 (187)	total: 23.8s	remaining: 7m
188:	learn: 0.7373793	test: 0.7870231	best: 0.7870231 (188)	total: 24s	remaining: 6m 59s
189:	learn: 0.7364180	test: 0.7863184	best: 0.7863184 (189)	total: 24.1s	remaining: 6m 59s
190:	learn: 0.7356752	test: 0.7857652	best: 0.7857652 (190)	total: 24.2s	remaining: 6m 59s
191:	learn: 0.7348372	test: 0.7851284	best: 0.7851284 (191)	total: 24.3s	remaining: 6m 59s
192:	learn: 0.7334532	test: 0.7840412	best: 0.7840412 (192)	total: 24.4s	remaining: 6m 58s
193:	learn: 0.7328157	test: 0.7834946	best: 0.7834946 (193)	total: 24.6s	remaining: 6m 58s
194:	learn: 0.7320541	test: 0.7829065	best: 0.7829065 (194)	total: 24.7s	remaining: 6m 58s
195:	learn: 0.7315513	test: 0.7825178	best: 0.7825178 (195)	total: 24.8s	remaining: 6m 58s
196:	learn: 0.7307002	test: 0.7819944	best: 0.7819944 (196)	total: 24.9s	remaining: 6m 57s
197:	lear

278:	learn: 0.6764161	test: 0.7438762	best: 0.7438762 (278)	total: 35s	remaining: 6m 43s
279:	learn: 0.6758504	test: 0.7435543	best: 0.7435543 (279)	total: 35.1s	remaining: 6m 43s
280:	learn: 0.6754399	test: 0.7432379	best: 0.7432379 (280)	total: 35.2s	remaining: 6m 43s
281:	learn: 0.6749555	test: 0.7428988	best: 0.7428988 (281)	total: 35.4s	remaining: 6m 43s
282:	learn: 0.6742319	test: 0.7424376	best: 0.7424376 (282)	total: 35.5s	remaining: 6m 43s
283:	learn: 0.6736366	test: 0.7419610	best: 0.7419610 (283)	total: 35.6s	remaining: 6m 43s
284:	learn: 0.6729206	test: 0.7414181	best: 0.7414181 (284)	total: 35.8s	remaining: 6m 43s
285:	learn: 0.6725683	test: 0.7411596	best: 0.7411596 (285)	total: 35.9s	remaining: 6m 43s
286:	learn: 0.6719978	test: 0.7406761	best: 0.7406761 (286)	total: 36s	remaining: 6m 43s
287:	learn: 0.6715580	test: 0.7403764	best: 0.7403764 (287)	total: 36.2s	remaining: 6m 43s
288:	learn: 0.6711631	test: 0.7401368	best: 0.7401368 (288)	total: 36.3s	remaining: 6m 43s
289

370:	learn: 0.6306458	test: 0.7132605	best: 0.7132605 (370)	total: 46.2s	remaining: 6m 29s
371:	learn: 0.6302408	test: 0.7130508	best: 0.7130508 (371)	total: 46.3s	remaining: 6m 29s
372:	learn: 0.6298964	test: 0.7128675	best: 0.7128675 (372)	total: 46.4s	remaining: 6m 29s
373:	learn: 0.6294693	test: 0.7125910	best: 0.7125910 (373)	total: 46.5s	remaining: 6m 28s
374:	learn: 0.6290739	test: 0.7122733	best: 0.7122733 (374)	total: 46.6s	remaining: 6m 28s
375:	learn: 0.6282645	test: 0.7116688	best: 0.7116688 (375)	total: 46.8s	remaining: 6m 28s
376:	learn: 0.6279478	test: 0.7115041	best: 0.7115041 (376)	total: 46.9s	remaining: 6m 28s
377:	learn: 0.6274938	test: 0.7111793	best: 0.7111793 (377)	total: 47s	remaining: 6m 28s
378:	learn: 0.6272189	test: 0.7110253	best: 0.7110253 (378)	total: 47.1s	remaining: 6m 27s
379:	learn: 0.6266846	test: 0.7104878	best: 0.7104878 (379)	total: 47.2s	remaining: 6m 27s
380:	learn: 0.6263740	test: 0.7101988	best: 0.7101988 (380)	total: 47.3s	remaining: 6m 27s
3

462:	learn: 0.5929428	test: 0.6887078	best: 0.6887078 (462)	total: 57.6s	remaining: 6m 17s
463:	learn: 0.5924256	test: 0.6884472	best: 0.6884472 (463)	total: 57.7s	remaining: 6m 17s
464:	learn: 0.5918588	test: 0.6880125	best: 0.6880125 (464)	total: 57.8s	remaining: 6m 17s
465:	learn: 0.5915669	test: 0.6878577	best: 0.6878577 (465)	total: 57.9s	remaining: 6m 17s
466:	learn: 0.5912966	test: 0.6876333	best: 0.6876333 (466)	total: 58s	remaining: 6m 16s
467:	learn: 0.5910091	test: 0.6874297	best: 0.6874297 (467)	total: 58.2s	remaining: 6m 16s
468:	learn: 0.5904540	test: 0.6871080	best: 0.6871080 (468)	total: 58.3s	remaining: 6m 16s
469:	learn: 0.5904042	test: 0.6870983	best: 0.6870983 (469)	total: 58.3s	remaining: 6m 16s
470:	learn: 0.5900970	test: 0.6868429	best: 0.6868429 (470)	total: 58.4s	remaining: 6m 15s
471:	learn: 0.5895009	test: 0.6863248	best: 0.6863248 (471)	total: 58.6s	remaining: 6m 15s
472:	learn: 0.5892515	test: 0.6861086	best: 0.6861086 (472)	total: 58.7s	remaining: 6m 15s
4

553:	learn: 0.5612946	test: 0.6686893	best: 0.6686893 (553)	total: 1m 8s	remaining: 6m 5s
554:	learn: 0.5610832	test: 0.6685596	best: 0.6685596 (554)	total: 1m 8s	remaining: 6m 5s
555:	learn: 0.5608530	test: 0.6683667	best: 0.6683667 (555)	total: 1m 8s	remaining: 6m 5s
556:	learn: 0.5603956	test: 0.6680499	best: 0.6680499 (556)	total: 1m 9s	remaining: 6m 5s
557:	learn: 0.5600102	test: 0.6678999	best: 0.6678999 (557)	total: 1m 9s	remaining: 6m 4s
558:	learn: 0.5598418	test: 0.6678289	best: 0.6678289 (558)	total: 1m 9s	remaining: 6m 4s
559:	learn: 0.5594889	test: 0.6676695	best: 0.6676695 (559)	total: 1m 9s	remaining: 6m 4s
560:	learn: 0.5592104	test: 0.6674962	best: 0.6674962 (560)	total: 1m 9s	remaining: 6m 4s
561:	learn: 0.5589034	test: 0.6673513	best: 0.6673513 (561)	total: 1m 9s	remaining: 6m 4s
562:	learn: 0.5587329	test: 0.6672847	best: 0.6672847 (562)	total: 1m 9s	remaining: 6m 4s
563:	learn: 0.5583598	test: 0.6669988	best: 0.6669988 (563)	total: 1m 9s	remaining: 6m 4s
564:	learn

643:	learn: 0.5364099	test: 0.6542720	best: 0.6542720 (643)	total: 1m 19s	remaining: 5m 52s
644:	learn: 0.5361128	test: 0.6541359	best: 0.6541359 (644)	total: 1m 19s	remaining: 5m 52s
645:	learn: 0.5357365	test: 0.6538919	best: 0.6538919 (645)	total: 1m 19s	remaining: 5m 52s
646:	learn: 0.5354977	test: 0.6537920	best: 0.6537920 (646)	total: 1m 19s	remaining: 5m 52s
647:	learn: 0.5350981	test: 0.6534905	best: 0.6534905 (647)	total: 1m 20s	remaining: 5m 52s
648:	learn: 0.5348381	test: 0.6533516	best: 0.6533516 (648)	total: 1m 20s	remaining: 5m 52s
649:	learn: 0.5345902	test: 0.6532768	best: 0.6532768 (649)	total: 1m 20s	remaining: 5m 51s
650:	learn: 0.5342904	test: 0.6531039	best: 0.6531039 (650)	total: 1m 20s	remaining: 5m 51s
651:	learn: 0.5338472	test: 0.6528024	best: 0.6528024 (651)	total: 1m 20s	remaining: 5m 51s
652:	learn: 0.5336648	test: 0.6527125	best: 0.6527125 (652)	total: 1m 20s	remaining: 5m 51s
653:	learn: 0.5334680	test: 0.6526629	best: 0.6526629 (653)	total: 1m 20s	remain

733:	learn: 0.5151655	test: 0.6424975	best: 0.6424975 (733)	total: 1m 30s	remaining: 5m 41s
734:	learn: 0.5149823	test: 0.6424365	best: 0.6424365 (734)	total: 1m 30s	remaining: 5m 41s
735:	learn: 0.5148581	test: 0.6423654	best: 0.6423654 (735)	total: 1m 30s	remaining: 5m 41s
736:	learn: 0.5144626	test: 0.6421409	best: 0.6421409 (736)	total: 1m 31s	remaining: 5m 41s
737:	learn: 0.5142913	test: 0.6420274	best: 0.6420274 (737)	total: 1m 31s	remaining: 5m 41s
738:	learn: 0.5140833	test: 0.6418460	best: 0.6418460 (738)	total: 1m 31s	remaining: 5m 40s
739:	learn: 0.5138693	test: 0.6416980	best: 0.6416980 (739)	total: 1m 31s	remaining: 5m 40s
740:	learn: 0.5137108	test: 0.6416719	best: 0.6416719 (740)	total: 1m 31s	remaining: 5m 40s
741:	learn: 0.5136295	test: 0.6416149	best: 0.6416149 (741)	total: 1m 31s	remaining: 5m 40s
742:	learn: 0.5134249	test: 0.6416180	best: 0.6416149 (741)	total: 1m 31s	remaining: 5m 40s
743:	learn: 0.5132453	test: 0.6415111	best: 0.6415111 (743)	total: 1m 31s	remain

823:	learn: 0.4963901	test: 0.6325873	best: 0.6325873 (823)	total: 1m 41s	remaining: 5m 30s
824:	learn: 0.4963013	test: 0.6325453	best: 0.6325453 (824)	total: 1m 41s	remaining: 5m 30s
825:	learn: 0.4961296	test: 0.6324269	best: 0.6324269 (825)	total: 1m 42s	remaining: 5m 30s
826:	learn: 0.4960086	test: 0.6323641	best: 0.6323641 (826)	total: 1m 42s	remaining: 5m 30s
827:	learn: 0.4959619	test: 0.6323733	best: 0.6323641 (826)	total: 1m 42s	remaining: 5m 30s
828:	learn: 0.4957809	test: 0.6322882	best: 0.6322882 (828)	total: 1m 42s	remaining: 5m 30s
829:	learn: 0.4956272	test: 0.6322435	best: 0.6322435 (829)	total: 1m 42s	remaining: 5m 29s
830:	learn: 0.4954834	test: 0.6321279	best: 0.6321279 (830)	total: 1m 42s	remaining: 5m 29s
831:	learn: 0.4952992	test: 0.6320787	best: 0.6320787 (831)	total: 1m 42s	remaining: 5m 29s
832:	learn: 0.4952205	test: 0.6320550	best: 0.6320550 (832)	total: 1m 42s	remaining: 5m 29s
833:	learn: 0.4948857	test: 0.6318926	best: 0.6318926 (833)	total: 1m 43s	remain

913:	learn: 0.4793599	test: 0.6236269	best: 0.6236269 (913)	total: 1m 52s	remaining: 5m 19s
914:	learn: 0.4791718	test: 0.6235654	best: 0.6235654 (914)	total: 1m 52s	remaining: 5m 18s
915:	learn: 0.4789442	test: 0.6234805	best: 0.6234805 (915)	total: 1m 53s	remaining: 5m 18s
916:	learn: 0.4786795	test: 0.6234073	best: 0.6234073 (916)	total: 1m 53s	remaining: 5m 18s
917:	learn: 0.4785264	test: 0.6233262	best: 0.6233262 (917)	total: 1m 53s	remaining: 5m 18s
918:	learn: 0.4784574	test: 0.6233002	best: 0.6233002 (918)	total: 1m 53s	remaining: 5m 18s
919:	learn: 0.4782375	test: 0.6232042	best: 0.6232042 (919)	total: 1m 53s	remaining: 5m 18s
920:	learn: 0.4780232	test: 0.6230671	best: 0.6230671 (920)	total: 1m 53s	remaining: 5m 18s
921:	learn: 0.4777518	test: 0.6229313	best: 0.6229313 (921)	total: 1m 53s	remaining: 5m 18s
922:	learn: 0.4776806	test: 0.6229246	best: 0.6229246 (922)	total: 1m 53s	remaining: 5m 18s
923:	learn: 0.4773287	test: 0.6227460	best: 0.6227460 (923)	total: 1m 54s	remain

1004:	learn: 0.4646069	test: 0.6164162	best: 0.6164162 (1004)	total: 2m 4s	remaining: 5m 7s
1005:	learn: 0.4642717	test: 0.6161476	best: 0.6161476 (1005)	total: 2m 4s	remaining: 5m 7s
1006:	learn: 0.4640409	test: 0.6160386	best: 0.6160386 (1006)	total: 2m 4s	remaining: 5m 7s
1007:	learn: 0.4638775	test: 0.6159495	best: 0.6159495 (1007)	total: 2m 4s	remaining: 5m 7s
1008:	learn: 0.4635658	test: 0.6158422	best: 0.6158422 (1008)	total: 2m 4s	remaining: 5m 7s
1009:	learn: 0.4634019	test: 0.6157816	best: 0.6157816 (1009)	total: 2m 4s	remaining: 5m 7s
1010:	learn: 0.4632291	test: 0.6157070	best: 0.6157070 (1010)	total: 2m 4s	remaining: 5m 7s
1011:	learn: 0.4631274	test: 0.6156480	best: 0.6156480 (1011)	total: 2m 4s	remaining: 5m 6s
1012:	learn: 0.4628190	test: 0.6154892	best: 0.6154892 (1012)	total: 2m 4s	remaining: 5m 6s
1013:	learn: 0.4626690	test: 0.6154061	best: 0.6154061 (1013)	total: 2m 5s	remaining: 5m 6s
1014:	learn: 0.4624927	test: 0.6153104	best: 0.6153104 (1014)	total: 2m 5s	remai

1094:	learn: 0.4497070	test: 0.6092109	best: 0.6092109 (1094)	total: 2m 15s	remaining: 4m 57s
1095:	learn: 0.4495158	test: 0.6091498	best: 0.6091498 (1095)	total: 2m 15s	remaining: 4m 56s
1096:	learn: 0.4493723	test: 0.6090721	best: 0.6090721 (1096)	total: 2m 15s	remaining: 4m 56s
1097:	learn: 0.4491913	test: 0.6089703	best: 0.6089703 (1097)	total: 2m 15s	remaining: 4m 56s
1098:	learn: 0.4490057	test: 0.6088330	best: 0.6088330 (1098)	total: 2m 15s	remaining: 4m 56s
1099:	learn: 0.4488515	test: 0.6087738	best: 0.6087738 (1099)	total: 2m 15s	remaining: 4m 56s
1100:	learn: 0.4486040	test: 0.6085968	best: 0.6085968 (1100)	total: 2m 15s	remaining: 4m 56s
1101:	learn: 0.4484575	test: 0.6084925	best: 0.6084925 (1101)	total: 2m 16s	remaining: 4m 56s
1102:	learn: 0.4483663	test: 0.6084417	best: 0.6084417 (1102)	total: 2m 16s	remaining: 4m 55s
1103:	learn: 0.4481939	test: 0.6082935	best: 0.6082935 (1103)	total: 2m 16s	remaining: 4m 55s
1104:	learn: 0.4480808	test: 0.6082074	best: 0.6082074 (1104

1182:	learn: 0.4365922	test: 0.6027828	best: 0.6027828 (1182)	total: 2m 26s	remaining: 4m 45s
1183:	learn: 0.4363913	test: 0.6027003	best: 0.6027003 (1183)	total: 2m 26s	remaining: 4m 45s
1184:	learn: 0.4362461	test: 0.6027244	best: 0.6027003 (1183)	total: 2m 26s	remaining: 4m 45s
1185:	learn: 0.4360625	test: 0.6026166	best: 0.6026166 (1185)	total: 2m 26s	remaining: 4m 45s
1186:	learn: 0.4359670	test: 0.6025593	best: 0.6025593 (1186)	total: 2m 26s	remaining: 4m 45s
1187:	learn: 0.4358415	test: 0.6024751	best: 0.6024751 (1187)	total: 2m 26s	remaining: 4m 45s
1188:	learn: 0.4356425	test: 0.6023559	best: 0.6023559 (1188)	total: 2m 26s	remaining: 4m 45s
1189:	learn: 0.4355255	test: 0.6022821	best: 0.6022821 (1189)	total: 2m 26s	remaining: 4m 45s
1190:	learn: 0.4354051	test: 0.6022937	best: 0.6022821 (1189)	total: 2m 27s	remaining: 4m 45s
1191:	learn: 0.4353363	test: 0.6022455	best: 0.6022455 (1191)	total: 2m 27s	remaining: 4m 45s
1192:	learn: 0.4351306	test: 0.6021718	best: 0.6021718 (1192

1270:	learn: 0.4248233	test: 0.5974203	best: 0.5974203 (1270)	total: 2m 36s	remaining: 4m 35s
1271:	learn: 0.4247706	test: 0.5973891	best: 0.5973891 (1271)	total: 2m 37s	remaining: 4m 35s
1272:	learn: 0.4245881	test: 0.5973134	best: 0.5973134 (1272)	total: 2m 37s	remaining: 4m 34s
1273:	learn: 0.4244515	test: 0.5972861	best: 0.5972861 (1273)	total: 2m 37s	remaining: 4m 34s
1274:	learn: 0.4243501	test: 0.5972482	best: 0.5972482 (1274)	total: 2m 37s	remaining: 4m 34s
1275:	learn: 0.4241623	test: 0.5972473	best: 0.5972473 (1275)	total: 2m 37s	remaining: 4m 34s
1276:	learn: 0.4240439	test: 0.5972169	best: 0.5972169 (1276)	total: 2m 37s	remaining: 4m 34s
1277:	learn: 0.4238877	test: 0.5971750	best: 0.5971750 (1277)	total: 2m 37s	remaining: 4m 34s
1278:	learn: 0.4238176	test: 0.5971351	best: 0.5971351 (1278)	total: 2m 37s	remaining: 4m 34s
1279:	learn: 0.4237641	test: 0.5971451	best: 0.5971351 (1278)	total: 2m 37s	remaining: 4m 34s
1280:	learn: 0.4236389	test: 0.5971104	best: 0.5971104 (1280

1358:	learn: 0.4139140	test: 0.5931864	best: 0.5931864 (1358)	total: 2m 47s	remaining: 4m 24s
1359:	learn: 0.4137589	test: 0.5930736	best: 0.5930736 (1359)	total: 2m 48s	remaining: 4m 24s
1360:	learn: 0.4136810	test: 0.5930578	best: 0.5930578 (1360)	total: 2m 48s	remaining: 4m 24s
1361:	learn: 0.4135776	test: 0.5929824	best: 0.5929824 (1361)	total: 2m 48s	remaining: 4m 24s
1362:	learn: 0.4134463	test: 0.5929459	best: 0.5929459 (1362)	total: 2m 48s	remaining: 4m 24s
1363:	learn: 0.4133306	test: 0.5928767	best: 0.5928767 (1363)	total: 2m 48s	remaining: 4m 23s
1364:	learn: 0.4132433	test: 0.5928238	best: 0.5928238 (1364)	total: 2m 48s	remaining: 4m 23s
1365:	learn: 0.4130798	test: 0.5928141	best: 0.5928141 (1365)	total: 2m 48s	remaining: 4m 23s
1366:	learn: 0.4130430	test: 0.5928221	best: 0.5928141 (1365)	total: 2m 48s	remaining: 4m 23s
1367:	learn: 0.4129348	test: 0.5927296	best: 0.5927296 (1367)	total: 2m 49s	remaining: 4m 23s
1368:	learn: 0.4127706	test: 0.5926160	best: 0.5926160 (1368

1447:	learn: 0.4030756	test: 0.5885734	best: 0.5885734 (1447)	total: 2m 59s	remaining: 4m 13s
1448:	learn: 0.4029883	test: 0.5885257	best: 0.5885257 (1448)	total: 2m 59s	remaining: 4m 13s
1449:	learn: 0.4028241	test: 0.5884764	best: 0.5884764 (1449)	total: 2m 59s	remaining: 4m 13s
1450:	learn: 0.4027667	test: 0.5884798	best: 0.5884764 (1449)	total: 2m 59s	remaining: 4m 13s
1451:	learn: 0.4026909	test: 0.5884648	best: 0.5884648 (1451)	total: 2m 59s	remaining: 4m 13s
1452:	learn: 0.4025596	test: 0.5883939	best: 0.5883939 (1452)	total: 2m 59s	remaining: 4m 13s
1453:	learn: 0.4024658	test: 0.5883559	best: 0.5883559 (1453)	total: 2m 59s	remaining: 4m 13s
1454:	learn: 0.4023590	test: 0.5883055	best: 0.5883055 (1454)	total: 3m	remaining: 4m 13s
1455:	learn: 0.4021592	test: 0.5882899	best: 0.5882899 (1455)	total: 3m	remaining: 4m 12s
1456:	learn: 0.4019259	test: 0.5882687	best: 0.5882687 (1456)	total: 3m	remaining: 4m 12s
1457:	learn: 0.4018045	test: 0.5882444	best: 0.5882444 (1457)	total: 3m	

1536:	learn: 0.3923247	test: 0.5846319	best: 0.5846319 (1536)	total: 3m 10s	remaining: 4m 2s
1537:	learn: 0.3922834	test: 0.5846453	best: 0.5846319 (1536)	total: 3m 10s	remaining: 4m 2s
1538:	learn: 0.3921211	test: 0.5846201	best: 0.5846201 (1538)	total: 3m 10s	remaining: 4m 2s
1539:	learn: 0.3920339	test: 0.5845960	best: 0.5845960 (1539)	total: 3m 10s	remaining: 4m 2s
1540:	learn: 0.3918763	test: 0.5845202	best: 0.5845202 (1540)	total: 3m 10s	remaining: 4m 2s
1541:	learn: 0.3918205	test: 0.5844988	best: 0.5844988 (1541)	total: 3m 10s	remaining: 4m 2s
1542:	learn: 0.3917483	test: 0.5844920	best: 0.5844920 (1542)	total: 3m 10s	remaining: 4m 2s
1543:	learn: 0.3916942	test: 0.5844999	best: 0.5844920 (1542)	total: 3m 10s	remaining: 4m 1s
1544:	learn: 0.3914858	test: 0.5843667	best: 0.5843667 (1544)	total: 3m 11s	remaining: 4m 1s
1545:	learn: 0.3914464	test: 0.5843636	best: 0.5843636 (1545)	total: 3m 11s	remaining: 4m 1s
1546:	learn: 0.3914021	test: 0.5843280	best: 0.5843280 (1546)	total: 3

1624:	learn: 0.3838994	test: 0.5815706	best: 0.5815706 (1624)	total: 3m 21s	remaining: 3m 52s
1625:	learn: 0.3837311	test: 0.5814875	best: 0.5814875 (1625)	total: 3m 21s	remaining: 3m 51s
1626:	learn: 0.3836503	test: 0.5814560	best: 0.5814560 (1626)	total: 3m 21s	remaining: 3m 51s
1627:	learn: 0.3835213	test: 0.5813841	best: 0.5813841 (1627)	total: 3m 21s	remaining: 3m 51s
1628:	learn: 0.3834472	test: 0.5813760	best: 0.5813760 (1628)	total: 3m 21s	remaining: 3m 51s
1629:	learn: 0.3833720	test: 0.5813234	best: 0.5813234 (1629)	total: 3m 21s	remaining: 3m 51s
1630:	learn: 0.3833281	test: 0.5813110	best: 0.5813110 (1630)	total: 3m 21s	remaining: 3m 51s
1631:	learn: 0.3833012	test: 0.5812942	best: 0.5812942 (1631)	total: 3m 22s	remaining: 3m 51s
1632:	learn: 0.3832150	test: 0.5812983	best: 0.5812942 (1631)	total: 3m 22s	remaining: 3m 51s
1633:	learn: 0.3831843	test: 0.5813055	best: 0.5812942 (1631)	total: 3m 22s	remaining: 3m 50s
1634:	learn: 0.3831030	test: 0.5812449	best: 0.5812449 (1634

1712:	learn: 0.3756797	test: 0.5784434	best: 0.5784434 (1712)	total: 3m 32s	remaining: 3m 41s
1713:	learn: 0.3756285	test: 0.5784282	best: 0.5784282 (1713)	total: 3m 32s	remaining: 3m 41s
1714:	learn: 0.3755706	test: 0.5784119	best: 0.5784119 (1714)	total: 3m 32s	remaining: 3m 41s
1715:	learn: 0.3755051	test: 0.5783816	best: 0.5783816 (1715)	total: 3m 32s	remaining: 3m 40s
1716:	learn: 0.3754354	test: 0.5783714	best: 0.5783714 (1716)	total: 3m 32s	remaining: 3m 40s
1717:	learn: 0.3753436	test: 0.5783438	best: 0.5783438 (1717)	total: 3m 32s	remaining: 3m 40s
1718:	learn: 0.3752842	test: 0.5783228	best: 0.5783228 (1718)	total: 3m 32s	remaining: 3m 40s
1719:	learn: 0.3751288	test: 0.5782905	best: 0.5782905 (1719)	total: 3m 33s	remaining: 3m 40s
1720:	learn: 0.3751008	test: 0.5783064	best: 0.5782905 (1719)	total: 3m 33s	remaining: 3m 40s
1721:	learn: 0.3750472	test: 0.5783129	best: 0.5782905 (1719)	total: 3m 33s	remaining: 3m 40s
1722:	learn: 0.3749847	test: 0.5783095	best: 0.5782905 (1719

1800:	learn: 0.3678796	test: 0.5755706	best: 0.5755706 (1800)	total: 3m 42s	remaining: 3m 30s
1801:	learn: 0.3678144	test: 0.5755417	best: 0.5755417 (1801)	total: 3m 43s	remaining: 3m 30s
1802:	learn: 0.3677800	test: 0.5755464	best: 0.5755417 (1801)	total: 3m 43s	remaining: 3m 30s
1803:	learn: 0.3676362	test: 0.5755305	best: 0.5755305 (1803)	total: 3m 43s	remaining: 3m 29s
1804:	learn: 0.3675063	test: 0.5754848	best: 0.5754848 (1804)	total: 3m 43s	remaining: 3m 29s
1805:	learn: 0.3674725	test: 0.5754937	best: 0.5754848 (1804)	total: 3m 43s	remaining: 3m 29s
1806:	learn: 0.3674089	test: 0.5754901	best: 0.5754848 (1804)	total: 3m 43s	remaining: 3m 29s
1807:	learn: 0.3673722	test: 0.5754936	best: 0.5754848 (1804)	total: 3m 43s	remaining: 3m 29s
1808:	learn: 0.3673234	test: 0.5754903	best: 0.5754848 (1804)	total: 3m 44s	remaining: 3m 29s
1809:	learn: 0.3672336	test: 0.5754565	best: 0.5754565 (1809)	total: 3m 44s	remaining: 3m 29s
1810:	learn: 0.3671859	test: 0.5754486	best: 0.5754486 (1810

1888:	learn: 0.3604722	test: 0.5730575	best: 0.5730575 (1888)	total: 3m 54s	remaining: 3m 19s
1889:	learn: 0.3604242	test: 0.5730773	best: 0.5730575 (1888)	total: 3m 54s	remaining: 3m 19s
1890:	learn: 0.3603587	test: 0.5730820	best: 0.5730575 (1888)	total: 3m 54s	remaining: 3m 19s
1891:	learn: 0.3602194	test: 0.5730090	best: 0.5730090 (1891)	total: 3m 54s	remaining: 3m 19s
1892:	learn: 0.3601721	test: 0.5729750	best: 0.5729750 (1892)	total: 3m 54s	remaining: 3m 19s
1893:	learn: 0.3601631	test: 0.5729711	best: 0.5729711 (1893)	total: 3m 54s	remaining: 3m 18s
1894:	learn: 0.3601517	test: 0.5729730	best: 0.5729711 (1893)	total: 3m 54s	remaining: 3m 18s
1895:	learn: 0.3601000	test: 0.5729811	best: 0.5729711 (1893)	total: 3m 54s	remaining: 3m 18s
1896:	learn: 0.3600113	test: 0.5729422	best: 0.5729422 (1896)	total: 3m 55s	remaining: 3m 18s
1897:	learn: 0.3599549	test: 0.5729350	best: 0.5729350 (1897)	total: 3m 55s	remaining: 3m 18s
1898:	learn: 0.3599087	test: 0.5729169	best: 0.5729169 (1898

1976:	learn: 0.3536221	test: 0.5707750	best: 0.5707670 (1975)	total: 4m 5s	remaining: 3m 8s
1977:	learn: 0.3535579	test: 0.5707451	best: 0.5707451 (1977)	total: 4m 5s	remaining: 3m 8s
1978:	learn: 0.3534910	test: 0.5707369	best: 0.5707369 (1978)	total: 4m 5s	remaining: 3m 8s
1979:	learn: 0.3534121	test: 0.5706893	best: 0.5706893 (1979)	total: 4m 5s	remaining: 3m 8s
1980:	learn: 0.3533504	test: 0.5706872	best: 0.5706872 (1980)	total: 4m 5s	remaining: 3m 8s
1981:	learn: 0.3532074	test: 0.5706798	best: 0.5706798 (1981)	total: 4m 5s	remaining: 3m 8s
1982:	learn: 0.3531430	test: 0.5706718	best: 0.5706718 (1982)	total: 4m 5s	remaining: 3m 8s
1983:	learn: 0.3530373	test: 0.5706331	best: 0.5706331 (1983)	total: 4m 6s	remaining: 3m 7s
1984:	learn: 0.3529346	test: 0.5705746	best: 0.5705746 (1984)	total: 4m 6s	remaining: 3m 7s
1985:	learn: 0.3529067	test: 0.5705431	best: 0.5705431 (1985)	total: 4m 6s	remaining: 3m 7s
1986:	learn: 0.3528806	test: 0.5705322	best: 0.5705322 (1986)	total: 4m 6s	remai

2065:	learn: 0.3464773	test: 0.5685777	best: 0.5685744 (2064)	total: 4m 16s	remaining: 2m 57s
2066:	learn: 0.3464336	test: 0.5685965	best: 0.5685744 (2064)	total: 4m 16s	remaining: 2m 57s
2067:	learn: 0.3463559	test: 0.5686254	best: 0.5685744 (2064)	total: 4m 16s	remaining: 2m 57s
2068:	learn: 0.3463370	test: 0.5686223	best: 0.5685744 (2064)	total: 4m 16s	remaining: 2m 57s
2069:	learn: 0.3463125	test: 0.5686261	best: 0.5685744 (2064)	total: 4m 16s	remaining: 2m 57s
2070:	learn: 0.3462571	test: 0.5685942	best: 0.5685744 (2064)	total: 4m 16s	remaining: 2m 57s
2071:	learn: 0.3461251	test: 0.5685355	best: 0.5685355 (2071)	total: 4m 16s	remaining: 2m 57s
2072:	learn: 0.3460707	test: 0.5685208	best: 0.5685208 (2072)	total: 4m 17s	remaining: 2m 56s
2073:	learn: 0.3460160	test: 0.5684951	best: 0.5684951 (2073)	total: 4m 17s	remaining: 2m 56s
2074:	learn: 0.3459517	test: 0.5684799	best: 0.5684799 (2074)	total: 4m 17s	remaining: 2m 56s
2075:	learn: 0.3459222	test: 0.5684684	best: 0.5684684 (2075

2153:	learn: 0.3402201	test: 0.5666683	best: 0.5666683 (2153)	total: 4m 27s	remaining: 2m 47s
2154:	learn: 0.3401789	test: 0.5666572	best: 0.5666572 (2154)	total: 4m 27s	remaining: 2m 47s
2155:	learn: 0.3401710	test: 0.5666734	best: 0.5666572 (2154)	total: 4m 28s	remaining: 2m 47s
2156:	learn: 0.3401170	test: 0.5666306	best: 0.5666306 (2156)	total: 4m 28s	remaining: 2m 46s
2157:	learn: 0.3400179	test: 0.5665980	best: 0.5665980 (2157)	total: 4m 28s	remaining: 2m 46s
2158:	learn: 0.3399494	test: 0.5666155	best: 0.5665980 (2157)	total: 4m 28s	remaining: 2m 46s
2159:	learn: 0.3398693	test: 0.5665365	best: 0.5665365 (2159)	total: 4m 28s	remaining: 2m 46s
2160:	learn: 0.3397456	test: 0.5664601	best: 0.5664601 (2160)	total: 4m 28s	remaining: 2m 46s
2161:	learn: 0.3397272	test: 0.5664717	best: 0.5664601 (2160)	total: 4m 28s	remaining: 2m 46s
2162:	learn: 0.3396363	test: 0.5664013	best: 0.5664013 (2162)	total: 4m 28s	remaining: 2m 46s
2163:	learn: 0.3395745	test: 0.5663891	best: 0.5663891 (2163

2242:	learn: 0.3347933	test: 0.5648659	best: 0.5648523 (2241)	total: 4m 38s	remaining: 2m 36s
2243:	learn: 0.3347135	test: 0.5648446	best: 0.5648446 (2243)	total: 4m 39s	remaining: 2m 36s
2244:	learn: 0.3346896	test: 0.5648509	best: 0.5648446 (2243)	total: 4m 39s	remaining: 2m 36s
2245:	learn: 0.3345805	test: 0.5647560	best: 0.5647560 (2245)	total: 4m 39s	remaining: 2m 35s
2246:	learn: 0.3345403	test: 0.5647643	best: 0.5647560 (2245)	total: 4m 39s	remaining: 2m 35s
2247:	learn: 0.3344763	test: 0.5647580	best: 0.5647560 (2245)	total: 4m 39s	remaining: 2m 35s
2248:	learn: 0.3344614	test: 0.5647624	best: 0.5647560 (2245)	total: 4m 39s	remaining: 2m 35s
2249:	learn: 0.3343667	test: 0.5647086	best: 0.5647086 (2249)	total: 4m 39s	remaining: 2m 35s
2250:	learn: 0.3342580	test: 0.5646563	best: 0.5646563 (2250)	total: 4m 39s	remaining: 2m 35s
2251:	learn: 0.3341654	test: 0.5646638	best: 0.5646563 (2250)	total: 4m 40s	remaining: 2m 35s
2252:	learn: 0.3340886	test: 0.5646236	best: 0.5646236 (2252

2330:	learn: 0.3293501	test: 0.5630643	best: 0.5630643 (2330)	total: 4m 49s	remaining: 2m 25s
2331:	learn: 0.3293248	test: 0.5630721	best: 0.5630643 (2330)	total: 4m 50s	remaining: 2m 25s
2332:	learn: 0.3292437	test: 0.5630727	best: 0.5630643 (2330)	total: 4m 50s	remaining: 2m 25s
2333:	learn: 0.3291861	test: 0.5631064	best: 0.5630643 (2330)	total: 4m 50s	remaining: 2m 25s
2334:	learn: 0.3290965	test: 0.5630656	best: 0.5630643 (2330)	total: 4m 50s	remaining: 2m 24s
2335:	learn: 0.3290103	test: 0.5630635	best: 0.5630635 (2335)	total: 4m 50s	remaining: 2m 24s
2336:	learn: 0.3289763	test: 0.5630607	best: 0.5630607 (2336)	total: 4m 50s	remaining: 2m 24s
2337:	learn: 0.3289424	test: 0.5630348	best: 0.5630348 (2337)	total: 4m 50s	remaining: 2m 24s
2338:	learn: 0.3288796	test: 0.5629889	best: 0.5629889 (2338)	total: 4m 51s	remaining: 2m 24s
2339:	learn: 0.3288527	test: 0.5630025	best: 0.5629889 (2338)	total: 4m 51s	remaining: 2m 24s
2340:	learn: 0.3287951	test: 0.5630239	best: 0.5629889 (2338

2418:	learn: 0.3242395	test: 0.5618320	best: 0.5618320 (2418)	total: 5m	remaining: 2m 14s
2419:	learn: 0.3241368	test: 0.5618445	best: 0.5618320 (2418)	total: 5m 1s	remaining: 2m 14s
2420:	learn: 0.3241047	test: 0.5618308	best: 0.5618308 (2420)	total: 5m 1s	remaining: 2m 14s
2421:	learn: 0.3240389	test: 0.5617890	best: 0.5617890 (2421)	total: 5m 1s	remaining: 2m 14s
2422:	learn: 0.3239357	test: 0.5617459	best: 0.5617459 (2422)	total: 5m 1s	remaining: 2m 13s
2423:	learn: 0.3239247	test: 0.5617645	best: 0.5617459 (2422)	total: 5m 1s	remaining: 2m 13s
2424:	learn: 0.3238945	test: 0.5617771	best: 0.5617459 (2422)	total: 5m 1s	remaining: 2m 13s
2425:	learn: 0.3238329	test: 0.5617733	best: 0.5617459 (2422)	total: 5m 1s	remaining: 2m 13s
2426:	learn: 0.3237162	test: 0.5616986	best: 0.5616986 (2426)	total: 5m 1s	remaining: 2m 13s
2427:	learn: 0.3236784	test: 0.5616863	best: 0.5616863 (2427)	total: 5m 2s	remaining: 2m 13s
2428:	learn: 0.3236255	test: 0.5616864	best: 0.5616863 (2427)	total: 5m 2

2508:	learn: 0.3190132	test: 0.5605049	best: 0.5604911 (2506)	total: 5m 12s	remaining: 2m 3s
2509:	learn: 0.3189151	test: 0.5605146	best: 0.5604911 (2506)	total: 5m 12s	remaining: 2m 3s
2510:	learn: 0.3188275	test: 0.5604605	best: 0.5604605 (2510)	total: 5m 12s	remaining: 2m 3s
2511:	learn: 0.3187801	test: 0.5604474	best: 0.5604474 (2511)	total: 5m 12s	remaining: 2m 3s
2512:	learn: 0.3187424	test: 0.5604369	best: 0.5604369 (2512)	total: 5m 12s	remaining: 2m 2s
2513:	learn: 0.3187021	test: 0.5604112	best: 0.5604112 (2513)	total: 5m 12s	remaining: 2m 2s
2514:	learn: 0.3186917	test: 0.5604125	best: 0.5604112 (2513)	total: 5m 13s	remaining: 2m 2s
2515:	learn: 0.3185942	test: 0.5603961	best: 0.5603961 (2515)	total: 5m 13s	remaining: 2m 2s
2516:	learn: 0.3185228	test: 0.5603600	best: 0.5603600 (2516)	total: 5m 13s	remaining: 2m 2s
2517:	learn: 0.3184694	test: 0.5603581	best: 0.5603581 (2517)	total: 5m 13s	remaining: 2m 2s
2518:	learn: 0.3184236	test: 0.5603280	best: 0.5603280 (2518)	total: 5

2597:	learn: 0.3136927	test: 0.5590140	best: 0.5590030 (2596)	total: 5m 23s	remaining: 1m 52s
2598:	learn: 0.3135752	test: 0.5589466	best: 0.5589466 (2598)	total: 5m 23s	remaining: 1m 52s
2599:	learn: 0.3135556	test: 0.5589362	best: 0.5589362 (2599)	total: 5m 23s	remaining: 1m 52s
2600:	learn: 0.3135459	test: 0.5589410	best: 0.5589362 (2599)	total: 5m 23s	remaining: 1m 51s
2601:	learn: 0.3135073	test: 0.5589328	best: 0.5589328 (2601)	total: 5m 24s	remaining: 1m 51s
2602:	learn: 0.3135025	test: 0.5589401	best: 0.5589328 (2601)	total: 5m 24s	remaining: 1m 51s
2603:	learn: 0.3134164	test: 0.5589149	best: 0.5589149 (2603)	total: 5m 24s	remaining: 1m 51s
2604:	learn: 0.3133167	test: 0.5588833	best: 0.5588833 (2604)	total: 5m 24s	remaining: 1m 51s
2605:	learn: 0.3132332	test: 0.5589109	best: 0.5588833 (2604)	total: 5m 24s	remaining: 1m 51s
2606:	learn: 0.3131412	test: 0.5589138	best: 0.5588833 (2604)	total: 5m 24s	remaining: 1m 51s
2607:	learn: 0.3130568	test: 0.5588915	best: 0.5588833 (2604

2685:	learn: 0.3091172	test: 0.5578635	best: 0.5578367 (2683)	total: 5m 34s	remaining: 1m 41s
2686:	learn: 0.3091044	test: 0.5578676	best: 0.5578367 (2683)	total: 5m 34s	remaining: 1m 41s
2687:	learn: 0.3090709	test: 0.5578658	best: 0.5578367 (2683)	total: 5m 34s	remaining: 1m 41s
2688:	learn: 0.3089269	test: 0.5578750	best: 0.5578367 (2683)	total: 5m 34s	remaining: 1m 40s
2689:	learn: 0.3088136	test: 0.5578506	best: 0.5578367 (2683)	total: 5m 34s	remaining: 1m 40s
2690:	learn: 0.3087777	test: 0.5578484	best: 0.5578367 (2683)	total: 5m 35s	remaining: 1m 40s
2691:	learn: 0.3087513	test: 0.5578405	best: 0.5578367 (2683)	total: 5m 35s	remaining: 1m 40s
2692:	learn: 0.3085737	test: 0.5578298	best: 0.5578298 (2692)	total: 5m 35s	remaining: 1m 40s
2693:	learn: 0.3084386	test: 0.5577434	best: 0.5577434 (2693)	total: 5m 35s	remaining: 1m 40s
2694:	learn: 0.3083933	test: 0.5577444	best: 0.5577434 (2693)	total: 5m 35s	remaining: 1m 40s
2695:	learn: 0.3083714	test: 0.5577465	best: 0.5577434 (2693

2774:	learn: 0.3042624	test: 0.5567905	best: 0.5567759 (2773)	total: 5m 45s	remaining: 1m 30s
2775:	learn: 0.3041905	test: 0.5567927	best: 0.5567759 (2773)	total: 5m 45s	remaining: 1m 30s
2776:	learn: 0.3041577	test: 0.5567564	best: 0.5567564 (2776)	total: 5m 45s	remaining: 1m 30s
2777:	learn: 0.3041119	test: 0.5567396	best: 0.5567396 (2777)	total: 5m 46s	remaining: 1m 29s
2778:	learn: 0.3040561	test: 0.5567291	best: 0.5567291 (2778)	total: 5m 46s	remaining: 1m 29s
2779:	learn: 0.3039985	test: 0.5566788	best: 0.5566788 (2779)	total: 5m 46s	remaining: 1m 29s
2780:	learn: 0.3039947	test: 0.5566911	best: 0.5566788 (2779)	total: 5m 46s	remaining: 1m 29s
2781:	learn: 0.3039767	test: 0.5567011	best: 0.5566788 (2779)	total: 5m 46s	remaining: 1m 29s
2782:	learn: 0.3039192	test: 0.5566904	best: 0.5566788 (2779)	total: 5m 46s	remaining: 1m 29s
2783:	learn: 0.3038581	test: 0.5566810	best: 0.5566788 (2779)	total: 5m 46s	remaining: 1m 29s
2784:	learn: 0.3038566	test: 0.5566845	best: 0.5566788 (2779

2863:	learn: 0.3004635	test: 0.5561687	best: 0.5561595 (2862)	total: 5m 57s	remaining: 1m 19s
2864:	learn: 0.3004156	test: 0.5561814	best: 0.5561595 (2862)	total: 5m 57s	remaining: 1m 19s
2865:	learn: 0.3003785	test: 0.5561712	best: 0.5561595 (2862)	total: 5m 57s	remaining: 1m 19s
2866:	learn: 0.3003425	test: 0.5561457	best: 0.5561457 (2866)	total: 5m 57s	remaining: 1m 18s
2867:	learn: 0.3003049	test: 0.5561275	best: 0.5561275 (2867)	total: 5m 57s	remaining: 1m 18s
2868:	learn: 0.3002735	test: 0.5561108	best: 0.5561108 (2868)	total: 5m 57s	remaining: 1m 18s
2869:	learn: 0.3002068	test: 0.5560818	best: 0.5560818 (2869)	total: 5m 57s	remaining: 1m 18s
2870:	learn: 0.3001968	test: 0.5560830	best: 0.5560818 (2869)	total: 5m 58s	remaining: 1m 18s
2871:	learn: 0.3001229	test: 0.5560500	best: 0.5560500 (2871)	total: 5m 58s	remaining: 1m 18s
2872:	learn: 0.3000950	test: 0.5560472	best: 0.5560472 (2872)	total: 5m 58s	remaining: 1m 18s
2873:	learn: 0.3000555	test: 0.5560266	best: 0.5560266 (2873

2952:	learn: 0.2965562	test: 0.5549412	best: 0.5549412 (2952)	total: 6m 8s	remaining: 1m 8s
2953:	learn: 0.2965409	test: 0.5549492	best: 0.5549412 (2952)	total: 6m 8s	remaining: 1m 8s
2954:	learn: 0.2965043	test: 0.5549669	best: 0.5549412 (2952)	total: 6m 8s	remaining: 1m 7s
2955:	learn: 0.2965010	test: 0.5549742	best: 0.5549412 (2952)	total: 6m 8s	remaining: 1m 7s
2956:	learn: 0.2964524	test: 0.5549503	best: 0.5549412 (2952)	total: 6m 8s	remaining: 1m 7s
2957:	learn: 0.2964450	test: 0.5549631	best: 0.5549412 (2952)	total: 6m 8s	remaining: 1m 7s
2958:	learn: 0.2964092	test: 0.5549680	best: 0.5549412 (2952)	total: 6m 8s	remaining: 1m 7s
2959:	learn: 0.2963872	test: 0.5549461	best: 0.5549412 (2952)	total: 6m 9s	remaining: 1m 7s
2960:	learn: 0.2963082	test: 0.5549601	best: 0.5549412 (2952)	total: 6m 9s	remaining: 1m 7s
2961:	learn: 0.2962999	test: 0.5549694	best: 0.5549412 (2952)	total: 6m 9s	remaining: 1m 7s
2962:	learn: 0.2962930	test: 0.5549852	best: 0.5549412 (2952)	total: 6m 9s	remai

3042:	learn: 0.2930504	test: 0.5543577	best: 0.5543577 (3042)	total: 6m 19s	remaining: 57s
3043:	learn: 0.2930163	test: 0.5543355	best: 0.5543355 (3043)	total: 6m 19s	remaining: 56.9s
3044:	learn: 0.2929548	test: 0.5543123	best: 0.5543123 (3044)	total: 6m 19s	remaining: 56.7s
3045:	learn: 0.2929444	test: 0.5543050	best: 0.5543050 (3045)	total: 6m 19s	remaining: 56.6s
3046:	learn: 0.2928914	test: 0.5542431	best: 0.5542431 (3046)	total: 6m 20s	remaining: 56.5s
3047:	learn: 0.2928217	test: 0.5542368	best: 0.5542368 (3047)	total: 6m 20s	remaining: 56.4s
3048:	learn: 0.2928012	test: 0.5542495	best: 0.5542368 (3047)	total: 6m 20s	remaining: 56.3s
3049:	learn: 0.2927849	test: 0.5542489	best: 0.5542368 (3047)	total: 6m 20s	remaining: 56.1s
3050:	learn: 0.2926913	test: 0.5542424	best: 0.5542368 (3047)	total: 6m 20s	remaining: 56s
3051:	learn: 0.2926595	test: 0.5542467	best: 0.5542368 (3047)	total: 6m 20s	remaining: 55.9s
3052:	learn: 0.2926581	test: 0.5542461	best: 0.5542368 (3047)	total: 6m 20

3132:	learn: 0.2900586	test: 0.5535272	best: 0.5535159 (3130)	total: 6m 30s	remaining: 45.8s
3133:	learn: 0.2900546	test: 0.5535257	best: 0.5535159 (3130)	total: 6m 31s	remaining: 45.7s
3134:	learn: 0.2899899	test: 0.5535100	best: 0.5535100 (3134)	total: 6m 31s	remaining: 45.5s
3135:	learn: 0.2899752	test: 0.5535037	best: 0.5535037 (3135)	total: 6m 31s	remaining: 45.4s
3136:	learn: 0.2899414	test: 0.5534977	best: 0.5534977 (3136)	total: 6m 31s	remaining: 45.3s
3137:	learn: 0.2899086	test: 0.5535107	best: 0.5534977 (3136)	total: 6m 31s	remaining: 45.2s
3138:	learn: 0.2898615	test: 0.5534778	best: 0.5534778 (3138)	total: 6m 31s	remaining: 45s
3139:	learn: 0.2898083	test: 0.5534404	best: 0.5534404 (3139)	total: 6m 31s	remaining: 44.9s
3140:	learn: 0.2897874	test: 0.5534546	best: 0.5534404 (3139)	total: 6m 31s	remaining: 44.8s
3141:	learn: 0.2897654	test: 0.5534612	best: 0.5534404 (3139)	total: 6m 32s	remaining: 44.7s
3142:	learn: 0.2897267	test: 0.5534576	best: 0.5534404 (3139)	total: 6m 

3222:	learn: 0.2865598	test: 0.5527496	best: 0.5526898 (3220)	total: 6m 42s	remaining: 34.6s
3223:	learn: 0.2864891	test: 0.5527235	best: 0.5526898 (3220)	total: 6m 42s	remaining: 34.4s
3224:	learn: 0.2864725	test: 0.5527265	best: 0.5526898 (3220)	total: 6m 42s	remaining: 34.3s
3225:	learn: 0.2864204	test: 0.5527158	best: 0.5526898 (3220)	total: 6m 42s	remaining: 34.2s
3226:	learn: 0.2864139	test: 0.5527060	best: 0.5526898 (3220)	total: 6m 42s	remaining: 34.1s
3227:	learn: 0.2863734	test: 0.5527166	best: 0.5526898 (3220)	total: 6m 42s	remaining: 33.9s
3228:	learn: 0.2863117	test: 0.5527014	best: 0.5526898 (3220)	total: 6m 43s	remaining: 33.8s
3229:	learn: 0.2862384	test: 0.5526771	best: 0.5526771 (3229)	total: 6m 43s	remaining: 33.7s
3230:	learn: 0.2861899	test: 0.5526848	best: 0.5526771 (3229)	total: 6m 43s	remaining: 33.6s
3231:	learn: 0.2861520	test: 0.5526673	best: 0.5526673 (3231)	total: 6m 43s	remaining: 33.5s
3232:	learn: 0.2861203	test: 0.5526626	best: 0.5526626 (3232)	total: 6

3312:	learn: 0.2833309	test: 0.5521123	best: 0.5521123 (3312)	total: 6m 53s	remaining: 23.3s
3313:	learn: 0.2833301	test: 0.5521139	best: 0.5521123 (3312)	total: 6m 53s	remaining: 23.2s
3314:	learn: 0.2833141	test: 0.5521143	best: 0.5521123 (3312)	total: 6m 53s	remaining: 23.1s
3315:	learn: 0.2832832	test: 0.5521313	best: 0.5521123 (3312)	total: 6m 53s	remaining: 23s
3316:	learn: 0.2832659	test: 0.5521429	best: 0.5521123 (3312)	total: 6m 54s	remaining: 22.8s
3317:	learn: 0.2832550	test: 0.5521370	best: 0.5521123 (3312)	total: 6m 54s	remaining: 22.7s
3318:	learn: 0.2831789	test: 0.5521439	best: 0.5521123 (3312)	total: 6m 54s	remaining: 22.6s
3319:	learn: 0.2831660	test: 0.5521516	best: 0.5521123 (3312)	total: 6m 54s	remaining: 22.5s
3320:	learn: 0.2831351	test: 0.5521482	best: 0.5521123 (3312)	total: 6m 54s	remaining: 22.3s
3321:	learn: 0.2831220	test: 0.5521589	best: 0.5521123 (3312)	total: 6m 54s	remaining: 22.2s
3322:	learn: 0.2831053	test: 0.5521568	best: 0.5521123 (3312)	total: 6m 

3403:	learn: 0.2804645	test: 0.5515680	best: 0.5515676 (3401)	total: 7m 5s	remaining: 12s
3404:	learn: 0.2804426	test: 0.5515591	best: 0.5515591 (3404)	total: 7m 5s	remaining: 11.9s
3405:	learn: 0.2803754	test: 0.5515258	best: 0.5515258 (3405)	total: 7m 5s	remaining: 11.7s
3406:	learn: 0.2803733	test: 0.5515269	best: 0.5515258 (3405)	total: 7m 5s	remaining: 11.6s
3407:	learn: 0.2803717	test: 0.5515267	best: 0.5515258 (3405)	total: 7m 5s	remaining: 11.5s
3408:	learn: 0.2803428	test: 0.5515225	best: 0.5515225 (3408)	total: 7m 5s	remaining: 11.4s
3409:	learn: 0.2803264	test: 0.5515158	best: 0.5515158 (3409)	total: 7m 5s	remaining: 11.2s
3410:	learn: 0.2803247	test: 0.5515166	best: 0.5515158 (3409)	total: 7m 6s	remaining: 11.1s
3411:	learn: 0.2803079	test: 0.5515164	best: 0.5515158 (3409)	total: 7m 6s	remaining: 11s
3412:	learn: 0.2803031	test: 0.5515254	best: 0.5515158 (3409)	total: 7m 6s	remaining: 10.9s
3413:	learn: 0.2802820	test: 0.5515263	best: 0.5515158 (3409)	total: 7m 6s	remaining

3492:	learn: 0.2779517	test: 0.5512390	best: 0.5511596 (3471)	total: 7m 16s	remaining: 875ms
3493:	learn: 0.2779468	test: 0.5512471	best: 0.5511596 (3471)	total: 7m 16s	remaining: 750ms
3494:	learn: 0.2779038	test: 0.5512442	best: 0.5511596 (3471)	total: 7m 16s	remaining: 625ms
3495:	learn: 0.2778549	test: 0.5512625	best: 0.5511596 (3471)	total: 7m 16s	remaining: 500ms
3496:	learn: 0.2778339	test: 0.5512561	best: 0.5511596 (3471)	total: 7m 16s	remaining: 375ms
3497:	learn: 0.2778196	test: 0.5512669	best: 0.5511596 (3471)	total: 7m 17s	remaining: 250ms
3498:	learn: 0.2777994	test: 0.5512572	best: 0.5511596 (3471)	total: 7m 17s	remaining: 125ms
3499:	learn: 0.2777804	test: 0.5512447	best: 0.5511596 (3471)	total: 7m 17s	remaining: 0us

bestTest = 0.5511596327
bestIteration = 3471

Shrink model to first 3472 iterations.


<catboost.core.CatBoostClassifier at 0x2224a344910>

In [8]:
env = gym.make("ALE/MsPacman-ram-v5", render_mode="rgb_array")

observations = []

observation, info = env.reset()
observation, reward, terminated, truncated, info = env.step(0)



while not terminated and not truncated:
    action = model.predict(observation)[0]
    observation, reward, terminated, truncated, info = env.step(action)
    observations.append(env.render())

  logger.warn(


In [9]:
video = np.array(observations)
figure = plt.figure()
images = plt.imshow(video[0, :, :, :])
plt.close()

def init():
    images.set_data(video[0, :, :, :])

def animate(i):
    images.set_data(video[i, :, :, :])
    return images

html_video = animation.FuncAnimation(figure, animate, 
                                     init_func=init, 
                                     frames=video.shape[0], 
                                     interval=50).to_html5_video()
display.HTML(html_video)