In [1]:
import numpy as np
import keras
import pickle
import zarr
import keras.backend as K
from keras.models import Model
from keras.layers import Input, Dense, Conv2D, Flatten, BatchNormalization, Activation
from keras import optimizers
from keras.callbacks import ModelCheckpoint
from keras.layers import *


class RL_Datapoint():
    def __init__(self, state, policy, values):
        self.state = state
        self.policy = policy
        self.values = values
        
def __read_file_data(ID, path='dataset/'):
    dataset = zarr.group(store=zarr.ZipStore(path + str(ID) +'.zip', mode="r"))
    X = np.array(dataset['states'])
    policies = np.array(dataset['policies'])
    values = np.array(dataset['values'])
    return X,policies,values

def __read_files_data(IDs, path='dataset/'):
    X = np.array([])
    for ID in IDs:
        if X.size==0:
            X, policies, values = __read_file_data(ID, path)
            values = np.array(values)
        else:
            X_ID, policies_ID, values_ID = __read_file_data(ID, path)
            X = np.concatenate((X,X_ID))
            policies = np.concatenate((policies, policies_ID))
            values = np.concatenate((values,np.array(values_ID)))
    return X,policies,values
        
    
    
def generator(batch_size, datasetFileIds, path='dataset/'):
    while True:
        np.random.shuffle(datasetFileIds)

        for file_step, file_id in enumerate(datasetFileIds): 
            X, policies, values = __read_file_data(file_id,path)
#             X = np.rollaxis(X, 1,4).shape
            rand_indices = np.arange(len(X))
            np.random.shuffle(rand_indices)

            for i in range(int(len(X)/batch_size)):
                batch_indices = rand_indices[i*batch_size: (i+1)*batch_size]
                yield X[batch_indices],[policies[batch_indices],values[batch_indices]]
                
def validation_generator(batch_size, datasetFileIds, path='dataset/'):
    while True:
        np.random.shuffle(datasetFileIds)

        for file_step, file_id in enumerate(datasetFileIds): 
            X, policies, values = __read_file_data(file_id,path)
#             X = np.rollaxis(X, 1,4).shape
            rand_indices = np.arange(len(X))
            np.random.shuffle(rand_indices)

            for i in range(int(len(X)/batch_size)):
                batch_indices = rand_indices[i*batch_size: (i+1)*batch_size]
                yield X[batch_indices],[policies[batch_indices],values[batch_indices]]
                
def plotHistory( history):
    import matplotlib.pyplot as plt

    val_loss = history.history['val_loss']
    val_policy_loss = history.history['val_policy_loss']
    val_value_loss = history.history['val_value_loss']
    loss = history.history['loss']
    policy_loss = history.history['policy_loss']
    value_loss = history.history['value_loss']
    
    epochs = range(1,len(loss) + 1)

    # fig, ax = plt.subplots(nrows=2, ncols=2)
    fig = plt.figure()

    plt.subplot(2, 2, 1)
    plt.plot(epochs,loss,'bo',label='loss')
    plt.plot(epochs,val_loss,'b',label='val_loss')
    plt.title = 'Training and validation loss'
    plt.legend()

    plt.subplot(2, 2, 2)
    plt.plot(epochs,policy_loss,'bo',label='policy_loss')
    plt.plot(epochs,val_policy_loss,'b',label='val_policy_loss')
    plt.title = 'Training and validation policy loss'
    plt.legend()        

    plt.subplot(2, 2, 3)
    plt.plot(epochs,value_loss,'bo',label='value_loss')
    plt.plot(epochs,val_value_loss,'b',label='val_value_loss')
    plt.title = 'Training and validation value loss'
    plt.legend()
    plt.show()
    
def acc_sign(y_true, y_pred):
    return K.mean(K.equal(K.sign(y_pred), K.sign(y_true)), axis=-1)


def acc_round(y_true, y_pred):
    # each interval for class -1, 0, 1 must have a width of 2/3 to be equally distributed
    # therefore you must convert (1/3) to (1/2) and only then round to the closest integer
    # 1/3 * x = 1/2
    return K.mean(K.equal(K.round(y_pred * 1.5), K.round(y_true)), axis=-1)

def acc_reg(y_true,y_pred):
    return K.constant(1) - K.square(K.mean((y_pred-y_true), axis=1))

def acc_round_unequal(y_true,y_pred):
    return K.mean(K.equal(K.round(y_true),K.round(y_pred)), axis=-1)

Using TensorFlow backend.


In [87]:
x, p, v = __read_files_data([0,1],dataset_path)
print(x.shape, p.shape, v.shape)
print(x.nbytes/1024/1024,'MB')

(20000, 60, 8, 8) (20000, 2272) (20000, 1)
585.9375 MB


In [2]:
def getResidualNetwork(input_shape, output_value=1, output_policy=2272):
    
    channel_pos = 'channels_first'
    inp_shape = Input(input_shape,name='input1')
    x = Conv2D(256, kernel_size=(3,3), padding = 'same', input_shape=input_shape,data_format=channel_pos,name='conv2d_Prep')(inp_shape)
    x = BatchNormalization(axis=1,name='batch_normalization_prep')(x)
    x_a1 = Activation('relu',name='activation_prep')(x)
    activated_x = x_a1
    
#     activated_x, x
    def createResidualBlock(block_nr, activated_x):
        nr = block_nr *2 -1
        x = Conv2D(256, kernel_size=(3,3), name = 'conv2d_'+str(nr), padding='same',data_format=channel_pos)(activated_x)
        x = BatchNormalization(axis=1, name = 'batch_normalization_'+str(nr))(x)
        x = Activation('relu',name = 'activation_'+str(nr))(x)
        x = Conv2D(256, kernel_size=(3,3), name = 'conv2d_'+str(nr+1),padding = 'same',data_format=channel_pos)(x)
        x = BatchNormalization(axis=1, name = 'batch_normalization_'+str(nr+1))(x)
        x = keras.layers.add([x,activated_x],name='add_' + str(block_nr))
        activated_x = Activation('relu',name='activation_'+str(nr+1))(x)
        return activated_x
    
    # build eight residual blocks
    for i in range (1,8):
        activated_x = createResidualBlock(i, activated_x)
        

    
    # Value header
    x = Conv2D(4, kernel_size=(1,1),name='value_conv2d', padding = 'same',data_format=channel_pos)(activated_x)
    xb = BatchNormalization(axis=1,name='value_batch_normalization')(x)
    xA = Activation('relu',name='value_activation')(xb)
    xF = Flatten(name='value_flatten')(xA)
    dense_1 = Dense(256, activation='relu',name='value_dense')(xF)
    value = Dense(output_value, activation='tanh', name='value')(dense_1)

    # Policy Header
    xConv = Conv2D(8, kernel_size=(7,7), padding = 'same',name='policy_conv2d',data_format=channel_pos)(activated_x)
    xb = BatchNormalization(axis=1,name='policy_batch_normalization')(xConv)
    xA = Activation('relu',name='policy_activation')(xb)
    xF = Flatten(name='policy_flatten')(xA)
    policy = Dense(output_policy, activation='softmax', name='policy')(xF)


    from keras.models import Model
    model = Model(inp_shape, [policy,value])

    model.summary()
    return model


<h3>NN Architecture: ResNet</h3>

<h3>Main Parameters of the NN</h3>

In [3]:
# ----------- parameters ----------------
files_len = 1000                                # amount of zip files
file_id_start = 0
file_ids = np.arange(file_id_start,files_len)               
# np.random.shuffle(file_ids)
train_ids = file_ids[:int(len(file_ids)*0.9)] # file_ids for training set
val_ids = file_ids[int(len(file_ids)*0.9):]   # file_ids for validation set 
filepath="models/model-{epoch:02d}.hdf5"      # path to save model
zip_length = 10000                            # amount of datapoints in a zip file
data_len = files_len * zip_length             # whole amount of datapoints in all zip files
batch_size = 256                              # batch size
steps_per_epoch = int((len(train_ids)*zip_length)/batch_size) # amount of batches in one epoch
CLASSES_LEN = 2272                            # amount of classes for policy
channel_pos = 'channels_last'          
dataset_path = 'dataset/'                     # relative directory to the dataset
inp_shape = (60,8,8)                          # shape of a datapoint
val_id = files_len -1 
x_val, policies_val, values_val = __read_file_data(6000,path=dataset_path)
print('train_ids:',np.min(train_ids),' - ', np.max(train_ids))
print('val_ids:',np.min(val_ids),' - ', np.max(val_ids))
print('x_val:', x_val.shape)

train_ids: 0  -  899
val_ids: 900  -  999
x_val: (10000, 60, 8, 8)


In [59]:
np.concatenate((x_val,x_val)).shape

(20000, 60, 8, 8)

In [97]:
def evaluate_model(model, file_ids, dataset_path):
    x_val, policies_val, values_val = __read_files_data(file_ids,path=dataset_path)
    print(model.metrics_names)
    print(model.evaluate(x_val,[policies_val,values_val]))

evaluate_model(model,[6001,6002,6003],dataset_path)

['loss', 'policy_loss', 'value_loss', 'policy_acc', 'value_acc_round', 'value_acc_sign']
[1.095079911295573, 1.8439676438967387, 0.8454506663044293, 0.5189, 0.23126666666666668, 0.5441666666666667]


In [94]:
x_val, policies_val, values_val = __read_files_data([6001],path=dataset_path)
print(x_val.shape,policies_val.shape)

(10000, 60, 8, 8) (10000, 2272)


<h3>Build the model</h3>

In [4]:
model = getResidualNetwork(inp_shape, output_policy=CLASSES_LEN)
sgd = optimizers.SGD(lr=0.000, momentum=0.9, decay=0.0, nesterov=False)

model.compile(loss={'policy':'categorical_crossentropy',
                    'value':'mean_squared_error'}, optimizer=sgd,
              metrics={'policy':'accuracy', 'value':[acc_round, acc_sign]}, loss_weights=[0.25,0.75])

Instructions for updating:
Colocations handled automatically by placer.
__________________________________________________________________________________________________
Layer (type)                    Output Shape         Param #     Connected to                     
input1 (InputLayer)             (None, 60, 8, 8)     0                                            
__________________________________________________________________________________________________
conv2d_Prep (Conv2D)            (None, 256, 8, 8)    138496      input1[0][0]                     
__________________________________________________________________________________________________
batch_normalization_prep (Batch (None, 256, 8, 8)    1024        conv2d_Prep[0][0]                
__________________________________________________________________________________________________
activation_prep (Activation)    (None, 256, 8, 8)    0           batch_normalization_prep[0][0]   
_____________________________________

In [5]:
model.load_weights('finalModel/model-05.hdf5')

In [6]:
model.evaluate(x_val,[policies_val,values_val],verbose=True)

UnknownError: Failed to get convolution algorithm. This is probably because cuDNN failed to initialize, so try looking to see if a warning log message was printed above.
	 [[{{node conv2d_Prep/convolution}}]]
	 [[{{node loss/add}}]]

In [98]:
x_val[0].shape

(60, 8, 8)

In [102]:
np.expand_dims(x_val[0],0).shape

(1, 60, 8, 8)

In [108]:
board = x_val[0][np.newaxis, :, :]
board.shape

(1, 60, 8, 8)

In [7]:
data = np.load('data.npy')

In [8]:
model.predict(data)

UnknownError: Failed to get convolution algorithm. This is probably because cuDNN failed to initialize, so try looking to see if a warning log message was printed above.
	 [[{{node conv2d_Prep/convolution}}]]
	 [[{{node policy/Softmax}}]]

In [107]:
model.predict(x_test)

[array([[8.0579248e-08, 1.4189803e-07, 1.6486984e-08, ..., 1.7541266e-08,
         9.9875290e-09, 1.2479663e-08]], dtype=float32),
 array([[0.07075516]], dtype=float32)]

<h3>Define callbacks</h3>

<h4>Callback for checkpoint and tensorboard</h4>

In [34]:
# callbacks 
from datetime import datetime
checkpoint = ModelCheckpoint(filepath, monitor='val_loss', verbose=1, save_best_only=True, save_weights_only=False, mode='auto', period=1)
logdir="logs/scalars/" + datetime.now().strftime("%Y%m%d-%H%M%S")
tensorboard_callback = keras.callbacks.TensorBoard(log_dir=logdir, update_freq='batch')

<h4>Callback for Learning rate</h4>

In [35]:
# learning rate
from  LearningRateScheduler import *
epochs = 5
batch_len = epochs * int(data_len/ (batch_size))
max_lr = 0.001*8
total_it = batch_len
min_lr = 0.0001
print('BatchLen: ', batch_len, ' - DataLen: ', data_len)
lr_schedule = OneCycleSchedule(start_lr=max_lr/8, max_lr=max_lr, cycle_length=total_it*.4, cooldown_length=total_it*.6, finish_lr=min_lr)
scheduler = LinearWarmUp(lr_schedule, start_lr=min_lr, length=total_it/30)
bt = BatchLearningRateScheduler(scheduler)

BatchLen:  195310  - DataLen:  10000000


In [36]:
callbacks_list = [checkpoint,tensorboard_callback,bt]
# callbacks_list = [checkpoint,bt]


In [37]:
from keras import backend
backend.set_image_dim_ordering('th')
print(backend.image_data_format())

channels_first


In [38]:
# model.save('models\\BughouseNet220620190437.h5')
history = model.fit_generator(generator(batch_size,train_ids,path=dataset_path), 
                                steps_per_epoch=int((len(train_ids)*zip_length)/batch_size), callbacks=callbacks_list,
                                epochs=epochs, validation_data=(x_val, [policies_val,values_val]))


Epoch 1/5
    3/35156 [..............................] - ETA: 10:55:13 - loss: 2.7828 - policy_loss: 7.8073 - value_loss: 1.1080 - policy_acc: 0.0000e+00 - value_acc_round: 0.3138 - value_acc_sign: 0.5234

  % delta_t_median)



Epoch 00001: val_loss improved from inf to 1.34624, saving model to models/model-01.hdf5
Epoch:  1  - lr: 0.006133369  - batch: 0  - epoch:  1
Epoch 2/5

Epoch 00002: val_loss improved from 1.34624 to 1.14354, saving model to models/model-02.hdf5
Epoch:  2  - lr: 0.003566595  - batch: 1  - epoch:  2
Epoch 3/5

Epoch 00003: val_loss improved from 1.14354 to 1.02987, saving model to models/model-03.hdf5
Epoch:  3  - lr: 0.0008399954  - batch: 2  - epoch:  3
Epoch 4/5

Epoch 00004: val_loss did not improve from 1.02987
Epoch:  4  - lr: 0.00056999386  - batch: 3  - epoch:  4
Epoch 5/5

Epoch 00005: val_loss did not improve from 1.02987
Epoch:  5  - lr: 0.00029999233  - batch: 4  - epoch:  5


In [39]:
model.save('models\\FinalModel05072019.h5')


In [None]:
# model.save('models\\BughouseNet220620190437.h5')
history = model.fit_generator(generator(batch_size,train_ids,path=dataset_path), steps_per_epoch=int((len(train_ids)*zip_length)/batch_size), callbacks=callbacks_list,
                    epochs=epochs, validation_data=(x_val, [policies_val,values_val]))


Instructions for updating:
Use tf.cast instead.
Epoch 1/5
    3/35156 [..............................] - ETA: 11:05:33 - loss: 2.6790 - policy_loss: 8.3141 - value_loss: 0.8006 - policy_acc: 0.0052 - value_acc_round: 0.0951

  % delta_t_median)


    4/35156 [..............................] - ETA: 9:23:09 - loss: 2.6764 - policy_loss: 8.3132 - value_loss: 0.7974 - policy_acc: 0.0059 - value_acc_round: 0.0957 

  % delta_t_median)


    5/35156 [..............................] - ETA: 7:55:19 - loss: 2.6645 - policy_loss: 8.2937 - value_loss: 0.7881 - policy_acc: 0.0055 - value_acc_round: 0.1055

  % delta_t_median)


   28/35156 [..............................] - ETA: 3:32:39 - loss: 2.6667 - policy_loss: 8.3003 - value_loss: 0.7888 - policy_acc: 0.0052 - value_acc_round: 0.1095

  % delta_t_median)


   31/35156 [..............................] - ETA: 3:25:03 - loss: 2.6594 - policy_loss: 8.2765 - value_loss: 0.7870 - policy_acc: 0.0058 - value_acc_round: 0.1081

  % delta_t_median)


  201/35156 [..............................] - ETA: 2:52:52 - loss: 2.5030 - policy_loss: 7.7552 - value_loss: 0.7523 - policy_acc: 0.0350 - value_acc_round: 0.1096

  % delta_t_median)


  202/35156 [..............................] - ETA: 2:53:16 - loss: 2.5026 - policy_loss: 7.7540 - value_loss: 0.7522 - policy_acc: 0.0350 - value_acc_round: 0.1096

  % delta_t_median)


  203/35156 [..............................] - ETA: 2:53:08 - loss: 2.5020 - policy_loss: 7.7523 - value_loss: 0.7519 - policy_acc: 0.0352 - value_acc_round: 0.1096

  % delta_t_median)


  204/35156 [..............................] - ETA: 2:53:32 - loss: 2.5018 - policy_loss: 7.7509 - value_loss: 0.7521 - policy_acc: 0.0353 - value_acc_round: 0.1095

  % delta_t_median)


  208/35156 [..............................] - ETA: 2:53:55 - loss: 2.4988 - policy_loss: 7.7409 - value_loss: 0.7514 - policy_acc: 0.0361 - value_acc_round: 0.1098

  % delta_t_median)


  210/35156 [..............................] - ETA: 2:54:01 - loss: 2.4978 - policy_loss: 7.7378 - value_loss: 0.7511 - policy_acc: 0.0362 - value_acc_round: 0.1100

  % delta_t_median)


  212/35156 [..............................] - ETA: 2:54:14 - loss: 2.4961 - policy_loss: 7.7320 - value_loss: 0.7508 - policy_acc: 0.0367 - value_acc_round: 0.1102

  % delta_t_median)


  213/35156 [..............................] - ETA: 2:54:00 - loss: 2.4958 - policy_loss: 7.7308 - value_loss: 0.7508 - policy_acc: 0.0368 - value_acc_round: 0.1102

  % delta_t_median)


  257/35156 [..............................] - ETA: 2:55:28 - loss: 2.4681 - policy_loss: 7.6274 - value_loss: 0.7483 - policy_acc: 0.0431 - value_acc_round: 0.1097

  % delta_t_median)


  258/35156 [..............................] - ETA: 2:55:40 - loss: 2.4674 - policy_loss: 7.6241 - value_loss: 0.7485 - policy_acc: 0.0433 - value_acc_round: 0.1097

  % delta_t_median)


  259/35156 [..............................] - ETA: 2:56:01 - loss: 2.4670 - policy_loss: 7.6228 - value_loss: 0.7484 - policy_acc: 0.0434 - value_acc_round: 0.1097

  % delta_t_median)


  264/35156 [..............................] - ETA: 2:55:30 - loss: 2.4647 - policy_loss: 7.6129 - value_loss: 0.7486 - policy_acc: 0.0440 - value_acc_round: 0.1093

  % delta_t_median)


  334/35156 [..............................] - ETA: 2:51:26 - loss: 2.4208 - policy_loss: 7.4375 - value_loss: 0.7485 - policy_acc: 0.0548 - value_acc_round: 0.1082

  % delta_t_median)


  340/35156 [..............................] - ETA: 2:51:18 - loss: 2.4171 - policy_loss: 7.4220 - value_loss: 0.7489 - policy_acc: 0.0555 - value_acc_round: 0.1080

  % delta_t_median)


  408/35156 [..............................] - ETA: 2:50:30 - loss: 2.3859 - policy_loss: 7.2956 - value_loss: 0.7493 - policy_acc: 0.0618 - value_acc_round: 0.1038

  % delta_t_median)


  409/35156 [..............................] - ETA: 2:50:41 - loss: 2.3855 - policy_loss: 7.2942 - value_loss: 0.7493 - policy_acc: 0.0619 - value_acc_round: 0.1037

  % delta_t_median)


  431/35156 [..............................] - ETA: 2:49:46 - loss: 2.3759 - policy_loss: 7.2546 - value_loss: 0.7496 - policy_acc: 0.0638 - value_acc_round: 0.1021

  % delta_t_median)


  432/35156 [..............................] - ETA: 2:50:01 - loss: 2.3754 - policy_loss: 7.2523 - value_loss: 0.7498 - policy_acc: 0.0639 - value_acc_round: 0.1020

  % delta_t_median)


  433/35156 [..............................] - ETA: 2:49:55 - loss: 2.3748 - policy_loss: 7.2497 - value_loss: 0.7498 - policy_acc: 0.0640 - value_acc_round: 0.1019

  % delta_t_median)


  476/35156 [..............................] - ETA: 2:48:54 - loss: 2.3539 - policy_loss: 7.1609 - value_loss: 0.7516 - policy_acc: 0.0685 - value_acc_round: 0.0982

  % delta_t_median)


  477/35156 [..............................] - ETA: 2:49:03 - loss: 2.3534 - policy_loss: 7.1589 - value_loss: 0.7516 - policy_acc: 0.0686 - value_acc_round: 0.0982

  % delta_t_median)


  562/35156 [..............................] - ETA: 2:47:21 - loss: 2.3187 - policy_loss: 7.0180 - value_loss: 0.7523 - policy_acc: 0.0764 - value_acc_round: 0.0923

  % delta_t_median)


  564/35156 [..............................] - ETA: 2:47:22 - loss: 2.3180 - policy_loss: 7.0149 - value_loss: 0.7523 - policy_acc: 0.0766 - value_acc_round: 0.0921

  % delta_t_median)


  567/35156 [..............................] - ETA: 2:47:07 - loss: 2.3170 - policy_loss: 7.0104 - value_loss: 0.7525 - policy_acc: 0.0769 - value_acc_round: 0.0918

  % delta_t_median)


  718/35156 [..............................] - ETA: 2:44:38 - loss: 2.2599 - policy_loss: 6.7859 - value_loss: 0.7512 - policy_acc: 0.0888 - value_acc_round: 0.0822

  % delta_t_median)


  720/35156 [..............................] - ETA: 2:44:39 - loss: 2.2591 - policy_loss: 6.7828 - value_loss: 0.7512 - policy_acc: 0.0891 - value_acc_round: 0.0822

  % delta_t_median)


  723/35156 [..............................] - ETA: 2:44:49 - loss: 2.2579 - policy_loss: 6.7781 - value_loss: 0.7511 - policy_acc: 0.0893 - value_acc_round: 0.0820

  % delta_t_median)


  729/35156 [..............................] - ETA: 2:44:49 - loss: 2.2556 - policy_loss: 6.7695 - value_loss: 0.7509 - policy_acc: 0.0898 - value_acc_round: 0.0819

  % delta_t_median)


  863/35156 [..............................] - ETA: 2:42:57 - loss: 2.2152 - policy_loss: 6.6113 - value_loss: 0.7498 - policy_acc: 0.0986 - value_acc_round: 0.0779

  % delta_t_median)


  864/35156 [..............................] - ETA: 2:42:55 - loss: 2.2150 - policy_loss: 6.6104 - value_loss: 0.7498 - policy_acc: 0.0986 - value_acc_round: 0.0779

  % delta_t_median)


  902/35156 [..............................] - ETA: 2:42:25 - loss: 2.2038 - policy_loss: 6.5689 - value_loss: 0.7488 - policy_acc: 0.1011 - value_acc_round: 0.0777

  % delta_t_median)


  917/35156 [..............................] - ETA: 2:42:36 - loss: 2.2005 - policy_loss: 6.5549 - value_loss: 0.7490 - policy_acc: 0.1018 - value_acc_round: 0.0772

  % delta_t_median)


  918/35156 [..............................] - ETA: 2:42:33 - loss: 2.2003 - policy_loss: 6.5540 - value_loss: 0.7490 - policy_acc: 0.1019 - value_acc_round: 0.0772

  % delta_t_median)


  919/35156 [..............................] - ETA: 2:42:40 - loss: 2.2001 - policy_loss: 6.5532 - value_loss: 0.7491 - policy_acc: 0.1019 - value_acc_round: 0.0772

  % delta_t_median)


  920/35156 [..............................] - ETA: 2:42:45 - loss: 2.1999 - policy_loss: 6.5522 - value_loss: 0.7492 - policy_acc: 0.1020 - value_acc_round: 0.0771

  % delta_t_median)


  921/35156 [..............................] - ETA: 2:42:42 - loss: 2.1997 - policy_loss: 6.5513 - value_loss: 0.7491 - policy_acc: 0.1020 - value_acc_round: 0.0771

  % delta_t_median)


  923/35156 [..............................] - ETA: 2:42:44 - loss: 2.1992 - policy_loss: 6.5492 - value_loss: 0.7492 - policy_acc: 0.1021 - value_acc_round: 0.0770

  % delta_t_median)


  924/35156 [..............................] - ETA: 2:42:49 - loss: 2.1990 - policy_loss: 6.5484 - value_loss: 0.7492 - policy_acc: 0.1022 - value_acc_round: 0.0770

  % delta_t_median)


  925/35156 [..............................] - ETA: 2:42:54 - loss: 2.1988 - policy_loss: 6.5475 - value_loss: 0.7492 - policy_acc: 0.1022 - value_acc_round: 0.0770

  % delta_t_median)


  926/35156 [..............................] - ETA: 2:42:52 - loss: 2.1985 - policy_loss: 6.5461 - value_loss: 0.7493 - policy_acc: 0.1023 - value_acc_round: 0.0769

  % delta_t_median)


  927/35156 [..............................] - ETA: 2:42:49 - loss: 2.1983 - policy_loss: 6.5454 - value_loss: 0.7493 - policy_acc: 0.1024 - value_acc_round: 0.0769

  % delta_t_median)


  928/35156 [..............................] - ETA: 2:42:47 - loss: 2.1980 - policy_loss: 6.5442 - value_loss: 0.7493 - policy_acc: 0.1024 - value_acc_round: 0.0768

  % delta_t_median)


  942/35156 [..............................] - ETA: 2:42:48 - loss: 2.1942 - policy_loss: 6.5295 - value_loss: 0.7491 - policy_acc: 0.1033 - value_acc_round: 0.0767

  % delta_t_median)


  944/35156 [..............................] - ETA: 2:42:42 - loss: 2.1937 - policy_loss: 6.5275 - value_loss: 0.7491 - policy_acc: 0.1034 - value_acc_round: 0.0767

  % delta_t_median)


  965/35156 [..............................] - ETA: 2:42:33 - loss: 2.1879 - policy_loss: 6.5074 - value_loss: 0.7480 - policy_acc: 0.1046 - value_acc_round: 0.0770

  % delta_t_median)


  967/35156 [..............................] - ETA: 2:42:37 - loss: 2.1874 - policy_loss: 6.5059 - value_loss: 0.7479 - policy_acc: 0.1046 - value_acc_round: 0.0770

  % delta_t_median)


 1096/35156 [..............................] - ETA: 2:40:57 - loss: 2.1623 - policy_loss: 6.4079 - value_loss: 0.7471 - policy_acc: 0.1095 - value_acc_round: 0.0769

  % delta_t_median)


 1099/35156 [..............................] - ETA: 2:41:04 - loss: 2.1617 - policy_loss: 6.4057 - value_loss: 0.7471 - policy_acc: 0.1095 - value_acc_round: 0.0769

  % delta_t_median)


 1101/35156 [..............................] - ETA: 2:41:06 - loss: 2.1614 - policy_loss: 6.4042 - value_loss: 0.7471 - policy_acc: 0.1096 - value_acc_round: 0.0769

  % delta_t_median)


 1102/35156 [..............................] - ETA: 2:41:04 - loss: 2.1613 - policy_loss: 6.4037 - value_loss: 0.7471 - policy_acc: 0.1096 - value_acc_round: 0.0769

  % delta_t_median)


 1104/35156 [..............................] - ETA: 2:41:00 - loss: 2.1609 - policy_loss: 6.4024 - value_loss: 0.7471 - policy_acc: 0.1097 - value_acc_round: 0.0768

  % delta_t_median)


 1132/35156 [..............................] - ETA: 2:40:45 - loss: 2.1551 - policy_loss: 6.3786 - value_loss: 0.7473 - policy_acc: 0.1112 - value_acc_round: 0.0768

  % delta_t_median)


 1164/35156 [..............................] - ETA: 2:40:37 - loss: 2.1486 - policy_loss: 6.3536 - value_loss: 0.7469 - policy_acc: 0.1128 - value_acc_round: 0.0767

  % delta_t_median)


 1165/35156 [..............................] - ETA: 2:40:40 - loss: 2.1484 - policy_loss: 6.3530 - value_loss: 0.7469 - policy_acc: 0.1128 - value_acc_round: 0.0767

  % delta_t_median)


 1167/35156 [..............................] - ETA: 2:40:36 - loss: 2.1480 - policy_loss: 6.3514 - value_loss: 0.7469 - policy_acc: 0.1129 - value_acc_round: 0.0767

  % delta_t_median)


 1169/35156 [..............................] - ETA: 2:40:38 - loss: 2.1476 - policy_loss: 6.3498 - value_loss: 0.7469 - policy_acc: 0.1131 - value_acc_round: 0.0767

  % delta_t_median)


 1235/35156 [>.............................] - ETA: 2:39:45 - loss: 2.1349 - policy_loss: 6.3002 - value_loss: 0.7465 - policy_acc: 0.1161 - value_acc_round: 0.0767

  % delta_t_median)


 1238/35156 [>.............................] - ETA: 2:39:45 - loss: 2.1342 - policy_loss: 6.2978 - value_loss: 0.7464 - policy_acc: 0.1162 - value_acc_round: 0.0767

  % delta_t_median)


 1291/35156 [>.............................] - ETA: 2:39:31 - loss: 2.1245 - policy_loss: 6.2603 - value_loss: 0.7459 - policy_acc: 0.1186 - value_acc_round: 0.0770

  % delta_t_median)


 1293/35156 [>.............................] - ETA: 2:39:34 - loss: 2.1242 - policy_loss: 6.2590 - value_loss: 0.7460 - policy_acc: 0.1187 - value_acc_round: 0.0770

  % delta_t_median)


 1295/35156 [>.............................] - ETA: 2:39:35 - loss: 2.1240 - policy_loss: 6.2578 - value_loss: 0.7460 - policy_acc: 0.1187 - value_acc_round: 0.0770

  % delta_t_median)


 1296/35156 [>.............................] - ETA: 2:39:32 - loss: 2.1238 - policy_loss: 6.2571 - value_loss: 0.7461 - policy_acc: 0.1187 - value_acc_round: 0.0770

  % delta_t_median)


 1300/35156 [>.............................] - ETA: 2:39:36 - loss: 2.1233 - policy_loss: 6.2543 - value_loss: 0.7463 - policy_acc: 0.1189 - value_acc_round: 0.0770

  % delta_t_median)


 1330/35156 [>.............................] - ETA: 2:39:19 - loss: 2.1190 - policy_loss: 6.2341 - value_loss: 0.7472 - policy_acc: 0.1201 - value_acc_round: 0.0768

  % delta_t_median)


 1331/35156 [>.............................] - ETA: 2:39:22 - loss: 2.1187 - policy_loss: 6.2333 - value_loss: 0.7472 - policy_acc: 0.1201 - value_acc_round: 0.0768

  % delta_t_median)


 1333/35156 [>.............................] - ETA: 2:39:24 - loss: 2.1184 - policy_loss: 6.2319 - value_loss: 0.7472 - policy_acc: 0.1202 - value_acc_round: 0.0769

  % delta_t_median)


 1335/35156 [>.............................] - ETA: 2:39:26 - loss: 2.1180 - policy_loss: 6.2304 - value_loss: 0.7472 - policy_acc: 0.1203 - value_acc_round: 0.0769

  % delta_t_median)


 1337/35156 [>.............................] - ETA: 2:39:22 - loss: 2.1176 - policy_loss: 6.2287 - value_loss: 0.7472 - policy_acc: 0.1205 - value_acc_round: 0.0769

  % delta_t_median)


 1364/35156 [>.............................] - ETA: 2:39:11 - loss: 2.1123 - policy_loss: 6.2087 - value_loss: 0.7468 - policy_acc: 0.1219 - value_acc_round: 0.0771

  % delta_t_median)


 1432/35156 [>.............................] - ETA: 2:38:26 - loss: 2.1023 - policy_loss: 6.1716 - value_loss: 0.7459 - policy_acc: 0.1240 - value_acc_round: 0.0769

  % delta_t_median)


 1433/35156 [>.............................] - ETA: 2:38:30 - loss: 2.1021 - policy_loss: 6.1711 - value_loss: 0.7458 - policy_acc: 0.1240 - value_acc_round: 0.0769

  % delta_t_median)


 1438/35156 [>.............................] - ETA: 2:38:27 - loss: 2.1013 - policy_loss: 6.1686 - value_loss: 0.7456 - policy_acc: 0.1242 - value_acc_round: 0.0769

  % delta_t_median)


 1452/35156 [>.............................] - ETA: 2:38:26 - loss: 2.0994 - policy_loss: 6.1621 - value_loss: 0.7451 - policy_acc: 0.1245 - value_acc_round: 0.0772

  % delta_t_median)


 1492/35156 [>.............................] - ETA: 2:37:29 - loss: 2.0941 - policy_loss: 6.1413 - value_loss: 0.7450 - policy_acc: 0.1258 - value_acc_round: 0.0776

  % delta_t_median)


 1498/35156 [>.............................] - ETA: 2:37:28 - loss: 2.0932 - policy_loss: 6.1374 - value_loss: 0.7451 - policy_acc: 0.1261 - value_acc_round: 0.0777

  % delta_t_median)


 1797/35156 [>.............................] - ETA: 2:30:53 - loss: 2.0546 - policy_loss: 5.9887 - value_loss: 0.7433 - policy_acc: 0.1363 - value_acc_round: 0.0795

  % delta_t_median)


 1799/35156 [>.............................] - ETA: 2:30:54 - loss: 2.0544 - policy_loss: 5.9876 - value_loss: 0.7433 - policy_acc: 0.1364 - value_acc_round: 0.0796

  % delta_t_median)


 1963/35156 [>.............................] - ETA: 2:28:08 - loss: 2.0334 - policy_loss: 5.9084 - value_loss: 0.7417 - policy_acc: 0.1426 - value_acc_round: 0.0816

  % delta_t_median)


 1964/35156 [>.............................] - ETA: 2:28:11 - loss: 2.0333 - policy_loss: 5.9079 - value_loss: 0.7417 - policy_acc: 0.1426 - value_acc_round: 0.0816

  % delta_t_median)


 1968/35156 [>.............................] - ETA: 2:28:11 - loss: 2.0330 - policy_loss: 5.9065 - value_loss: 0.7418 - policy_acc: 0.1427 - value_acc_round: 0.0816

  % delta_t_median)


 1970/35156 [>.............................] - ETA: 2:28:08 - loss: 2.0327 - policy_loss: 5.9056 - value_loss: 0.7418 - policy_acc: 0.1428 - value_acc_round: 0.0817

  % delta_t_median)


 2012/35156 [>.............................] - ETA: 2:27:42 - loss: 2.0271 - policy_loss: 5.8847 - value_loss: 0.7412 - policy_acc: 0.1444 - value_acc_round: 0.0822

  % delta_t_median)


 2295/35156 [>.............................] - ETA: 2:23:28 - loss: 1.9945 - policy_loss: 5.7621 - value_loss: 0.7387 - policy_acc: 0.1544 - value_acc_round: 0.0863

  % delta_t_median)


 2456/35156 [=>............................] - ETA: 2:21:25 - loss: 1.9773 - policy_loss: 5.6943 - value_loss: 0.7383 - policy_acc: 0.1603 - value_acc_round: 0.0877

  % delta_t_median)


 2460/35156 [=>............................] - ETA: 2:21:26 - loss: 1.9768 - policy_loss: 5.6925 - value_loss: 0.7383 - policy_acc: 0.1605 - value_acc_round: 0.0877

  % delta_t_median)


 2531/35156 [=>............................] - ETA: 2:20:51 - loss: 1.9693 - policy_loss: 5.6613 - value_loss: 0.7386 - policy_acc: 0.1632 - value_acc_round: 0.0875

  % delta_t_median)


 2898/35156 [=>............................] - ETA: 2:17:02 - loss: 1.9336 - policy_loss: 5.5202 - value_loss: 0.7380 - policy_acc: 0.1761 - value_acc_round: 0.0887

  % delta_t_median)


 3185/35156 [=>............................] - ETA: 2:14:24 - loss: 1.9093 - policy_loss: 5.4264 - value_loss: 0.7369 - policy_acc: 0.1848 - value_acc_round: 0.0899

  % delta_t_median)


 3229/35156 [=>............................] - ETA: 2:14:10 - loss: 1.9055 - policy_loss: 5.4122 - value_loss: 0.7366 - policy_acc: 0.1861 - value_acc_round: 0.0902

  % delta_t_median)


 4253/35156 [==>...........................] - ETA: 2:05:09 - loss: 1.8175 - policy_loss: 5.0649 - value_loss: 0.7351 - policy_acc: 0.2202 - value_acc_round: 0.0939 ETA: 2:05:27 - loss: 

  % delta_t_median)


 4618/35156 [==>...........................] - ETA: 2:02:43 - loss: 1.7905 - policy_loss: 4.9576 - value_loss: 0.7347 - policy_acc: 0.2306 - value_acc_round: 0.0955

  % delta_t_median)


 5580/35156 [===>..........................] - ETA: 1:56:56 - loss: 1.7230 - policy_loss: 4.6876 - value_loss: 0.7348 - policy_acc: 0.2573 - value_acc_round: 0.0964

  % delta_t_median)


 5582/35156 [===>..........................] - ETA: 1:56:56 - loss: 1.7229 - policy_loss: 4.6870 - value_loss: 0.7348 - policy_acc: 0.2574 - value_acc_round: 0.0964

  % delta_t_median)


 6300/35156 [====>.........................] - ETA: 1:52:40 - loss: 1.6761 - policy_loss: 4.5009 - value_loss: 0.7345 - policy_acc: 0.2757 - value_acc_round: 0.0970

  % delta_t_median)


 6303/35156 [====>.........................] - ETA: 1:52:43 - loss: 1.6759 - policy_loss: 4.5003 - value_loss: 0.7345 - policy_acc: 0.2758 - value_acc_round: 0.0970

  % delta_t_median)


 6304/35156 [====>.........................] - ETA: 1:52:43 - loss: 1.6759 - policy_loss: 4.5001 - value_loss: 0.7345 - policy_acc: 0.2758 - value_acc_round: 0.0970

  % delta_t_median)


 6306/35156 [====>.........................] - ETA: 1:52:43 - loss: 1.6758 - policy_loss: 4.4997 - value_loss: 0.7345 - policy_acc: 0.2758 - value_acc_round: 0.0970

  % delta_t_median)


 6309/35156 [====>.........................] - ETA: 1:52:45 - loss: 1.6756 - policy_loss: 4.4989 - value_loss: 0.7345 - policy_acc: 0.2759 - value_acc_round: 0.0970

  % delta_t_median)


 6310/35156 [====>.........................] - ETA: 1:52:45 - loss: 1.6755 - policy_loss: 4.4987 - value_loss: 0.7345 - policy_acc: 0.2759 - value_acc_round: 0.0970

  % delta_t_median)


 6311/35156 [====>.........................] - ETA: 1:52:46 - loss: 1.6755 - policy_loss: 4.4985 - value_loss: 0.7345 - policy_acc: 0.2759 - value_acc_round: 0.0970

  % delta_t_median)


 6312/35156 [====>.........................] - ETA: 1:52:47 - loss: 1.6754 - policy_loss: 4.4982 - value_loss: 0.7345 - policy_acc: 0.2760 - value_acc_round: 0.0970

  % delta_t_median)


 6313/35156 [====>.........................] - ETA: 1:52:48 - loss: 1.6753 - policy_loss: 4.4979 - value_loss: 0.7345 - policy_acc: 0.2760 - value_acc_round: 0.0970

  % delta_t_median)


 6314/35156 [====>.........................] - ETA: 1:52:49 - loss: 1.6753 - policy_loss: 4.4977 - value_loss: 0.7345 - policy_acc: 0.2760 - value_acc_round: 0.0971

  % delta_t_median)


 6315/35156 [====>.........................] - ETA: 1:52:50 - loss: 1.6752 - policy_loss: 4.4975 - value_loss: 0.7345 - policy_acc: 0.2760 - value_acc_round: 0.0971

  % delta_t_median)


 6322/35156 [====>.........................] - ETA: 1:52:54 - loss: 1.6748 - policy_loss: 4.4958 - value_loss: 0.7345 - policy_acc: 0.2762 - value_acc_round: 0.0971

  % delta_t_median)


 6324/35156 [====>.........................] - ETA: 1:52:53 - loss: 1.6746 - policy_loss: 4.4952 - value_loss: 0.7345 - policy_acc: 0.2762 - value_acc_round: 0.0971

  % delta_t_median)


 6325/35156 [====>.........................] - ETA: 1:52:53 - loss: 1.6746 - policy_loss: 4.4950 - value_loss: 0.7345 - policy_acc: 0.2763 - value_acc_round: 0.0971

  % delta_t_median)
  % delta_t_median)


 6580/35156 [====>.........................] - ETA: 1:51:24 - loss: 1.6589 - policy_loss: 4.4333 - value_loss: 0.7341 - policy_acc: 0.2824 - value_acc_round: 0.0975

  % delta_t_median)


 6586/35156 [====>.........................] - ETA: 1:51:23 - loss: 1.6585 - policy_loss: 4.4319 - value_loss: 0.7341 - policy_acc: 0.2825 - value_acc_round: 0.0975

  % delta_t_median)


 6594/35156 [====>.........................] - ETA: 1:51:23 - loss: 1.6581 - policy_loss: 4.4303 - value_loss: 0.7341 - policy_acc: 0.2827 - value_acc_round: 0.0975

  % delta_t_median)


 7585/35156 [=====>........................] - ETA: 1:46:15 - loss: 1.6033 - policy_loss: 4.2140 - value_loss: 0.7331 - policy_acc: 0.3037 - value_acc_round: 0.0993

  % delta_t_median)


 7750/35156 [=====>........................] - ETA: 1:45:37 - loss: 1.5942 - policy_loss: 4.1792 - value_loss: 0.7326 - policy_acc: 0.3071 - value_acc_round: 0.1000

  % delta_t_median)


 7762/35156 [=====>........................] - ETA: 1:45:37 - loss: 1.5936 - policy_loss: 4.1768 - value_loss: 0.7326 - policy_acc: 0.3073 - value_acc_round: 0.1001

  % delta_t_median)


 7763/35156 [=====>........................] - ETA: 1:45:37 - loss: 1.5936 - policy_loss: 4.1766 - value_loss: 0.7326 - policy_acc: 0.3074 - value_acc_round: 0.1001

  % delta_t_median)


 7894/35156 [=====>........................] - ETA: 1:45:06 - loss: 1.5866 - policy_loss: 4.1489 - value_loss: 0.7325 - policy_acc: 0.3101 - value_acc_round: 0.1002

  % delta_t_median)


 7928/35156 [=====>........................] - ETA: 1:45:01 - loss: 1.5847 - policy_loss: 4.1415 - value_loss: 0.7324 - policy_acc: 0.3109 - value_acc_round: 0.1003

  % delta_t_median)


 7945/35156 [=====>........................] - ETA: 1:45:00 - loss: 1.5838 - policy_loss: 4.1378 - value_loss: 0.7325 - policy_acc: 0.3113 - value_acc_round: 0.1003

  % delta_t_median)


 7948/35156 [=====>........................] - ETA: 1:45:01 - loss: 1.5836 - policy_loss: 4.1371 - value_loss: 0.7325 - policy_acc: 0.3114 - value_acc_round: 0.1003

  % delta_t_median)
  % delta_t_median)


 7951/35156 [=====>........................] - ETA: 1:45:00 - loss: 1.5835 - policy_loss: 4.1364 - value_loss: 0.7325 - policy_acc: 0.3115 - value_acc_round: 0.1003

  % delta_t_median)


 8003/35156 [=====>........................] - ETA: 1:44:51 - loss: 1.5810 - policy_loss: 4.1261 - value_loss: 0.7326 - policy_acc: 0.3125 - value_acc_round: 0.1002

  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)
  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)
  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)
  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)
  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)
  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)
  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)
  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)
  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)
  % delta_t_median)




  % delta_t_median)




  % delta_t_median)
  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)
  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)
  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)



Epoch 00001: val_loss improved from inf to 1.05520, saving model to models/model-01.hdf5
Epoch:  1  - lr: 0.006133369  - batch: 0  - epoch:  1
Epoch 2/5
   26/35156 [..............................] - ETA: 2:27:12 - loss: 0.8499 - policy_loss: 1.4544 - value_loss: 0.6484 - policy_acc: 0.6086 - value_acc_round: 0.2300

  % delta_t_median)


   27/35156 [..............................] - ETA: 2:30:04 - loss: 0.8555 - policy_loss: 1.4625 - value_loss: 0.6532 - policy_acc: 0.6056 - value_acc_round: 0.2279

  % delta_t_median)


   79/35156 [..............................] - ETA: 2:22:51 - loss: 0.8882 - policy_loss: 1.5048 - value_loss: 0.6826 - policy_acc: 0.5953 - value_acc_round: 0.1901

  % delta_t_median)


  143/35156 [..............................] - ETA: 2:18:25 - loss: 0.8936 - policy_loss: 1.5319 - value_loss: 0.6808 - policy_acc: 0.5888 - value_acc_round: 0.1813

  % delta_t_median)


  527/35156 [..............................] - ETA: 2:09:23 - loss: 0.8940 - policy_loss: 1.5470 - value_loss: 0.6763 - policy_acc: 0.5849 - value_acc_round: 0.1884

  % delta_t_median)


  530/35156 [..............................] - ETA: 2:09:43 - loss: 0.8939 - policy_loss: 1.5475 - value_loss: 0.6760 - policy_acc: 0.5848 - value_acc_round: 0.1889

  % delta_t_median)


  543/35156 [..............................] - ETA: 2:10:37 - loss: 0.8962 - policy_loss: 1.5499 - value_loss: 0.6783 - policy_acc: 0.5842 - value_acc_round: 0.1889

  % delta_t_median)


  710/35156 [..............................] - ETA: 2:10:31 - loss: 0.9015 - policy_loss: 1.5537 - value_loss: 0.6841 - policy_acc: 0.5834 - value_acc_round: 0.1785

  % delta_t_median)


 1124/35156 [..............................] - ETA: 2:09:50 - loss: 0.9037 - policy_loss: 1.5594 - value_loss: 0.6852 - policy_acc: 0.5830 - value_acc_round: 0.1782

  % delta_t_median)


 1146/35156 [..............................] - ETA: 2:10:09 - loss: 0.9044 - policy_loss: 1.5620 - value_loss: 0.6851 - policy_acc: 0.5823 - value_acc_round: 0.1778

  % delta_t_median)


 1150/35156 [..............................] - ETA: 2:10:15 - loss: 0.9043 - policy_loss: 1.5623 - value_loss: 0.6850 - policy_acc: 0.5822 - value_acc_round: 0.1778

  % delta_t_median)


 1221/35156 [>.............................] - ETA: 2:10:23 - loss: 0.9041 - policy_loss: 1.5601 - value_loss: 0.6855 - policy_acc: 0.5829 - value_acc_round: 0.1774

  % delta_t_median)


 1225/35156 [>.............................] - ETA: 2:10:28 - loss: 0.9040 - policy_loss: 1.5599 - value_loss: 0.6853 - policy_acc: 0.5829 - value_acc_round: 0.1774

  % delta_t_median)


 1255/35156 [>.............................] - ETA: 2:10:43 - loss: 0.9047 - policy_loss: 1.5619 - value_loss: 0.6856 - policy_acc: 0.5823 - value_acc_round: 0.1773

  % delta_t_median)


 1287/35156 [>.............................] - ETA: 2:11:07 - loss: 0.9047 - policy_loss: 1.5623 - value_loss: 0.6855 - policy_acc: 0.5822 - value_acc_round: 0.1781

  % delta_t_median)


 1564/35156 [>.............................] - ETA: 2:09:00 - loss: 0.9012 - policy_loss: 1.5598 - value_loss: 0.6817 - policy_acc: 0.5828 - value_acc_round: 0.1853

  % delta_t_median)


 1686/35156 [>.............................] - ETA: 2:08:31 - loss: 0.9027 - policy_loss: 1.5575 - value_loss: 0.6844 - policy_acc: 0.5833 - value_acc_round: 0.1810

  % delta_t_median)


 1689/35156 [>.............................] - ETA: 2:08:36 - loss: 0.9026 - policy_loss: 1.5573 - value_loss: 0.6843 - policy_acc: 0.5834 - value_acc_round: 0.1809

  % delta_t_median)


 1692/35156 [>.............................] - ETA: 2:08:37 - loss: 0.9025 - policy_loss: 1.5572 - value_loss: 0.6842 - policy_acc: 0.5834 - value_acc_round: 0.1810

  % delta_t_median)


 1763/35156 [>.............................] - ETA: 2:08:02 - loss: 0.9032 - policy_loss: 1.5566 - value_loss: 0.6854 - policy_acc: 0.5833 - value_acc_round: 0.1792

  % delta_t_median)


 1769/35156 [>.............................] - ETA: 2:08:05 - loss: 0.9031 - policy_loss: 1.5564 - value_loss: 0.6854 - policy_acc: 0.5834 - value_acc_round: 0.1791

  % delta_t_median)


 2268/35156 [>.............................] - ETA: 2:04:40 - loss: 0.9045 - policy_loss: 1.5547 - value_loss: 0.6877 - policy_acc: 0.5832 - value_acc_round: 0.1753

  % delta_t_median)


 2269/35156 [>.............................] - ETA: 2:04:43 - loss: 0.9044 - policy_loss: 1.5548 - value_loss: 0.6877 - policy_acc: 0.5832 - value_acc_round: 0.1754

  % delta_t_median)


 2271/35156 [>.............................] - ETA: 2:04:42 - loss: 0.9044 - policy_loss: 1.5548 - value_loss: 0.6876 - policy_acc: 0.5832 - value_acc_round: 0.1754

  % delta_t_median)


 2273/35156 [>.............................] - ETA: 2:04:43 - loss: 0.9044 - policy_loss: 1.5549 - value_loss: 0.6875 - policy_acc: 0.5832 - value_acc_round: 0.1755

  % delta_t_median)


 2328/35156 [>.............................] - ETA: 2:04:38 - loss: 0.9045 - policy_loss: 1.5560 - value_loss: 0.6873 - policy_acc: 0.5830 - value_acc_round: 0.1763 ETA: 2:04:32 - loss: 0.9045 - policy_loss: 1.5556 - value_loss: 0.6875 

  % delta_t_median)


 2329/35156 [>.............................] - ETA: 2:04:41 - loss: 0.9045 - policy_loss: 1.5559 - value_loss: 0.6873 - policy_acc: 0.5830 - value_acc_round: 0.1763

  % delta_t_median)


 2333/35156 [>.............................] - ETA: 2:04:40 - loss: 0.9046 - policy_loss: 1.5558 - value_loss: 0.6875 - policy_acc: 0.5830 - value_acc_round: 0.1763

  % delta_t_median)


 2434/35156 [=>............................] - ETA: 2:03:58 - loss: 0.9044 - policy_loss: 1.5554 - value_loss: 0.6874 - policy_acc: 0.5830 - value_acc_round: 0.1762

  % delta_t_median)


 2457/35156 [=>............................] - ETA: 2:04:07 - loss: 0.9042 - policy_loss: 1.5548 - value_loss: 0.6873 - policy_acc: 0.5831 - value_acc_round: 0.1767

  % delta_t_median)


 2459/35156 [=>............................] - ETA: 2:04:08 - loss: 0.9041 - policy_loss: 1.5546 - value_loss: 0.6873 - policy_acc: 0.5831 - value_acc_round: 0.1767

  % delta_t_median)


 2651/35156 [=>............................] - ETA: 2:03:28 - loss: 0.9053 - policy_loss: 1.5530 - value_loss: 0.6894 - policy_acc: 0.5837 - value_acc_round: 0.1738

  % delta_t_median)


 2653/35156 [=>............................] - ETA: 2:03:29 - loss: 0.9053 - policy_loss: 1.5530 - value_loss: 0.6894 - policy_acc: 0.5837 - value_acc_round: 0.1738

  % delta_t_median)


 2654/35156 [=>............................] - ETA: 2:03:28 - loss: 0.9053 - policy_loss: 1.5530 - value_loss: 0.6893 - policy_acc: 0.5837 - value_acc_round: 0.1738

  % delta_t_median)


 2782/35156 [=>............................] - ETA: 2:03:01 - loss: 0.9048 - policy_loss: 1.5502 - value_loss: 0.6896 - policy_acc: 0.5842 - value_acc_round: 0.1738

  % delta_t_median)


 2783/35156 [=>............................] - ETA: 2:03:03 - loss: 0.9048 - policy_loss: 1.5501 - value_loss: 0.6896 - policy_acc: 0.5842 - value_acc_round: 0.1738

  % delta_t_median)


 2954/35156 [=>............................] - ETA: 2:02:34 - loss: 0.9050 - policy_loss: 1.5500 - value_loss: 0.6899 - policy_acc: 0.5843 - value_acc_round: 0.1735

  % delta_t_median)


 2961/35156 [=>............................] - ETA: 2:02:39 - loss: 0.9051 - policy_loss: 1.5500 - value_loss: 0.6901 - policy_acc: 0.5843 - value_acc_round: 0.1734

  % delta_t_median)


 2963/35156 [=>............................] - ETA: 2:02:37 - loss: 0.9051 - policy_loss: 1.5499 - value_loss: 0.6901 - policy_acc: 0.5843 - value_acc_round: 0.1733

  % delta_t_median)


 3078/35156 [=>............................] - ETA: 2:02:09 - loss: 0.9053 - policy_loss: 1.5480 - value_loss: 0.6910 - policy_acc: 0.5847 - value_acc_round: 0.1723 ETA: 2:02:06 - loss: 0.9050 - policy_loss: 1.5482 - value_loss: 0.6905 - policy

  % delta_t_median)


 3080/35156 [=>............................] - ETA: 2:02:10 - loss: 0.9053 - policy_loss: 1.5480 - value_loss: 0.6910 - policy_acc: 0.5847 - value_acc_round: 0.1722

  % delta_t_median)
  % delta_t_median)


 3205/35156 [=>............................] - ETA: 2:01:43 - loss: 0.9048 - policy_loss: 1.5450 - value_loss: 0.6914 - policy_acc: 0.5855 - value_acc_round: 0.1709

  % delta_t_median)


 3207/35156 [=>............................] - ETA: 2:01:41 - loss: 0.9047 - policy_loss: 1.5451 - value_loss: 0.6913 - policy_acc: 0.5855 - value_acc_round: 0.1710

  % delta_t_median)


 3211/35156 [=>............................] - ETA: 2:01:41 - loss: 0.9046 - policy_loss: 1.5451 - value_loss: 0.6911 - policy_acc: 0.5855 - value_acc_round: 0.1712

  % delta_t_median)


 3218/35156 [=>............................] - ETA: 2:01:45 - loss: 0.9043 - policy_loss: 1.5450 - value_loss: 0.6907 - policy_acc: 0.5855 - value_acc_round: 0.1717

  % delta_t_median)


 3302/35156 [=>............................] - ETA: 2:01:31 - loss: 0.9043 - policy_loss: 1.5437 - value_loss: 0.6912 - policy_acc: 0.5857 - value_acc_round: 0.1722

  % delta_t_median)


 3741/35156 [==>...........................] - ETA: 1:59:18 - loss: 0.9029 - policy_loss: 1.5387 - value_loss: 0.6910 - policy_acc: 0.5864 - value_acc_round: 0.1727

  % delta_t_median)


 3794/35156 [==>...........................] - ETA: 1:59:07 - loss: 0.9027 - policy_loss: 1.5401 - value_loss: 0.6902 - policy_acc: 0.5862 - value_acc_round: 0.1738

  % delta_t_median)


 3830/35156 [==>...........................] - ETA: 1:59:05 - loss: 0.9029 - policy_loss: 1.5403 - value_loss: 0.6904 - policy_acc: 0.5861 - value_acc_round: 0.1739

  % delta_t_median)


 3993/35156 [==>...........................] - ETA: 1:58:16 - loss: 0.9030 - policy_loss: 1.5419 - value_loss: 0.6900 - policy_acc: 0.5856 - value_acc_round: 0.1742

  % delta_t_median)


 3994/35156 [==>...........................] - ETA: 1:58:17 - loss: 0.9030 - policy_loss: 1.5419 - value_loss: 0.6900 - policy_acc: 0.5856 - value_acc_round: 0.1743

  % delta_t_median)


 3996/35156 [==>...........................] - ETA: 1:58:18 - loss: 0.9029 - policy_loss: 1.5419 - value_loss: 0.6899 - policy_acc: 0.5855 - value_acc_round: 0.1743

  % delta_t_median)


 4112/35156 [==>...........................] - ETA: 1:57:33 - loss: 0.9027 - policy_loss: 1.5418 - value_loss: 0.6897 - policy_acc: 0.5856 - value_acc_round: 0.1747

  % delta_t_median)


 4114/35156 [==>...........................] - ETA: 1:57:34 - loss: 0.9027 - policy_loss: 1.5418 - value_loss: 0.6896 - policy_acc: 0.5856 - value_acc_round: 0.1748

  % delta_t_median)


 4247/35156 [==>...........................] - ETA: 1:56:59 - loss: 0.9026 - policy_loss: 1.5422 - value_loss: 0.6894 - policy_acc: 0.5854 - value_acc_round: 0.1754

  % delta_t_median)


 4249/35156 [==>...........................] - ETA: 1:57:00 - loss: 0.9027 - policy_loss: 1.5422 - value_loss: 0.6895 - policy_acc: 0.5854 - value_acc_round: 0.1754

  % delta_t_median)


 4252/35156 [==>...........................] - ETA: 1:57:00 - loss: 0.9027 - policy_loss: 1.5422 - value_loss: 0.6895 - policy_acc: 0.5854 - value_acc_round: 0.1754

  % delta_t_median)


 4280/35156 [==>...........................] - ETA: 1:56:58 - loss: 0.9028 - policy_loss: 1.5423 - value_loss: 0.6896 - policy_acc: 0.5854 - value_acc_round: 0.1750

  % delta_t_median)


 4286/35156 [==>...........................] - ETA: 1:56:57 - loss: 0.9028 - policy_loss: 1.5422 - value_loss: 0.6897 - policy_acc: 0.5854 - value_acc_round: 0.1749

  % delta_t_median)


 4409/35156 [==>...........................] - ETA: 1:56:35 - loss: 0.9022 - policy_loss: 1.5406 - value_loss: 0.6894 - policy_acc: 0.5857 - value_acc_round: 0.1751 ETA: 1:56:36 - loss: 0.9022 - policy_loss: 1.5406 - v

  % delta_t_median)


 4478/35156 [==>...........................] - ETA: 1:56:22 - loss: 0.9022 - policy_loss: 1.5410 - value_loss: 0.6892 - policy_acc: 0.5856 - value_acc_round: 0.1753

  % delta_t_median)


 4539/35156 [==>...........................] - ETA: 1:56:16 - loss: 0.9021 - policy_loss: 1.5411 - value_loss: 0.6891 - policy_acc: 0.5856 - value_acc_round: 0.1753

  % delta_t_median)


 4540/35156 [==>...........................] - ETA: 1:56:16 - loss: 0.9021 - policy_loss: 1.5411 - value_loss: 0.6891 - policy_acc: 0.5856 - value_acc_round: 0.1753

  % delta_t_median)


 4542/35156 [==>...........................] - ETA: 1:56:17 - loss: 0.9020 - policy_loss: 1.5410 - value_loss: 0.6891 - policy_acc: 0.5856 - value_acc_round: 0.1753

  % delta_t_median)


 4544/35156 [==>...........................] - ETA: 1:56:17 - loss: 0.9020 - policy_loss: 1.5410 - value_loss: 0.6890 - policy_acc: 0.5856 - value_acc_round: 0.1754

  % delta_t_median)


 5034/35156 [===>..........................] - ETA: 1:54:15 - loss: 0.9019 - policy_loss: 1.5407 - value_loss: 0.6890 - policy_acc: 0.5856 - value_acc_round: 0.1752

  % delta_t_median)


 5466/35156 [===>..........................] - ETA: 1:52:39 - loss: 0.9010 - policy_loss: 1.5422 - value_loss: 0.6872 - policy_acc: 0.5853 - value_acc_round: 0.1774

  % delta_t_median)


 5469/35156 [===>..........................] - ETA: 1:52:40 - loss: 0.9009 - policy_loss: 1.5422 - value_loss: 0.6872 - policy_acc: 0.5853 - value_acc_round: 0.1775

  % delta_t_median)
  % delta_t_median)


 5587/35156 [===>..........................] - ETA: 1:52:15 - loss: 0.9009 - policy_loss: 1.5420 - value_loss: 0.6872 - policy_acc: 0.5853 - value_acc_round: 0.1777

  % delta_t_median)


 5589/35156 [===>..........................] - ETA: 1:52:15 - loss: 0.9009 - policy_loss: 1.5420 - value_loss: 0.6871 - policy_acc: 0.5853 - value_acc_round: 0.1778

  % delta_t_median)


 5591/35156 [===>..........................] - ETA: 1:52:15 - loss: 0.9008 - policy_loss: 1.5419 - value_loss: 0.6871 - policy_acc: 0.5854 - value_acc_round: 0.1778

  % delta_t_median)


 5613/35156 [===>..........................] - ETA: 1:52:14 - loss: 0.9007 - policy_loss: 1.5417 - value_loss: 0.6871 - policy_acc: 0.5854 - value_acc_round: 0.1779

  % delta_t_median)


 5621/35156 [===>..........................] - ETA: 1:52:14 - loss: 0.9007 - policy_loss: 1.5415 - value_loss: 0.6871 - policy_acc: 0.5854 - value_acc_round: 0.1779

  % delta_t_median)
  % delta_t_median)


 5634/35156 [===>..........................] - ETA: 1:52:15 - loss: 0.9005 - policy_loss: 1.5412 - value_loss: 0.6869 - policy_acc: 0.5855 - value_acc_round: 0.1781

  % delta_t_median)


 5636/35156 [===>..........................] - ETA: 1:52:15 - loss: 0.9004 - policy_loss: 1.5412 - value_loss: 0.6869 - policy_acc: 0.5855 - value_acc_round: 0.1781

  % delta_t_median)


 5640/35156 [===>..........................] - ETA: 1:52:15 - loss: 0.9004 - policy_loss: 1.5410 - value_loss: 0.6869 - policy_acc: 0.5856 - value_acc_round: 0.1782

  % delta_t_median)


 5642/35156 [===>..........................] - ETA: 1:52:15 - loss: 0.9004 - policy_loss: 1.5410 - value_loss: 0.6869 - policy_acc: 0.5856 - value_acc_round: 0.1782

  % delta_t_median)


 5670/35156 [===>..........................] - ETA: 1:52:15 - loss: 0.9004 - policy_loss: 1.5408 - value_loss: 0.6869 - policy_acc: 0.5856 - value_acc_round: 0.1781

  % delta_t_median)


 5880/35156 [====>.........................] - ETA: 1:51:35 - loss: 0.8997 - policy_loss: 1.5388 - value_loss: 0.6867 - policy_acc: 0.5860 - value_acc_round: 0.1785

  % delta_t_median)


 6065/35156 [====>.........................] - ETA: 1:50:43 - loss: 0.9002 - policy_loss: 1.5404 - value_loss: 0.6868 - policy_acc: 0.5857 - value_acc_round: 0.1783

  % delta_t_median)


 6099/35156 [====>.........................] - ETA: 1:50:41 - loss: 0.9004 - policy_loss: 1.5406 - value_loss: 0.6870 - policy_acc: 0.5857 - value_acc_round: 0.1781

  % delta_t_median)


 6262/35156 [====>.........................] - ETA: 1:49:57 - loss: 0.9000 - policy_loss: 1.5399 - value_loss: 0.6868 - policy_acc: 0.5859 - value_acc_round: 0.1784

  % delta_t_median)


 6265/35156 [====>.........................] - ETA: 1:49:58 - loss: 0.9001 - policy_loss: 1.5399 - value_loss: 0.6869 - policy_acc: 0.5859 - value_acc_round: 0.1784

  % delta_t_median)


 6300/35156 [====>.........................] - ETA: 1:49:49 - loss: 0.9001 - policy_loss: 1.5401 - value_loss: 0.6868 - policy_acc: 0.5858 - value_acc_round: 0.1784

  % delta_t_median)


 6457/35156 [====>.........................] - ETA: 1:49:19 - loss: 0.9000 - policy_loss: 1.5390 - value_loss: 0.6870 - policy_acc: 0.5860 - value_acc_round: 0.1781

  % delta_t_median)


 7106/35156 [=====>........................] - ETA: 1:46:22 - loss: 0.9003 - policy_loss: 1.5425 - value_loss: 0.6862 - policy_acc: 0.5854 - value_acc_round: 0.1798

  % delta_t_median)


 7220/35156 [=====>........................] - ETA: 1:46:00 - loss: 0.9007 - policy_loss: 1.5432 - value_loss: 0.6865 - policy_acc: 0.5852 - value_acc_round: 0.1794

  % delta_t_median)


 7226/35156 [=====>........................] - ETA: 1:45:59 - loss: 0.9006 - policy_loss: 1.5432 - value_loss: 0.6865 - policy_acc: 0.5852 - value_acc_round: 0.1794

  % delta_t_median)


 7392/35156 [=====>........................] - ETA: 1:45:32 - loss: 0.9008 - policy_loss: 1.5437 - value_loss: 0.6865 - policy_acc: 0.5851 - value_acc_round: 0.1793

  % delta_t_median)


 7394/35156 [=====>........................] - ETA: 1:45:32 - loss: 0.9008 - policy_loss: 1.5437 - value_loss: 0.6865 - policy_acc: 0.5851 - value_acc_round: 0.1793

  % delta_t_median)


 7444/35156 [=====>........................] - ETA: 1:45:26 - loss: 0.9007 - policy_loss: 1.5436 - value_loss: 0.6864 - policy_acc: 0.5851 - value_acc_round: 0.1796 ETA: 1:45:33 - loss: 

  % delta_t_median)


 7485/35156 [=====>........................] - ETA: 1:45:18 - loss: 0.9006 - policy_loss: 1.5435 - value_loss: 0.6863 - policy_acc: 0.5852 - value_acc_round: 0.1797

  % delta_t_median)


 7487/35156 [=====>........................] - ETA: 1:45:17 - loss: 0.9006 - policy_loss: 1.5435 - value_loss: 0.6864 - policy_acc: 0.5852 - value_acc_round: 0.1796

  % delta_t_median)


 7760/35156 [=====>........................] - ETA: 1:44:11 - loss: 0.9009 - policy_loss: 1.5446 - value_loss: 0.6864 - policy_acc: 0.5849 - value_acc_round: 0.1798

  % delta_t_median)


 7762/35156 [=====>........................] - ETA: 1:44:11 - loss: 0.9009 - policy_loss: 1.5446 - value_loss: 0.6864 - policy_acc: 0.5849 - value_acc_round: 0.1798

  % delta_t_median)


 7765/35156 [=====>........................] - ETA: 1:44:12 - loss: 0.9009 - policy_loss: 1.5446 - value_loss: 0.6864 - policy_acc: 0.5849 - value_acc_round: 0.1798

  % delta_t_median)


 7872/35156 [=====>........................] - ETA: 1:43:47 - loss: 0.9007 - policy_loss: 1.5439 - value_loss: 0.6863 - policy_acc: 0.5851 - value_acc_round: 0.1801

  % delta_t_median)


 7942/35156 [=====>........................] - ETA: 1:43:35 - loss: 0.9006 - policy_loss: 1.5439 - value_loss: 0.6861 - policy_acc: 0.5851 - value_acc_round: 0.1802

  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)
  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)
  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)
  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)
  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)
  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)
  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)
  % delta_t_median)




  % delta_t_median)
  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)



Epoch 00002: val_loss improved from 1.05520 to 0.96251, saving model to models/model-02.hdf5
Epoch:  2  - lr: 0.003566595  - batch: 1  - epoch:  2
Epoch 3/5
    3/35156 [..............................] - ETA: 2:24:45 - loss: 0.8765 - policy_loss: 1.3621 - value_loss: 0.7147 - policy_acc: 0.6146 - value_acc_round: 0.1198

  % delta_t_median)


  916/35156 [..............................] - ETA: 2:09:30 - loss: 0.8519 - policy_loss: 1.3644 - value_loss: 0.6810 - policy_acc: 0.6179 - value_acc_round: 0.1837

  % delta_t_median)


  918/35156 [..............................] - ETA: 2:09:42 - loss: 0.8518 - policy_loss: 1.3644 - value_loss: 0.6809 - policy_acc: 0.6179 - value_acc_round: 0.1837

  % delta_t_median)


  958/35156 [..............................] - ETA: 2:09:59 - loss: 0.8515 - policy_loss: 1.3625 - value_loss: 0.6811 - policy_acc: 0.6180 - value_acc_round: 0.1834

  % delta_t_median)


 1030/35156 [..............................] - ETA: 2:10:01 - loss: 0.8510 - policy_loss: 1.3625 - value_loss: 0.6805 - policy_acc: 0.6182 - value_acc_round: 0.1835

  % delta_t_median)


 1059/35156 [..............................] - ETA: 2:10:09 - loss: 0.8506 - policy_loss: 1.3642 - value_loss: 0.6794 - policy_acc: 0.6177 - value_acc_round: 0.1852

  % delta_t_median)


 1065/35156 [..............................] - ETA: 2:10:13 - loss: 0.8512 - policy_loss: 1.3645 - value_loss: 0.6801 - policy_acc: 0.6176 - value_acc_round: 0.1851

  % delta_t_median)


 1126/35156 [..............................] - ETA: 2:10:26 - loss: 0.8521 - policy_loss: 1.3658 - value_loss: 0.6809 - policy_acc: 0.6172 - value_acc_round: 0.1838

  % delta_t_median)


 1590/35156 [>.............................] - ETA: 2:06:44 - loss: 0.8490 - policy_loss: 1.3647 - value_loss: 0.6770 - policy_acc: 0.6176 - value_acc_round: 0.1898

  % delta_t_median)


 1593/35156 [>.............................] - ETA: 2:06:44 - loss: 0.8489 - policy_loss: 1.3649 - value_loss: 0.6769 - policy_acc: 0.6176 - value_acc_round: 0.1898

  % delta_t_median)


 1675/35156 [>.............................] - ETA: 2:06:30 - loss: 0.8491 - policy_loss: 1.3640 - value_loss: 0.6775 - policy_acc: 0.6178 - value_acc_round: 0.1888

  % delta_t_median)


 1750/35156 [>.............................] - ETA: 2:06:29 - loss: 0.8482 - policy_loss: 1.3604 - value_loss: 0.6774 - policy_acc: 0.6185 - value_acc_round: 0.1892

  % delta_t_median)


 1752/35156 [>.............................] - ETA: 2:06:28 - loss: 0.8481 - policy_loss: 1.3603 - value_loss: 0.6774 - policy_acc: 0.6185 - value_acc_round: 0.1892

  % delta_t_median)


 1981/35156 [>.............................] - ETA: 2:05:31 - loss: 0.8487 - policy_loss: 1.3605 - value_loss: 0.6781 - policy_acc: 0.6182 - value_acc_round: 0.1889

  % delta_t_median)


 2006/35156 [>.............................] - ETA: 2:05:39 - loss: 0.8489 - policy_loss: 1.3604 - value_loss: 0.6784 - policy_acc: 0.6182 - value_acc_round: 0.1886

  % delta_t_median)


 2113/35156 [>.............................] - ETA: 2:04:47 - loss: 0.8495 - policy_loss: 1.3614 - value_loss: 0.6789 - policy_acc: 0.6182 - value_acc_round: 0.1873

  % delta_t_median)


 2116/35156 [>.............................] - ETA: 2:04:51 - loss: 0.8495 - policy_loss: 1.3612 - value_loss: 0.6789 - policy_acc: 0.6182 - value_acc_round: 0.1873

  % delta_t_median)


 2349/35156 [=>............................] - ETA: 2:04:04 - loss: 0.8494 - policy_loss: 1.3613 - value_loss: 0.6787 - policy_acc: 0.6182 - value_acc_round: 0.1872

  % delta_t_median)


 2357/35156 [=>............................] - ETA: 2:04:10 - loss: 0.8492 - policy_loss: 1.3608 - value_loss: 0.6787 - policy_acc: 0.6183 - value_acc_round: 0.1872

  % delta_t_median)


 2654/35156 [=>............................] - ETA: 2:03:27 - loss: 0.8497 - policy_loss: 1.3566 - value_loss: 0.6808 - policy_acc: 0.6190 - value_acc_round: 0.1843

  % delta_t_median)


 2726/35156 [=>............................] - ETA: 2:03:16 - loss: 0.8494 - policy_loss: 1.3555 - value_loss: 0.6807 - policy_acc: 0.6193 - value_acc_round: 0.1843

  % delta_t_median)


 2727/35156 [=>............................] - ETA: 2:03:18 - loss: 0.8494 - policy_loss: 1.3554 - value_loss: 0.6807 - policy_acc: 0.6193 - value_acc_round: 0.1843

  % delta_t_median)


 2730/35156 [=>............................] - ETA: 2:03:18 - loss: 0.8493 - policy_loss: 1.3554 - value_loss: 0.6806 - policy_acc: 0.6193 - value_acc_round: 0.1843

  % delta_t_median)


 2960/35156 [=>............................] - ETA: 2:02:11 - loss: 0.8486 - policy_loss: 1.3522 - value_loss: 0.6807 - policy_acc: 0.6199 - value_acc_round: 0.1839

  % delta_t_median)


 3021/35156 [=>............................] - ETA: 2:02:08 - loss: 0.8486 - policy_loss: 1.3525 - value_loss: 0.6806 - policy_acc: 0.6198 - value_acc_round: 0.1846

  % delta_t_median)


 3031/35156 [=>............................] - ETA: 2:02:12 - loss: 0.8487 - policy_loss: 1.3524 - value_loss: 0.6807 - policy_acc: 0.6199 - value_acc_round: 0.1845

  % delta_t_median)


 3098/35156 [=>............................] - ETA: 2:01:53 - loss: 0.8488 - policy_loss: 1.3528 - value_loss: 0.6808 - policy_acc: 0.6199 - value_acc_round: 0.1841

  % delta_t_median)


 3274/35156 [=>............................] - ETA: 2:01:12 - loss: 0.8488 - policy_loss: 1.3512 - value_loss: 0.6813 - policy_acc: 0.6203 - value_acc_round: 0.1837

  % delta_t_median)


 3310/35156 [=>............................] - ETA: 2:01:09 - loss: 0.8490 - policy_loss: 1.3509 - value_loss: 0.6817 - policy_acc: 0.6204 - value_acc_round: 0.1832

  % delta_t_median)


 3375/35156 [=>............................] - ETA: 2:00:58 - loss: 0.8491 - policy_loss: 1.3503 - value_loss: 0.6821 - policy_acc: 0.6205 - value_acc_round: 0.1823 ETA: 2:00:55 - loss: 0.8490 - policy_loss: 1.3505 - value_loss: 0.6819 - policy

  % delta_t_median)


 3376/35156 [=>............................] - ETA: 2:01:00 - loss: 0.8491 - policy_loss: 1.3502 - value_loss: 0.6821 - policy_acc: 0.6205 - value_acc_round: 0.1823

  % delta_t_median)


 3377/35156 [=>............................] - ETA: 2:01:01 - loss: 0.8491 - policy_loss: 1.3502 - value_loss: 0.6821 - policy_acc: 0.6205 - value_acc_round: 0.1823

  % delta_t_median)


 3379/35156 [=>............................] - ETA: 2:01:00 - loss: 0.8491 - policy_loss: 1.3502 - value_loss: 0.6821 - policy_acc: 0.6205 - value_acc_round: 0.1823

  % delta_t_median)


 3412/35156 [=>............................] - ETA: 2:00:53 - loss: 0.8493 - policy_loss: 1.3502 - value_loss: 0.6824 - policy_acc: 0.6205 - value_acc_round: 0.1821

  % delta_t_median)


 3418/35156 [=>............................] - ETA: 2:00:53 - loss: 0.8494 - policy_loss: 1.3503 - value_loss: 0.6825 - policy_acc: 0.6205 - value_acc_round: 0.1819

  % delta_t_median)


 3708/35156 [==>...........................] - ETA: 1:59:30 - loss: 0.8508 - policy_loss: 1.3524 - value_loss: 0.6835 - policy_acc: 0.6201 - value_acc_round: 0.1797

  % delta_t_median)


 3910/35156 [==>...........................] - ETA: 1:58:40 - loss: 0.8517 - policy_loss: 1.3526 - value_loss: 0.6847 - policy_acc: 0.6200 - value_acc_round: 0.1784

  % delta_t_median)


 3911/35156 [==>...........................] - ETA: 1:58:41 - loss: 0.8517 - policy_loss: 1.3526 - value_loss: 0.6847 - policy_acc: 0.6200 - value_acc_round: 0.1784

  % delta_t_median)


 3915/35156 [==>...........................] - ETA: 1:58:42 - loss: 0.8518 - policy_loss: 1.3527 - value_loss: 0.6848 - policy_acc: 0.6199 - value_acc_round: 0.1784

  % delta_t_median)


 3958/35156 [==>...........................] - ETA: 1:58:33 - loss: 0.8521 - policy_loss: 1.3530 - value_loss: 0.6851 - policy_acc: 0.6199 - value_acc_round: 0.1780

  % delta_t_median)


 4084/35156 [==>...........................] - ETA: 1:58:02 - loss: 0.8531 - policy_loss: 1.3546 - value_loss: 0.6859 - policy_acc: 0.6197 - value_acc_round: 0.1768

  % delta_t_median)


 4109/35156 [==>...........................] - ETA: 1:58:00 - loss: 0.8530 - policy_loss: 1.3544 - value_loss: 0.6859 - policy_acc: 0.6197 - value_acc_round: 0.1767

  % delta_t_median)


 4162/35156 [==>...........................] - ETA: 1:57:52 - loss: 0.8528 - policy_loss: 1.3543 - value_loss: 0.6856 - policy_acc: 0.6197 - value_acc_round: 0.1767

  % delta_t_median)


 4167/35156 [==>...........................] - ETA: 1:57:52 - loss: 0.8527 - policy_loss: 1.3542 - value_loss: 0.6856 - policy_acc: 0.6198 - value_acc_round: 0.1767

  % delta_t_median)


 4170/35156 [==>...........................] - ETA: 1:57:52 - loss: 0.8527 - policy_loss: 1.3542 - value_loss: 0.6855 - policy_acc: 0.6198 - value_acc_round: 0.1767

  % delta_t_median)


 4171/35156 [==>...........................] - ETA: 1:57:53 - loss: 0.8527 - policy_loss: 1.3542 - value_loss: 0.6855 - policy_acc: 0.6198 - value_acc_round: 0.1768

  % delta_t_median)


 4174/35156 [==>...........................] - ETA: 1:57:55 - loss: 0.8527 - policy_loss: 1.3542 - value_loss: 0.6855 - policy_acc: 0.6198 - value_acc_round: 0.1768

  % delta_t_median)


 4178/35156 [==>...........................] - ETA: 1:57:55 - loss: 0.8525 - policy_loss: 1.3541 - value_loss: 0.6854 - policy_acc: 0.6198 - value_acc_round: 0.1769

  % delta_t_median)
  % delta_t_median)


 4211/35156 [==>...........................] - ETA: 1:57:46 - loss: 0.8527 - policy_loss: 1.3540 - value_loss: 0.6855 - policy_acc: 0.6198 - value_acc_round: 0.1771

  % delta_t_median)


 4320/35156 [==>...........................] - ETA: 1:57:16 - loss: 0.8523 - policy_loss: 1.3546 - value_loss: 0.6849 - policy_acc: 0.6196 - value_acc_round: 0.1781

  % delta_t_median)


 4323/35156 [==>...........................] - ETA: 1:57:15 - loss: 0.8524 - policy_loss: 1.3547 - value_loss: 0.6849 - policy_acc: 0.6196 - value_acc_round: 0.1781

  % delta_t_median)


 4614/35156 [==>...........................] - ETA: 1:56:07 - loss: 0.8520 - policy_loss: 1.3543 - value_loss: 0.6846 - policy_acc: 0.6196 - value_acc_round: 0.1780

  % delta_t_median)


 4698/35156 [===>..........................] - ETA: 1:55:56 - loss: 0.8516 - policy_loss: 1.3532 - value_loss: 0.6844 - policy_acc: 0.6198 - value_acc_round: 0.1783

  % delta_t_median)


 4912/35156 [===>..........................] - ETA: 1:55:01 - loss: 0.8515 - policy_loss: 1.3536 - value_loss: 0.6842 - policy_acc: 0.6195 - value_acc_round: 0.1788

  % delta_t_median)


 4951/35156 [===>..........................] - ETA: 1:54:52 - loss: 0.8516 - policy_loss: 1.3540 - value_loss: 0.6841 - policy_acc: 0.6194 - value_acc_round: 0.1787

  % delta_t_median)
  % delta_t_median)


 5384/35156 [===>..........................] - ETA: 1:53:09 - loss: 0.8518 - policy_loss: 1.3516 - value_loss: 0.6851 - policy_acc: 0.6200 - value_acc_round: 0.1773

  % delta_t_median)


 5530/35156 [===>..........................] - ETA: 1:52:43 - loss: 0.8515 - policy_loss: 1.3517 - value_loss: 0.6847 - policy_acc: 0.6199 - value_acc_round: 0.1779

  % delta_t_median)


 5545/35156 [===>..........................] - ETA: 1:52:43 - loss: 0.8513 - policy_loss: 1.3516 - value_loss: 0.6846 - policy_acc: 0.6199 - value_acc_round: 0.1779

  % delta_t_median)


 5668/35156 [===>..........................] - ETA: 1:52:19 - loss: 0.8516 - policy_loss: 1.3510 - value_loss: 0.6852 - policy_acc: 0.6200 - value_acc_round: 0.1772

  % delta_t_median)


 5671/35156 [===>..........................] - ETA: 1:52:20 - loss: 0.8516 - policy_loss: 1.3510 - value_loss: 0.6852 - policy_acc: 0.6200 - value_acc_round: 0.1771

  % delta_t_median)


 5758/35156 [===>..........................] - ETA: 1:51:57 - loss: 0.8517 - policy_loss: 1.3505 - value_loss: 0.6855 - policy_acc: 0.6201 - value_acc_round: 0.1767 ETA: 1:52:00 - loss: 0.8517 - policy_loss: 1.3506 - value_loss: 0

  % delta_t_median)


 5762/35156 [===>..........................] - ETA: 1:51:59 - loss: 0.8517 - policy_loss: 1.3505 - value_loss: 0.6855 - policy_acc: 0.6201 - value_acc_round: 0.1767

  % delta_t_median)


 5764/35156 [===>..........................] - ETA: 1:51:59 - loss: 0.8517 - policy_loss: 1.3505 - value_loss: 0.6855 - policy_acc: 0.6201 - value_acc_round: 0.1767

  % delta_t_median)


 6368/35156 [====>.........................] - ETA: 1:49:18 - loss: 0.8523 - policy_loss: 1.3533 - value_loss: 0.6852 - policy_acc: 0.6196 - value_acc_round: 0.1771

  % delta_t_median)


 6374/35156 [====>.........................] - ETA: 1:49:17 - loss: 0.8523 - policy_loss: 1.3534 - value_loss: 0.6853 - policy_acc: 0.6196 - value_acc_round: 0.1771

  % delta_t_median)


 6491/35156 [====>.........................] - ETA: 1:48:45 - loss: 0.8523 - policy_loss: 1.3537 - value_loss: 0.6851 - policy_acc: 0.6195 - value_acc_round: 0.1774

  % delta_t_median)


 6505/35156 [====>.........................] - ETA: 1:48:44 - loss: 0.8523 - policy_loss: 1.3537 - value_loss: 0.6852 - policy_acc: 0.6195 - value_acc_round: 0.1774

  % delta_t_median)


 6618/35156 [====>.........................] - ETA: 1:48:19 - loss: 0.8517 - policy_loss: 1.3534 - value_loss: 0.6844 - policy_acc: 0.6196 - value_acc_round: 0.1783

  % delta_t_median)


 6619/35156 [====>.........................] - ETA: 1:48:20 - loss: 0.8517 - policy_loss: 1.3534 - value_loss: 0.6844 - policy_acc: 0.6196 - value_acc_round: 0.1784

  % delta_t_median)


 6620/35156 [====>.........................] - ETA: 1:48:20 - loss: 0.8517 - policy_loss: 1.3534 - value_loss: 0.6844 - policy_acc: 0.6196 - value_acc_round: 0.1784

  % delta_t_median)


 6641/35156 [====>.........................] - ETA: 1:48:17 - loss: 0.8516 - policy_loss: 1.3533 - value_loss: 0.6844 - policy_acc: 0.6196 - value_acc_round: 0.1785

  % delta_t_median)


 6871/35156 [====>.........................] - ETA: 1:47:25 - loss: 0.8514 - policy_loss: 1.3542 - value_loss: 0.6838 - policy_acc: 0.6194 - value_acc_round: 0.1795

  % delta_t_median)


 6872/35156 [====>.........................] - ETA: 1:47:26 - loss: 0.8514 - policy_loss: 1.3542 - value_loss: 0.6838 - policy_acc: 0.6194 - value_acc_round: 0.1795

  % delta_t_median)


 6875/35156 [====>.........................] - ETA: 1:47:25 - loss: 0.8514 - policy_loss: 1.3542 - value_loss: 0.6839 - policy_acc: 0.6194 - value_acc_round: 0.1795

  % delta_t_median)


 6952/35156 [====>.........................] - ETA: 1:47:12 - loss: 0.8515 - policy_loss: 1.3543 - value_loss: 0.6840 - policy_acc: 0.6194 - value_acc_round: 0.1793

  % delta_t_median)


 6966/35156 [====>.........................] - ETA: 1:47:12 - loss: 0.8515 - policy_loss: 1.3542 - value_loss: 0.6840 - policy_acc: 0.6194 - value_acc_round: 0.1792

  % delta_t_median)


 7486/35156 [=====>........................] - ETA: 1:45:08 - loss: 0.8512 - policy_loss: 1.3541 - value_loss: 0.6836 - policy_acc: 0.6194 - value_acc_round: 0.1796 ETA: 1:45:08 - loss: 0.8512 - policy_loss: 1.3540 - value_loss: 0.6836 - policy_acc: 0.6194 - v

  % delta_t_median)


 7566/35156 [=====>........................] - ETA: 1:44:57 - loss: 0.8509 - policy_loss: 1.3538 - value_loss: 0.6833 - policy_acc: 0.6194 - value_acc_round: 0.1799

  % delta_t_median)


 7567/35156 [=====>........................] - ETA: 1:44:57 - loss: 0.8509 - policy_loss: 1.3538 - value_loss: 0.6833 - policy_acc: 0.6194 - value_acc_round: 0.1799

  % delta_t_median)


 7777/35156 [=====>........................] - ETA: 1:44:09 - loss: 0.8503 - policy_loss: 1.3520 - value_loss: 0.6831 - policy_acc: 0.6198 - value_acc_round: 0.1805

  % delta_t_median)


 7908/35156 [=====>........................] - ETA: 1:43:34 - loss: 0.8508 - policy_loss: 1.3526 - value_loss: 0.6835 - policy_acc: 0.6196 - value_acc_round: 0.1800

  % delta_t_median)


 8039/35156 [=====>........................] - ETA: 1:43:04 - loss: 0.8510 - policy_loss: 1.3526 - value_loss: 0.6838 - policy_acc: 0.6197 - value_acc_round: 0.1795

  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)
  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)
  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)
  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)



Epoch 00003: val_loss improved from 0.96251 to 0.90988, saving model to models/model-03.hdf5
Epoch:  3  - lr: 0.0008399954  - batch: 2  - epoch:  3
Epoch 4/5
    2/35156 [..............................] - ETA: 2:47:06 - loss: 0.7920 - policy_loss: 1.2217 - value_loss: 0.6488 - policy_acc: 0.6406 - value_acc_round: 0.1816

  % delta_t_median)
  % delta_t_median)


   94/35156 [..............................] - ETA: 2:18:13 - loss: 0.8330 - policy_loss: 1.2567 - value_loss: 0.6918 - policy_acc: 0.6394 - value_acc_round: 0.1719

  % delta_t_median)


   96/35156 [..............................] - ETA: 2:20:02 - loss: 0.8317 - policy_loss: 1.2551 - value_loss: 0.6906 - policy_acc: 0.6398 - value_acc_round: 0.1722

  % delta_t_median)


  249/35156 [..............................] - ETA: 2:19:46 - loss: 0.8256 - policy_loss: 1.2801 - value_loss: 0.6740 - policy_acc: 0.6323 - value_acc_round: 0.1839

  % delta_t_median)


  250/35156 [..............................] - ETA: 2:20:07 - loss: 0.8256 - policy_loss: 1.2799 - value_loss: 0.6742 - policy_acc: 0.6323 - value_acc_round: 0.1839

  % delta_t_median)


  358/35156 [..............................] - ETA: 2:17:19 - loss: 0.8341 - policy_loss: 1.2917 - value_loss: 0.6816 - policy_acc: 0.6307 - value_acc_round: 0.1823

  % delta_t_median)


  366/35156 [..............................] - ETA: 2:17:32 - loss: 0.8349 - policy_loss: 1.2923 - value_loss: 0.6824 - policy_acc: 0.6305 - value_acc_round: 0.1818

  % delta_t_median)


  400/35156 [..............................] - ETA: 2:18:09 - loss: 0.8356 - policy_loss: 1.2916 - value_loss: 0.6836 - policy_acc: 0.6310 - value_acc_round: 0.1807

  % delta_t_median)


  496/35156 [..............................] - ETA: 2:16:25 - loss: 0.8311 - policy_loss: 1.2892 - value_loss: 0.6784 - policy_acc: 0.6321 - value_acc_round: 0.1816

  % delta_t_median)


  503/35156 [..............................] - ETA: 2:16:55 - loss: 0.8320 - policy_loss: 1.2902 - value_loss: 0.6793 - policy_acc: 0.6318 - value_acc_round: 0.1816

  % delta_t_median)
  % delta_t_median)


  682/35156 [..............................] - ETA: 2:15:43 - loss: 0.8323 - policy_loss: 1.2889 - value_loss: 0.6801 - policy_acc: 0.6318 - value_acc_round: 0.1808

  % delta_t_median)


  754/35156 [..............................] - ETA: 2:15:47 - loss: 0.8314 - policy_loss: 1.2836 - value_loss: 0.6807 - policy_acc: 0.6326 - value_acc_round: 0.1805

  % delta_t_median)


  959/35156 [..............................] - ETA: 2:14:08 - loss: 0.8298 - policy_loss: 1.2829 - value_loss: 0.6788 - policy_acc: 0.6321 - value_acc_round: 0.1816

  % delta_t_median)


 1259/35156 [>.............................] - ETA: 2:11:36 - loss: 0.8290 - policy_loss: 1.2725 - value_loss: 0.6811 - policy_acc: 0.6345 - value_acc_round: 0.1805

  % delta_t_median)


 1260/35156 [>.............................] - ETA: 2:11:42 - loss: 0.8290 - policy_loss: 1.2725 - value_loss: 0.6811 - policy_acc: 0.6345 - value_acc_round: 0.1805

  % delta_t_median)


 1402/35156 [>.............................] - ETA: 2:11:00 - loss: 0.8255 - policy_loss: 1.2673 - value_loss: 0.6783 - policy_acc: 0.6357 - value_acc_round: 0.1837

  % delta_t_median)


 1538/35156 [>.............................] - ETA: 2:10:34 - loss: 0.8254 - policy_loss: 1.2684 - value_loss: 0.6777 - policy_acc: 0.6356 - value_acc_round: 0.1850

  % delta_t_median)


 2327/35156 [>.............................] - ETA: 2:05:59 - loss: 0.8275 - policy_loss: 1.2699 - value_loss: 0.6800 - policy_acc: 0.6358 - value_acc_round: 0.1829

  % delta_t_median)


 2388/35156 [=>............................] - ETA: 2:05:41 - loss: 0.8277 - policy_loss: 1.2707 - value_loss: 0.6801 - policy_acc: 0.6356 - value_acc_round: 0.1828

  % delta_t_median)


 2564/35156 [=>............................] - ETA: 2:05:00 - loss: 0.8273 - policy_loss: 1.2724 - value_loss: 0.6790 - policy_acc: 0.6353 - value_acc_round: 0.1838

  % delta_t_median)


 3050/35156 [=>............................] - ETA: 2:03:17 - loss: 0.8289 - policy_loss: 1.2706 - value_loss: 0.6817 - policy_acc: 0.6357 - value_acc_round: 0.1805

  % delta_t_median)


 3052/35156 [=>............................] - ETA: 2:03:15 - loss: 0.8289 - policy_loss: 1.2707 - value_loss: 0.6816 - policy_acc: 0.6356 - value_acc_round: 0.1805

  % delta_t_median)


 3338/35156 [=>............................] - ETA: 2:02:02 - loss: 0.8285 - policy_loss: 1.2733 - value_loss: 0.6803 - policy_acc: 0.6352 - value_acc_round: 0.1818

  % delta_t_median)


 3340/35156 [=>............................] - ETA: 2:02:03 - loss: 0.8285 - policy_loss: 1.2733 - value_loss: 0.6803 - policy_acc: 0.6351 - value_acc_round: 0.1818

  % delta_t_median)


 3548/35156 [==>...........................] - ETA: 2:01:17 - loss: 0.8281 - policy_loss: 1.2742 - value_loss: 0.6794 - policy_acc: 0.6348 - value_acc_round: 0.1829

  % delta_t_median)


 3663/35156 [==>...........................] - ETA: 2:01:04 - loss: 0.8289 - policy_loss: 1.2745 - value_loss: 0.6803 - policy_acc: 0.6348 - value_acc_round: 0.1828

  % delta_t_median)


 3787/35156 [==>...........................] - ETA: 2:00:30 - loss: 0.8286 - policy_loss: 1.2743 - value_loss: 0.6801 - policy_acc: 0.6349 - value_acc_round: 0.1828

  % delta_t_median)


 3834/35156 [==>...........................] - ETA: 2:00:28 - loss: 0.8289 - policy_loss: 1.2747 - value_loss: 0.6803 - policy_acc: 0.6349 - value_acc_round: 0.1826

  % delta_t_median)


 4026/35156 [==>...........................] - ETA: 2:00:05 - loss: 0.8291 - policy_loss: 1.2738 - value_loss: 0.6809 - policy_acc: 0.6351 - value_acc_round: 0.1817

  % delta_t_median)


 4030/35156 [==>...........................] - ETA: 2:00:06 - loss: 0.8291 - policy_loss: 1.2737 - value_loss: 0.6809 - policy_acc: 0.6351 - value_acc_round: 0.1817

  % delta_t_median)


 4249/35156 [==>...........................] - ETA: 1:59:21 - loss: 0.8284 - policy_loss: 1.2730 - value_loss: 0.6802 - policy_acc: 0.6354 - value_acc_round: 0.1826

  % delta_t_median)


 4341/35156 [==>...........................] - ETA: 1:59:13 - loss: 0.8281 - policy_loss: 1.2720 - value_loss: 0.6802 - policy_acc: 0.6356 - value_acc_round: 0.1826

  % delta_t_median)


 4640/35156 [==>...........................] - ETA: 1:57:55 - loss: 0.8279 - policy_loss: 1.2723 - value_loss: 0.6798 - policy_acc: 0.6355 - value_acc_round: 0.1829

  % delta_t_median)


 4645/35156 [==>...........................] - ETA: 1:57:55 - loss: 0.8280 - policy_loss: 1.2724 - value_loss: 0.6798 - policy_acc: 0.6355 - value_acc_round: 0.1829

  % delta_t_median)


 4842/35156 [===>..........................] - ETA: 1:57:14 - loss: 0.8283 - policy_loss: 1.2731 - value_loss: 0.6800 - policy_acc: 0.6355 - value_acc_round: 0.1833

  % delta_t_median)


 5041/35156 [===>..........................] - ETA: 1:56:33 - loss: 0.8288 - policy_loss: 1.2720 - value_loss: 0.6810 - policy_acc: 0.6357 - value_acc_round: 0.1822

  % delta_t_median)


 5045/35156 [===>..........................] - ETA: 1:56:33 - loss: 0.8287 - policy_loss: 1.2719 - value_loss: 0.6810 - policy_acc: 0.6357 - value_acc_round: 0.1821

  % delta_t_median)


 5318/35156 [===>..........................] - ETA: 1:55:37 - loss: 0.8284 - policy_loss: 1.2712 - value_loss: 0.6808 - policy_acc: 0.6358 - value_acc_round: 0.1823

  % delta_t_median)


 5320/35156 [===>..........................] - ETA: 1:55:37 - loss: 0.8284 - policy_loss: 1.2712 - value_loss: 0.6808 - policy_acc: 0.6358 - value_acc_round: 0.1823

  % delta_t_median)


 5778/35156 [===>..........................] - ETA: 1:53:28 - loss: 0.8286 - policy_loss: 1.2726 - value_loss: 0.6806 - policy_acc: 0.6355 - value_acc_round: 0.1825

  % delta_t_median)


 5781/35156 [===>..........................] - ETA: 1:53:29 - loss: 0.8286 - policy_loss: 1.2726 - value_loss: 0.6806 - policy_acc: 0.6355 - value_acc_round: 0.1826

  % delta_t_median)


 5883/35156 [====>.........................] - ETA: 1:53:03 - loss: 0.8290 - policy_loss: 1.2731 - value_loss: 0.6810 - policy_acc: 0.6355 - value_acc_round: 0.1825

  % delta_t_median)


 5889/35156 [====>.........................] - ETA: 1:53:02 - loss: 0.8291 - policy_loss: 1.2732 - value_loss: 0.6810 - policy_acc: 0.6354 - value_acc_round: 0.1825

  % delta_t_median)


 6021/35156 [====>.........................] - ETA: 1:52:40 - loss: 0.8293 - policy_loss: 1.2735 - value_loss: 0.6812 - policy_acc: 0.6353 - value_acc_round: 0.1823

  % delta_t_median)


 6022/35156 [====>.........................] - ETA: 1:52:40 - loss: 0.8293 - policy_loss: 1.2735 - value_loss: 0.6812 - policy_acc: 0.6353 - value_acc_round: 0.1823

  % delta_t_median)


 6023/35156 [====>.........................] - ETA: 1:52:41 - loss: 0.8293 - policy_loss: 1.2735 - value_loss: 0.6812 - policy_acc: 0.6353 - value_acc_round: 0.1823

  % delta_t_median)


 6026/35156 [====>.........................] - ETA: 1:52:40 - loss: 0.8293 - policy_loss: 1.2735 - value_loss: 0.6812 - policy_acc: 0.6353 - value_acc_round: 0.1822

  % delta_t_median)
  % delta_t_median)


 6112/35156 [====>.........................] - ETA: 1:52:17 - loss: 0.8294 - policy_loss: 1.2737 - value_loss: 0.6813 - policy_acc: 0.6353 - value_acc_round: 0.1821

  % delta_t_median)


 6115/35156 [====>.........................] - ETA: 1:52:17 - loss: 0.8294 - policy_loss: 1.2736 - value_loss: 0.6814 - policy_acc: 0.6353 - value_acc_round: 0.1821

  % delta_t_median)


 6315/35156 [====>.........................] - ETA: 1:51:38 - loss: 0.8299 - policy_loss: 1.2742 - value_loss: 0.6818 - policy_acc: 0.6351 - value_acc_round: 0.1814

  % delta_t_median)


 6583/35156 [====>.........................] - ETA: 1:50:37 - loss: 0.8295 - policy_loss: 1.2731 - value_loss: 0.6816 - policy_acc: 0.6352 - value_acc_round: 0.1813

  % delta_t_median)


 7072/35156 [=====>........................] - ETA: 1:48:47 - loss: 0.8289 - policy_loss: 1.2720 - value_loss: 0.6812 - policy_acc: 0.6355 - value_acc_round: 0.1818

  % delta_t_median)


 7167/35156 [=====>........................] - ETA: 1:48:21 - loss: 0.8288 - policy_loss: 1.2723 - value_loss: 0.6810 - policy_acc: 0.6354 - value_acc_round: 0.1822 ETA: 1:48:28 - loss: 0.8289 - policy_loss: 1.2720

  % delta_t_median)


 7300/35156 [=====>........................] - ETA: 1:47:52 - loss: 0.8295 - policy_loss: 1.2733 - value_loss: 0.6815 - policy_acc: 0.6351 - value_acc_round: 0.1821

  % delta_t_median)


 7332/35156 [=====>........................] - ETA: 1:47:50 - loss: 0.8296 - policy_loss: 1.2734 - value_loss: 0.6816 - policy_acc: 0.6352 - value_acc_round: 0.1819

  % delta_t_median)


 7334/35156 [=====>........................] - ETA: 1:47:50 - loss: 0.8296 - policy_loss: 1.2734 - value_loss: 0.6817 - policy_acc: 0.6352 - value_acc_round: 0.1819

  % delta_t_median)


 7335/35156 [=====>........................] - ETA: 1:47:51 - loss: 0.8296 - policy_loss: 1.2734 - value_loss: 0.6817 - policy_acc: 0.6352 - value_acc_round: 0.1819

  % delta_t_median)


 7337/35156 [=====>........................] - ETA: 1:47:51 - loss: 0.8296 - policy_loss: 1.2734 - value_loss: 0.6817 - policy_acc: 0.6352 - value_acc_round: 0.1818

  % delta_t_median)


 7340/35156 [=====>........................] - ETA: 1:47:50 - loss: 0.8296 - policy_loss: 1.2734 - value_loss: 0.6817 - policy_acc: 0.6352 - value_acc_round: 0.1818

  % delta_t_median)


 7746/35156 [=====>........................] - ETA: 1:46:13 - loss: 0.8298 - policy_loss: 1.2730 - value_loss: 0.6821 - policy_acc: 0.6352 - value_acc_round: 0.1808

  % delta_t_median)


 7903/35156 [=====>........................] - ETA: 1:45:40 - loss: 0.8298 - policy_loss: 1.2723 - value_loss: 0.6823 - policy_acc: 0.6354 - value_acc_round: 0.1803

  % delta_t_median)


 7905/35156 [=====>........................] - ETA: 1:45:40 - loss: 0.8298 - policy_loss: 1.2723 - value_loss: 0.6823 - policy_acc: 0.6354 - value_acc_round: 0.1803

  % delta_t_median)


 7909/35156 [=====>........................] - ETA: 1:45:40 - loss: 0.8298 - policy_loss: 1.2723 - value_loss: 0.6823 - policy_acc: 0.6355 - value_acc_round: 0.1803

  % delta_t_median)


 7942/35156 [=====>........................] - ETA: 1:45:33 - loss: 0.8296 - policy_loss: 1.2721 - value_loss: 0.6821 - policy_acc: 0.6355 - value_acc_round: 0.1804

  % delta_t_median)


 7986/35156 [=====>........................] - ETA: 1:45:24 - loss: 0.8295 - policy_loss: 1.2716 - value_loss: 0.6821 - policy_acc: 0.6356 - value_acc_round: 0.1804

  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)
  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)
  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)
  % delta_t_median)




  % delta_t_median)




  % delta_t_median)
  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)
  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




  % delta_t_median)




In [None]:
# model.save('models\\BughouseNet220620190437.h5')
history = model.fit_generator(generator(batch_size,len(train_ids),path=dataset_path), steps_per_epoch=int((len(train_ids)*zip_length)/batch_size), callbacks=callbacks_list,
                    epochs=epochs, validation_data=(x_val, [policies_val,values_val]))


In [None]:
# model.save('models\\BughouseNet220620190437.h5')
history = model.fit_generator(generator(batch_size,len(train_ids),path=dataset_path), steps_per_epoch=int((len(train_ids)*zip_length)/batch_size), callbacks=callbacks_list,
                    epochs=epochs, validation_data=(x_val, [policies_val,values_val]))


In [None]:
# model.save('models\\BughouseNet220620190437.h5')
history = model.fit_generator(generator(batch_size,len(train_ids),path=dataset_path), steps_per_epoch=int((len(train_ids)*zip_length)/batch_size), callbacks=callbacks_list,
                    epochs=epochs, validation_data=(x_val, [policies_val,values_val]))


In [None]:
# model.save('models\\BughouseNet220620190437.h5')
history = model.fit_generator(generator(batch_size,len(train_ids),path=dataset_path), steps_per_epoch=int((len(train_ids)*zip_length)/batch_size), callbacks=callbacks_list,
                    epochs=epochs, validation_data=(x_val, [policies_val,values_val]))


In [None]:
# model.save('models\\BughouseNet220620190437.h5')
history = model.fit_generator(generator(batch_size,len(train_ids),path=dataset_path), steps_per_epoch=int((len(train_ids)*zip_length)/batch_size), callbacks=callbacks_list,
                    epochs=epochs, validation_data=(x_val, [policies_val,values_val]))


In [None]:
# model.save('models\\BughouseNet220620190437.h5')
history = model.fit_generator(generator(batch_size,len(train_ids),path=dataset_path), steps_per_epoch=int((len(train_ids)*zip_length)/batch_size), callbacks=callbacks_list,
                    epochs=epochs, validation_data=(x_val, [policies_val,values_val]))


In [None]:
plotHistory(history)


<h3>MNist overfitting</h3>

In [None]:
def getResidualNetwork(input_shape):
    
    channel_pos = 'channels_first'
    inp_shape = Input(input_shape,name='input1')
    x = Conv2D(256, kernel_size=(3,3), padding = 'same', input_shape=input_shape,data_format=channel_pos,name='conv2d_1')(inp_shape)
    x = BatchNormalization(axis=1,name='batch_normalization_1')(x)
    x_a1 = Activation('relu',name='activation_1')(x)

    x = Conv2D(256, kernel_size=(3,3),name ='conv2d_2' ,padding = 'same',data_format=channel_pos)(x_a1)
    x = BatchNormalization(axis=1, name = 'batch_normalization_2')(x)
    x = Activation('relu',name = 'activation_2')(x)
    x = Conv2D(256, kernel_size=(3,3), name = 'conv2d_3',padding = 'same',data_format=channel_pos)(x)
    x = BatchNormalization(axis=1, name = 'batch_normalization_3')(x)

    x = keras.layers.add([x,x_a1],name='add1')
    x_a2 = Activation('relu',name='activation_3')(x)
    x = Conv2D(256, kernel_size=(3,3),name = 'conv2d_4', padding = 'same',data_format=channel_pos)(x_a2)
    x = BatchNormalization(axis=1,name = 'batch_normalization_4')(x)
    x = Activation('relu',name='activation_4')(x)
    x = Conv2D(256, kernel_size=(3,3), name='conv2d_5',padding = 'same',data_format=channel_pos)(x)
    x = BatchNormalization(axis=1,name='batch_normalization_5')(x)

    x = keras.layers.add([x,x_a2],name='add_2')
    x_a3 = Activation('relu',name='activation_5')(x)
    x = Conv2D(256, kernel_size=(3,3),name='conv2d_6', padding = 'same',data_format=channel_pos)(x_a3)
    x = BatchNormalization(axis=1,name='batch_normalization_6')(x)
    x = Activation('relu',name='activation_6')(x)
    x = Conv2D(256, kernel_size=(3,3), name='conv2d_7',padding = 'same',data_format=channel_pos)(x)
    x = BatchNormalization(axis=1,name='batch_normalization_7')(x)

    x = keras.layers.add([x,x_a3],name='add_3')
    x_a4 = Activation('relu',name='activation_7')(x)
    x = Conv2D(256, kernel_size=(3,3), name = 'conv2d_8',padding = 'same',data_format=channel_pos)(x_a4)
    x = BatchNormalization(axis=1,name='batch_normalization_8')(x)
    x = Activation('relu',name='activation_8')(x)
    x = Conv2D(256, kernel_size=(3,3), name='conv2d_9',padding = 'same',data_format=channel_pos)(x)
    x = BatchNormalization(axis=1,name='batch_normalization_9')(x)

    x = keras.layers.add([x,x_a4],name='add4')
    x_a5 = Activation('relu',name='activation_9')(x)
    x = Conv2D(256, kernel_size=(3,3),name='conv2d_10', padding = 'same',data_format=channel_pos)(x_a5)
    x = BatchNormalization(axis=1,name='batch_normalization_10')(x)
    x = Activation('relu',name='activation_10')(x)
    x = Conv2D(256, kernel_size=(3,3),name='conv2d_11', padding = 'same',data_format=channel_pos)(x)
    x = BatchNormalization(axis=1,name='batch_normalization_11')(x)

    x = keras.layers.add([x,x_a5],name='add_5')
    x_a6 = Activation('relu',name='activation_11')(x)
    x = Conv2D(256, kernel_size=(3,3), name='conv2d_12',padding = 'same',data_format=channel_pos)(x_a6)
    x = BatchNormalization(axis=1,name='batch_normalization_12')(x)
    x = Activation('relu',name='activation_12')(x)
    x = Conv2D(256, kernel_size=(3,3), name='conv2d_13',padding = 'same',data_format=channel_pos)(x)
    x = BatchNormalization(axis=1,name='batch_normalization_13')(x)

    x = keras.layers.add([x,x_a6],name='add6')
    x_a7 = Activation('relu',name='activation_13')(x)
    x = Conv2D(256, kernel_size=(3,3), name='conv2d_14',padding = 'same',data_format=channel_pos)(x_a7)
    x = BatchNormalization(axis=1,name='batch_normalization_14')(x)
    x = Activation('relu',name='activation_14')(x)
    x = Conv2D(256, kernel_size=(3,3), name='conv2d_15',padding = 'same',data_format=channel_pos)(x)
    x = BatchNormalization(axis=1,name='batch_normalization_15')(x)

    x = keras.layers.add([x,x_a7],name='add_7')
    x_a8 = Activation('relu',name='activation_15')(x)
    x = Conv2D(1, kernel_size=(1,1),name='conv2d_17', padding = 'same',data_format=channel_pos)(x_a8)
    xb = BatchNormalization(axis=1,name='batch_normalization_17')(x)
    xConv = Conv2D(8, kernel_size=(7,7), padding = 'same',name='conv2d_16',data_format=channel_pos)(x_a8)
    xA = Activation('relu',name='activation_17')(xb)
    xb = BatchNormalization(axis=1,name='batch_normalization_16')(xConv)
    xF = Flatten(name='flatten_2')(xA)
    xA = Activation('relu',name='activation_16')(xb)

    dense_1 = Dense(256, activation='relu',name='dense_1')(xF)
    xF = Flatten(name='flatten_1')(xA)

    value = Dense(1, activation='tanh', name='value')(dense_1)
    policy = Dense(10, activation='softmax', name='policy')(xF)

    from keras.models import Model
    model = Model(inp_shape, [policy])

    model.summary()
    return model

In [None]:
from keras.datasets import mnist
img_rows, img_cols = 28, 28
num_classes = 10
(x_train, y_train), (x_test, y_test) = mnist.load_data()
x_train = x_train.reshape(x_train.shape[0], img_rows, img_cols, 1)
x_test = x_test.reshape(x_test.shape[0], img_rows, img_cols, 1)
input_shape = (img_rows, img_cols, 1)
x_train = x_train.astype('float32')
x_test = x_test.astype('float32')
x_train /= 255
x_test /= 255
y_train = keras.utils.to_categorical(y_train, num_classes)
y_test = keras.utils.to_categorical(y_test, num_classes)

In [None]:
from  LearningRateScheduler import *
data_len = len(x_train)
epochs = 20
batch_len = epochs * int(data_len/ (batch_size))
max_lr = 0.001*8
total_it = batch_len
min_lr = 0.0001
print('BatchLen: ', batch_len, ' - DataLen: ', data_len)
lr_schedule = OneCycleSchedule(start_lr=max_lr/8, max_lr=max_lr, cycle_length=total_it*.4, cooldown_length=total_it*.6, finish_lr=min_lr)
scheduler = LinearWarmUp(lr_schedule, start_lr=min_lr, length=total_it/30)
bt = BatchLearningRateScheduler(scheduler)

In [None]:
model = getResidualNetwork(input_shape)
sgd = optimizers.SGD(lr=0.000, momentum=0.9, decay=0.0, nesterov=False)

def acc_reg(y_true,y_pred):
    return K.constant(1) - K.square(K.mean((y_pred-y_true), axis=1))
callbacks_list = [bt]

model.compile(loss=['categorical_crossentropy'], optimizer=sgd,
              metrics=['accuracy'])
# model.fit(x_train, y_train,
#           batch_size=batch_size,
#           epochs=epochs,
#           verbose=1,
#           validation_data=(x_test, y_test),
#          callbacks=callbacks_list)
