In [1]:
# Third-party `shutup` helper. NOTE(review): presumably this silences Python
# warnings for the rest of the session -- confirm against the package docs.
import shutup
shutup.please()

In [34]:
import gfootball.env as football_env
import numpy as np

import gym
import copy
import tensorflow as tf

from keras.callbacks import TensorBoard
from keras.layers import Input, Dense, Conv1D,Conv2D, MaxPooling2D,MaxPooling1D, LSTM, Flatten
from keras.models import Model
from tensorflow.keras.optimizers import Adam
from keras import backend as K
from keras.applications.mobilenet_v2 import MobileNetV2
from tensorflow.python.framework.ops import disable_eager_execution

# Switch TensorFlow to graph mode before any model is built below.
disable_eager_execution()

# --- PPO hyperparameters ---------------------------------------------------
# clipping_val: clip range read by both ppo_loss and critic_PPO2_loss.
clipping_val = 0.2
# critic_discount: not read by any function visible in this notebook.
critic_discount = 0.5
# entropy_beta: weight applied to the entropy term inside ppo_loss.
entropy_beta = 0.001
# gamma / lmbda: discount and GAE factors read by get_advantages.
gamma = 0.99
lmbda = 0.95


# --- Environment and derived shapes ----------------------------------------
env = gym.make('CartPole-v1')
    
state = env.reset()
state_dims = env.observation_space.shape

# Aliases of the observation shape / action count used by the functions below.
state_size = state_dims
n_actions = env.action_space.n
action_space = n_actions
input_shape = env.observation_space.shape

# Placeholder arrays; within this notebook they are only referenced by test_reward.
dummy_n = np.zeros((1, 1, n_actions))
dummy_1 = np.zeros((1, 1, 1))

# TensorBoard callback passed to both fit() calls in replay().
tensor_board = TensorBoard(log_dir='./logs/ppo')


# --- Training-loop settings --------------------------------------------------
# target_reached, best_reward, iters, max_iters and replay_count are not read by
# any function visible in this notebook.
target_reached = False
best_reward = 0
iters = 0
max_iters = 50
# Number of environment steps collected by run_batch before each replay() call.
training_batch=1000
# NOTE: run_batch defines its own local `episode`, so this global is not updated there.
episode = 0
replay_count = 0
# shuffle / epochs are forwarded to actor.fit and critic.fit in replay().
shuffle = False
epochs = 10



def get_advantages(values, masks, rewards):
    """Compute GAE-style returns and normalised advantages for one rollout.

    Reads the module-level ``gamma`` and ``lmbda`` factors.

    Args:
        values: value estimates; indexed up to ``len(rewards)``, so it must hold
            one more entry than ``rewards``.
        masks: per-step multipliers applied to the bootstrap and carry terms.
        rewards: per-step rewards.

    Returns:
        A tuple ``(returns, advantages)`` where ``returns`` is a list ordered
        from the first step to the last and ``advantages`` is
        ``returns - values[:-1]`` standardised to zero mean / unit std.
    """
    backward_returns = []
    running_gae = 0
    step = len(rewards) - 1
    # Walk the rollout from the last step to the first, carrying the running GAE.
    while step >= 0:
        td_error = rewards[step] + gamma * values[step + 1] * masks[step] - values[step]
        running_gae = td_error + gamma * lmbda * masks[step] * running_gae
        backward_returns.append(running_gae + values[step])
        step -= 1

    # Collected back-to-front; flip once so index 0 is the first step.
    returns = backward_returns[::-1]

    advantages = np.array(returns) - values[:-1]
    normalised = (advantages - np.mean(advantages)) / (np.std(advantages) + 1e-10)
    return returns, normalised

def critic_PPO2_loss(values):
    """Create a clipped value loss bound to the given reference ``values``.

    Args:
        values: tensor of reference value estimates that the new prediction is
            clipped around (the critic model passes its ``old_values`` input).

    Returns:
        A Keras-style ``loss(y_true, y_pred)`` function.
    """
    def loss(y_true, y_pred):
        clip_range = clipping_val
        # Prediction limited to at most clip_range away from the reference values.
        bounded_pred = values + K.clip(y_pred - values, -clip_range, clip_range)
        squared_err_bounded = (y_true - bounded_pred) ** 2
        squared_err_raw = (y_true - y_pred) ** 2

        # Element-wise larger of the two squared errors, averaged and halved.
        # (Unclipped alternative: K.mean((y_true - y_pred) ** 2).)
        return 0.5 * K.mean(K.maximum(squared_err_bounded, squared_err_raw))
    return loss

def ppo_loss(y_true, y_pred):
    """Clipped-surrogate PPO actor loss (https://arxiv.org/abs/1707.06347).

    ``y_true`` is a packed tensor whose columns are, in order: one advantage
    column, ``action_space`` columns holding the action probabilities recorded
    at collection time, and the remaining columns holding the one-hot action
    taken. ``y_pred`` is the current policy output.

    Returns:
        Scalar tensor: negative clipped surrogate minus the weighted entropy term.
    """
    clip_eps = clipping_val
    entropy_coef = entropy_beta

    # Unpack the three column groups packed into y_true.
    picks_end = 1 + action_space
    advantages = y_true[:, :1]
    prediction_picks = y_true[:, 1:picks_end]
    actions = y_true[:, picks_end:]

    # Mask both distributions with the one-hot action, then keep them inside
    # [1e-10, 1] so the logarithms below stay finite.
    new_prob = K.clip(actions * y_pred, 1e-10, 1.0)
    old_prob = K.clip(actions * prediction_picks, 1e-10, 1.0)

    ratio = K.exp(K.log(new_prob) - K.log(old_prob))

    unclipped = ratio * advantages
    clipped = K.clip(ratio, min_value=1 - clip_eps, max_value=1 + clip_eps) * advantages
    actor_loss = -K.mean(K.minimum(unclipped, clipped))

    entropy_terms = -(y_pred * K.log(y_pred + 1e-10))
    entropy_bonus = entropy_coef * K.mean(entropy_terms)

    return actor_loss - entropy_bonus

def get_common_layer(X_input, model="MLP"):
    """Stack a feature-extraction trunk on ``X_input`` and return its output tensor.

    Args:
        X_input: Keras tensor to build on.
        model: ``"CNN"`` for two Conv1D/MaxPooling1D stages followed by Flatten,
            ``"LSTM"`` for two stacked LSTM layers (512 then 256 units); any
            other value selects Flatten followed by a 512-unit ReLU Dense layer.

    Returns:
        The output tensor of the selected trunk.
    """
    if model == "CNN":
        features = Conv1D(filters=64, kernel_size=6, padding="same", activation="tanh")(X_input)
        features = MaxPooling1D(pool_size=2)(features)
        features = Conv1D(filters=32, kernel_size=3, padding="same", activation="tanh")(features)
        features = MaxPooling1D(pool_size=2)(features)
        return Flatten()(features)

    if model == "LSTM":
        sequence = LSTM(512, return_sequences=True)(X_input)
        return LSTM(256)(sequence)

    # Default: plain dense trunk.
    flat = Flatten()(X_input)
    return Dense(512, activation="relu")(flat)

def get_model_actor_simple(input_shape=input_shape, n_actions=n_actions):
    """Build and compile the actor (policy) network.

    The network is a 512-256-64 ReLU dense stack fed directly from the input,
    followed by a softmax over ``n_actions``. It is compiled with ``ppo_loss``
    and Adam at a learning rate of 0.00025.

    Args:
        input_shape: shape of a single observation (without the batch axis).
        n_actions: number of discrete actions, i.e. the softmax width.

    Returns:
        The compiled Keras ``Model``.
    """
    X_input = Input(input_shape)

    # NOTE: the dense stack consumes X_input directly; get_common_layer() is not
    # part of this network, so it is not called here (calling it would only
    # create layers that never reach the model output).
    X = Dense(512, activation="relu", kernel_initializer=tf.random_normal_initializer(stddev=0.01))(X_input)
    X = Dense(256, activation="relu", kernel_initializer=tf.random_normal_initializer(stddev=0.01))(X)
    X = Dense(64, activation="relu", kernel_initializer=tf.random_normal_initializer(stddev=0.01))(X)
    output = Dense(n_actions, activation="softmax")(X)

    model = Model(inputs = X_input, outputs = output)
    # `learning_rate` is the supported keyword; `lr` is a deprecated alias that
    # newer Keras optimizers reject.
    model.compile(loss=ppo_loss, optimizer=Adam(learning_rate=0.00025))
    return model


def get_model_critic_simple(input_shape=input_shape):
    """Build and compile the critic (state-value) network.

    The model takes two inputs: the observation and a ``(1,)``-shaped tensor of
    reference values that is only consumed by the clipped loss
    (``critic_PPO2_loss``). The observation goes through a 512-256-64 ReLU dense
    stack and a linear single-unit head.

    Args:
        input_shape: shape of a single observation (without the batch axis).

    Returns:
        The compiled Keras ``Model`` with inputs ``[observation, old_values]``.
    """
    X_input = Input(input_shape)
    old_values = Input(shape=(1,))

    # NOTE: the dense stack consumes X_input directly; get_common_layer() is not
    # part of this network, so it is not called here (calling it would only
    # create layers that never reach the model output).
    V = Dense(512, activation="relu", kernel_initializer='he_uniform')(X_input)
    V = Dense(256, activation="relu", kernel_initializer='he_uniform')(V)
    V = Dense(64, activation="relu", kernel_initializer='he_uniform')(V)
    value = Dense(1, activation=None)(V)

    model = Model(inputs=[X_input, old_values], outputs = value)
    # `learning_rate` is the supported keyword; `lr` is a deprecated alias that
    # newer Keras optimizers reject.
    model.compile(loss=[critic_PPO2_loss(old_values)], optimizer=Adam(learning_rate=0.00025))
    return model
    
# Build both networks once at module level (actor first, then critic); the
# functions below use them through these global names.
actor, critic = get_model_actor_simple(), get_model_critic_simple()

def act(state):
    """Sample an action from the actor's predicted distribution.

    Example of the sampling step: with ``probabilities = [0.05, 0.85, 0.1]``,
    ``np.random.choice(3, p=probabilities)`` returns index 1 most of the time
    because it carries the highest probability.

    Args:
        state: batched observation passed straight to ``actor.predict``; only
            the first row of the prediction is used.

    Returns:
        ``(action, action_onehot, prediction)``: the sampled action index, its
        one-hot encoding of length ``n_actions``, and the probability vector it
        was sampled from.
    """
    probabilities = actor.predict(state)[0]
    chosen = np.random.choice(n_actions, p=probabilities)
    # Row `chosen` of the identity matrix is the one-hot vector for that action.
    one_hot = np.eye(n_actions)[chosen]
    return chosen, one_hot, probabilities

def discount_rewards(reward, gamma=0.99):
    """Return the standardised gamma-discounted returns of one episode.

    (GAE, see ``get_gaes``, is generally the better estimator.)

    Args:
        reward: sequence of per-step rewards. Integer and boolean inputs are
            promoted to float64 so the discounted sums are not truncated and
            the in-place normalisation does not hit an integer-casting error.
        gamma: discount rate applied per step (default 0.99).

    Returns:
        A float numpy array of the same length as ``reward`` holding the
        discounted returns, shifted to zero mean and divided by
        ``std + 1e-8``. An empty input yields an empty array.
    """
    rewards = np.asarray(reward)
    if not np.issubdtype(rewards.dtype, np.floating):
        # zeros_like would otherwise inherit an integer dtype from the input.
        rewards = rewards.astype(np.float64)

    discounted_r = np.zeros_like(rewards)
    if discounted_r.size == 0:
        # Nothing to discount; also avoids mean/std of an empty array.
        return discounted_r

    running_add = 0.0
    # Accumulate from the last step backwards: G_t = r_t + gamma * G_{t+1}.
    for i in reversed(range(len(rewards))):
        running_add = running_add * gamma + rewards[i]
        discounted_r[i] = running_add

    discounted_r -= np.mean(discounted_r)  # centre on zero
    discounted_r /= (np.std(discounted_r) + 1e-8)  # scale to unit variance
    return discounted_r

def get_gaes(rewards, dones, values, next_values, gamma = 0.99, lamda = 0.9, normalize=True):
    """Compute Generalised Advantage Estimates and value targets for a rollout.

    Args:
        rewards: per-step rewards.
        dones: per-step termination flags; a true flag removes both the
            bootstrap term and the carry from later steps.
        values: value estimates for each visited state.
        next_values: value estimates for each successor state.
        gamma: discount factor.
        lamda: GAE smoothing factor.
        normalize: when true, the returned advantages are standardised to zero
            mean / unit std (the targets are computed before that step).

    Returns:
        ``(advantages, targets)``, each stacked with ``np.vstack`` into a column.
    """
    # One-step TD errors, computed element by element.
    td_errors = []
    for reward, done, next_value, value in zip(rewards, dones, next_values, values):
        bootstrap = gamma * (1 - done) * next_value
        td_errors.append(reward + bootstrap - value)
    td_errors = np.stack(td_errors)

    # Backward recursion: each step adds the discounted advantage of its successor.
    advantages = td_errors.copy()
    for t in range(len(td_errors) - 2, -1, -1):
        carry = (1 - dones[t]) * gamma * lamda * advantages[t + 1]
        advantages[t] = advantages[t] + carry

    targets = advantages + values
    if normalize:
        advantages = (advantages - advantages.mean()) / (advantages.std() + 1e-8)
    return np.vstack(advantages), np.vstack(targets)

def test_reward(max_steps=20):
    """Run one greedy evaluation episode with the current actor.

    At every step the action with the highest predicted probability is taken.
    The episode stops when the environment reports ``done`` or once more than
    ``max_steps`` steps have been taken.

    Args:
        max_steps: step cap for the evaluation episode (default 20).

    Returns:
        The sum of rewards collected during the episode.
    """
    state = env.reset()
    done = False
    total_reward = 0

    steps = 0
    while not done:
        # The actor has a single observation input, so feed it a (1, obs_dim)
        # numpy batch rather than a backend tensor plus placeholder inputs.
        state_input = np.reshape(state, [1, state_size[0]])
        action_probs = actor.predict(state_input)[0]
        action = int(np.argmax(action_probs))
        state, reward, done, _ = env.step(action)
        total_reward += reward
        steps += 1
        if steps > max_steps:
            break
    print('testing...', total_reward)
    return total_reward

def critic_predict(state):
    """Return the critic's value prediction for a batch of states.

    The critic model has a second input that is only used by its training
    loss, so a zero column with one row per state is supplied for it here.
    """
    placeholder_old_values = np.zeros((state.shape[0], 1))
    return critic.predict([state, placeholder_old_values])

def replay(states, actions, rewards, predictions, dones, next_states):
    """Run one PPO update of the actor and critic on a collected batch.

    Args:
        states: list of visited observations (each stackable with ``np.vstack``).
        actions: list of one-hot encoded actions taken.
        rewards: list of per-step rewards.
        predictions: list of action-probability vectors recorded when acting.
        dones: list of per-step termination flags.
        next_states: list of successor observations.

    Side effects:
        Fits ``actor`` and ``critic`` for ``epochs`` epochs each (with the
        TensorBoard callback) and prints the mean loss of each fit.
    """
    # Reshape memory to the array shapes expected for training.
    states = np.vstack(states)
    next_states = np.vstack(next_states)
    actions = np.vstack(actions)
    predictions = np.vstack(predictions)

    # Critic estimates for the visited states and their successors.
    values = critic_predict(states)
    next_values = critic_predict(next_states)

    # Flatten to 1-D with reshape(-1) rather than squeeze(): squeeze would turn
    # a single-transition batch into a 0-d array that get_gaes cannot iterate.
    advantages, target = get_gaes(rewards, dones, np.reshape(values, -1), np.reshape(next_values, -1))

    # Pack advantages, recorded predictions and actions into y_true; the custom
    # PPO loss unpacks them again by column position.
    y_true = np.hstack([advantages, predictions, actions])

    # Train the actor, then the critic.
    print()

    a_loss = actor.fit(states, y_true, epochs=epochs, verbose=0, shuffle=shuffle,callbacks=[tensor_board])
    print('actor loss',np.mean(a_loss.history['loss']))
    print()

    # The critic receives its pre-update predictions as the second input, which
    # its clipped loss uses as the reference values.
    c_loss = critic.fit([states, values], target, epochs=epochs, verbose=0, shuffle=shuffle,callbacks=[tensor_board])
    print('critic loss',np.mean(c_loss.history['loss']))
    print()

def run_batch(max_episodes=1000):
    """Collect experience in fixed-size batches and train after each batch.

    Repeatedly gathers ``training_batch`` environment steps (episodes may span
    batch boundaries), calls ``replay`` on them, and stops after the first
    batch at whose end at least ``max_episodes`` episodes have finished. After
    every finished episode the mean score of the last 50 episodes is printed.

    Args:
        max_episodes: number of finished episodes after which training stops
            (default 1000).

    Side effects:
        Trains the global ``actor``/``critic`` via ``replay`` and closes ``env``
        when the loop ends, including when it ends with an exception.
    """
    scores_ = []
    averages_ = []
    episode = 0
    score = 0
    state = np.reshape(env.reset(), [1, state_size[0]])
    try:
        while True:
            # Fresh rollout memory for this batch.
            states, next_states, actions, rewards, predictions, dones = [], [], [], [], [], []
            for _step in range(training_batch):
                # Actor picks an action.
                action, action_onehot, prediction = act(state)
                # Advance the environment and bring the new observation to (1, obs_dim).
                next_state, reward, done, _ = env.step(action)
                next_state = np.reshape(next_state, [1, state_size[0]])
                # Memorise the transition for training.
                states.append(state)
                next_states.append(next_state)
                actions.append(action_onehot)
                rewards.append(reward)
                dones.append(done)
                predictions.append(prediction)
                # Move on to the next state.
                state = next_state
                score += reward
                if done:
                    episode += 1
                    scores_.append(score)
                    recent_scores = scores_[-50:]
                    averages_.append(sum(recent_scores) / len(recent_scores))

                    print('score', averages_[-1])

                    # Start a new episode.
                    score = 0
                    state = np.reshape(env.reset(), [1, state_size[0]])

            replay(states, actions, rewards, predictions, dones, next_states)
            if episode >= max_episodes:
                break
    finally:
        # Release the environment even if acting or training raised.
        env.close()




In [None]:

run_batch() # train with PPO; the networks are updated after every batch of training_batch environment steps

score 22.0
score 16.5
score 16.666666666666668
score 20.75
score 19.0
score 19.166666666666668
score 18.0
score 18.5
score 17.666666666666668
score 17.2
score 16.818181818181817
score 16.916666666666668
score 16.615384615384617
score 17.071428571428573
score 16.666666666666668
score 16.5
score 16.058823529411764
score 16.22222222222222
score 16.157894736842106
score 15.95
score 15.904761904761905
score 15.818181818181818
score 19.304347826086957
score 19.666666666666668
score 19.68
score 19.807692307692307
score 19.555555555555557
score 19.857142857142858
score 19.482758620689655
score 19.533333333333335
score 20.161290322580644
score 20.03125
score 19.87878787878788
score 21.205882352941178
score 20.857142857142858
score 20.75
score 20.64864864864865
score 20.55263157894737
score 21.28205128205128
score 21.1
score 21.341463414634145
score 21.547619047619047
score 21.41860465116279
score 21.568181818181817

actor loss -0.0016584679361432788

critic loss 21.133027598190306

score 22.422

score 142.94
score 142.48
score 141.64
score 141.08

actor loss -0.0031194844007492064

critic loss 8.526541491037609

score 140.78
score 140.6
score 140.18
score 140.64
score 140.72
score 140.54
score 139.86
score 138.6

actor loss -0.0007027521863579753

critic loss 6.278349852490425

score 138.46
score 138.44
score 138.08
score 138.04
score 137.4
score 136.68
score 135.44

actor loss -0.0025336498111486433

critic loss 20.23406697661877

score 135.68
score 135.58
score 135.72
score 135.44
score 135.82
score 135.06
score 135.48
score 134.64

actor loss -0.008172056594491005

critic loss 3.3590894218683247

score 134.14
score 133.58
score 133.34
score 133.04
score 132.68
score 132.04
score 131.02
score 130.92
score 129.94

actor loss -0.00865372121334076

critic loss 49.75200191123486

score 129.5
score 128.66
score 128.26
score 127.14
score 126.14
score 124.98
score 124.48
score 123.64
score 123.4

actor loss -0.003534095054864883

critic loss 34.85055758814811

score 123.3
score 122

score 367.92
score 367.58

actor loss -0.0018830804228782655

critic loss 139.94803047971726

score 368.44
score 367.5
score 364.52

actor loss 0.0020881664514541625

critic loss 131.60276443000436

score 368.36
score 369.48

actor loss -0.004473009253293276

critic loss 91.05802854450943

score 364.58
score 369.38
score 370.3

actor loss -3.712711334228516e-05

critic loss 83.91595963530987

score 370.86
score 368.84
score 370.52

actor loss -0.0038650727480649947

critic loss 79.05908633623125

score 364.64
score 363.54
score 362.4
score 362.6

actor loss -0.002189671993255615

critic loss 97.13642079784869

score 363.68
score 364.68
score 364.12

actor loss -0.006671660780906677

critic loss 84.1121640732646

score 364.12
score 360.98
score 361.78
score 362.36

actor loss -0.0037179814934730528

critic loss 79.55639806842804

score 362.62
score 362.02
score 361.78
score 363.04

actor loss -0.0024706852436065675

critic loss 103.04260359373093

score 358.58
score 355.78
score 351.24


score 401.7

actor loss -0.0026535153150558472

critic loss 33.28965921661853

score 401.7
score 401.7

actor loss -0.0017482802867889405

critic loss 41.86966042024493

score 401.7
score 397.72
score 397.72

actor loss -0.001552948033809662

critic loss 61.0050327560842

score 397.72
score 397.4

actor loss -0.003146198892593384

critic loss 58.43068617315292

score 397.4
score 397.4

actor loss 0.0010809835910797119

critic loss 36.91078734451532

score 398.08
score 398.04

actor loss 0.004655255311727523

critic loss 31.779465228694676

score 404.32
score 412.98

actor loss -0.00041780083179473874

critic loss 42.733370646262166

score 414.52
score 421.72

actor loss -0.0005004757106304169

critic loss 31.26929396984279

score 428.32
score 428.32

actor loss 0.0024935048937797548

critic loss 32.99928391034604

score 432.14
score 438.84

actor loss 0.0007823324203491209

critic loss 27.62625260273814

score 444.56
score 452.14

actor loss -0.0030504965066909793

critic loss 43.53898

score 469.84
score 469.84

actor loss -0.0018926313042640682

critic loss 40.4808507761836

score 469.84
score 469.84

actor loss -0.0022264891982078554

critic loss 35.04263538583517

score 469.84
score 464.64
score 473.48

actor loss -0.0074492763496935375

critic loss 25.53460564289093

score 477.0
score 482.66

actor loss -0.0010593824863433837

critic loss 37.28631306410134

score 482.66
score 483.22

actor loss -0.0041416301131248475

critic loss 23.6831524086535

score 483.36
score 483.36

actor loss -0.002410341024398803

critic loss 40.3406124973774

score 483.36
score 483.36

actor loss -0.0017510461688041688

critic loss 38.12033094628454

score 485.04
score 488.36

actor loss -0.002575196921825409

critic loss 38.92620246116519

score 488.36
score 488.36

actor loss -0.0017356985211372372

critic loss 41.7099525170058

score 488.96
score 488.96

actor loss -0.00018987144231796265

critic loss 45.07480864146501

score 489.7
score 489.7

actor loss -0.0015384427547454835

cri


actor loss -0.004719487199187279

critic loss 30.888550867570938

score 445.64
score 452.08

actor loss -0.004340596759319306

critic loss 35.36772888279408

score 453.56
score 453.56
score 448.7

actor loss -0.0028575590372085574

critic loss 49.86830022912324

score 446.74
score 445.42

actor loss -0.005386204168200494

critic loss 23.710773424386975

score 445.42
score 442.2

actor loss -0.004239662981033325

critic loss 27.018176290261742

score 444.18
score 444.18

actor loss -0.0025392142057418824

critic loss 26.61331457709074

score 444.18
score 446.42

actor loss -0.0017459713397547604

critic loss 20.885608780777453

score 446.42
score 446.42

actor loss -0.0020905699610710145

critic loss 31.21387576345205

score 445.76
score 445.76

actor loss -0.002479601639509201

critic loss 27.006513175743816

score 445.76
score 445.76

actor loss -0.004159130923449993

critic loss 23.183049196660516

score 445.76
score 447.24

actor loss -0.003315871512889862

critic loss 36.683840590

score 454.78
score 445.62
score 439.1
score 429.88
score 421.76
score 415.42
score 408.0
score 401.04

actor loss -0.0022913029909133915

critic loss 178.60746600289343

score 391.98
score 382.74
score 373.62
score 373.5

actor loss -0.011169262075424194

critic loss 85.15146347223519

score 380.72
score 377.46
score 375.64

actor loss -0.002835906136035919

critic loss 63.30974142723083

score 381.26
score 372.32
score 366.1
score 366.1

actor loss -0.00432683800458908

critic loss 86.56240324990154

score 362.24
score 362.24

actor loss -0.001932565796375275

critic loss 45.688611898386476

score 362.24
score 362.24

actor loss -0.002834998655319214

critic loss 46.33545242022872

score 362.24
score 362.24
score 352.62

actor loss -0.005934560906887054

critic loss 70.00754366548212

score 348.56
score 339.66
score 334.06
score 327.02
score 317.38
score 308.66
score 299.04
score 298.6
score 289.06
score 279.22
score 275.26
score 265.76

actor loss -0.013156449270248413

critic loss 2

critic loss 41.49698546408415

score 427.92
score 423.18

actor loss -0.0015084657549858092

critic loss 42.96923869848251

score 423.18
score 423.18

actor loss -0.004042971897125244

critic loss 41.645441392993924

score 423.18
score 423.18

actor loss -0.004758160960674286

critic loss 42.79375297679901

score 423.18
score 423.18
score 415.9
score 406.14

actor loss -0.0037142657876014706

critic loss 76.38426842310429

score 404.72
score 404.06

actor loss -0.004447483223676681

critic loss 30.665995873051884

score 404.06
score 404.06

actor loss -0.0018987581849098205

critic loss 39.753537738919256

score 409.28
score 416.64

actor loss -0.003998200023174286

critic loss 38.56373847126961

score 419.6
score 429.3
score 431.62

actor loss -0.004021390509605408

critic loss 54.20580075386763

score 439.88
score 435.96
score 438.48

actor loss -0.004784591317176819

critic loss 44.79602331574112

score 444.7
score 443.32

actor loss -0.004142441895604134

critic loss 27.38931222159

score 452.12

actor loss -0.003191373910754919

critic loss 42.66531719449759

score 452.12
score 460.7

actor loss -0.004730926162004471

critic loss 43.156245160627364

score 460.7
score 460.7

actor loss -0.004860478162765503

critic loss 43.124820226931575

score 465.36
score 465.36

actor loss -0.005336360919475555

critic loss 43.793477027177815

score 465.36
score 468.68
score 468.68

actor loss -0.006898675873875619

critic loss 69.24251815840006

score 465.16
score 460.28
score 468.9

actor loss -0.003112025284767151

critic loss 63.232122552990916

score 468.9
score 468.9

actor loss -0.0040072535634040835

critic loss 44.75491169807911

score 463.42
score 463.1

actor loss -0.003898132085800171

critic loss 39.773298810130356

score 465.28
score 465.28

actor loss -0.003167718893289566

critic loss 45.42920297600925

score 469.12
score 469.12

actor loss -0.005174249064922333

critic loss 43.59880429570675

score 469.12
score 469.12

actor loss -0.005807031285762787

critic 

score 451.16

actor loss -0.005651437538862229

critic loss 40.80849596469402

score 451.16
score 451.16

actor loss -0.005498487329483032

critic loss 41.59251427347958

score 451.16
score 451.16

actor loss -0.004237320023775101

critic loss 41.906254673826695

score 451.16
score 451.16

actor loss -0.0067684230983257295

critic loss 38.97384941877723

score 450.24
score 445.02
score 445.02

actor loss -0.0041243960738182065

critic loss 58.302001315930475

score 440.9
score 434.2
score 425.26
score 416.48
score 407.7
score 406.8
score 397.92
score 397.32
score 398.24
score 397.16
score 388.58
score 380.02
score 371.8
score 363.14

actor loss -0.0023982012778520577

critic loss 256.42479873660807

score 355.26
score 351.8
score 344.04
score 336.96

actor loss -0.0062317034423351285

critic loss 65.71805481573938

score 336.54
score 329.12
score 322.52
score 313.78
score 309.4

actor loss -0.008394197452068328

critic loss 78.3183374609202

score 306.5
score 302.92
score 299.32

actor

critic loss 43.058108100104334

score 329.8
score 338.86

actor loss -0.0042960664212703704

critic loss 43.36789315041899

score 347.56
score 356.9

actor loss -0.0012737714886665345

critic loss 42.634648708167674

score 366.32
score 373.34
score 374.54

actor loss -0.0014564395070075988

critic loss 60.945021883654604

score 378.68
score 383.88
score 384.26

actor loss -0.002213618338108063

critic loss 61.6669470997218

score 392.18
score 401.32

actor loss -0.0017152701973915101

critic loss 41.60976567620038

score 401.32
score 409.72

actor loss -0.002315362429618836

critic loss 39.32410244008154

score 410.36
score 419.46

actor loss -0.003342291092872619

critic loss 41.94353419212997

score 424.24
score 432.78

actor loss -0.005955500811338425

critic loss 39.75319858863055

score 432.78
score 432.78

actor loss -0.004690849101543426

critic loss 41.85047213431001

score 432.78
score 432.78

actor loss -0.004220232796669006

critic loss 41.04036319050043

score 438.24
score 

score 452.92
score 449.32

actor loss -0.003965691989660263

critic loss 40.94404454575777

score 449.32
score 449.32

actor loss -0.003759270870685577

critic loss 41.21626007761955

score 449.32
score 451.22
score 446.22

actor loss -0.005233035862445831

critic loss 59.217308320033545

score 450.82
score 450.82

actor loss -0.007435937201976775

critic loss 40.43888412679434

score 450.82
score 450.82

actor loss -0.005376025718450547

critic loss 40.83387209621071

score 448.02
score 440.16
score 438.68

actor loss -0.003446639680862426

critic loss 58.110132178366186

score 437.6
score 437.6

actor loss -0.002181817272305489

critic loss 39.049317888540024

score 437.6
score 437.6
score 430.4

actor loss -0.00283348183631897

critic loss 58.26772846068442

score 430.4
score 429.98
score 424.92

actor loss -0.003713098005717621

critic loss 57.740808490738274

score 424.92
score 424.92

actor loss -0.003710469532012939

critic loss 39.72437805047035

score 424.92
score 431.48

acto

critic loss 31.41546677230596

score 439.04
score 436.32
score 433.98

actor loss -0.0029936268568038936

critic loss 29.58490234547555

score 430.94
score 427.6

actor loss -0.0037935318171977996

critic loss 18.959121652910113

score 424.28
score 421.4
score 419.14

actor loss -0.00169414439201355

critic loss 21.422861874903738

score 416.22
score 412.42
score 410.76

actor loss -0.005524631178379059

critic loss 26.667754622589797

score 412.5
score 409.46
score 405.88

actor loss -0.00036966638565063485

critic loss 24.557595735312255

score 403.48
score 399.4
score 396.34

actor loss -0.0008232303977012632

critic loss 33.09517990336418

score 392.88
score 389.94
score 385.74

actor loss -0.0034513880610466006

critic loss 21.391099234306814

score 382.84
score 379.44
score 375.46

actor loss -0.004672389309108257

critic loss 17.478927109059693

score 372.02
score 368.16
score 364.04
score 364.0

actor loss -0.0055267248928546914

critic loss 25.503138171190024

score 367.06
sco

critic loss 42.38848741081952

score 463.36
score 467.88

actor loss -0.002477248048782349

critic loss 43.54224190317392

score 467.88
score 467.88

actor loss -0.003503403812646866

critic loss 42.898550997953855

score 470.58
score 475.02

actor loss -0.003602056330442429

critic loss 42.51184083299041

score 480.38
score 480.38

actor loss -0.0032718878209590913

critic loss 40.774335883784296

score 480.38
score 480.38

actor loss -0.004635785055160523

critic loss 42.00561425297856

score 480.38
score 480.38

actor loss -0.0037180033326148984

critic loss 41.613526727867125

score 480.38
score 480.38

actor loss -0.004514110767841339

critic loss 38.85813749902248

score 480.32
score 475.44
score 474.04

actor loss -0.005649753069877625

critic loss 43.10651928101181

score 475.88
score 485.62

actor loss -0.006230805277824401

critic loss 40.82137446403503

score 485.62
score 484.78

actor loss -0.0019903984069824217

critic loss 33.9258040353477

score 491.34
score 491.34

acto

critic loss 44.122323659935596

score 487.9
score 487.9

actor loss -0.008216602349281312

critic loss 41.03629850480259

score 487.9
score 487.9

actor loss -0.0078931081622839

critic loss 38.55142563689873

score 487.9
score 487.9

actor loss -0.003244603145122528

critic loss 39.45863276866824

score 487.9
score 487.9

actor loss -0.005190595924854278

critic loss 40.14874843548536

score 488.88
score 481.46
score 479.1
score 469.48

actor loss -0.003266705739498138

critic loss 87.74165617011786

score 469.24
score 469.24
score 461.76

actor loss -0.0005817892432212829

critic loss 65.09425892261862

score 461.76
score 459.72
score 451.88

actor loss -0.0016312856554985052

critic loss 61.9083398417756

score 451.88
score 451.88

actor loss -0.004967340883146971

critic loss 39.957415914058686

score 451.3
score 451.3

actor loss -0.0030818658173084263

critic loss 40.25087262686491

score 451.3
score 451.3

actor loss -0.004012030959129333

critic loss 44.1123703025937

score 446

score 471.1

actor loss -0.0028202076762914663

critic loss 27.697149546198553

score 471.1
score 471.1

actor loss -0.003948540306091308

critic loss 40.269988555216784

score 471.1
score 474.4

actor loss -0.004154890598356724

critic loss 41.96591339514852

score 474.78
score 474.78

actor loss -0.005236346399784088

critic loss 44.46223252966702

score 474.78
score 474.78

actor loss -0.006249177777767181

critic loss 41.74757364090942

score 474.78
score 479.18

actor loss -0.003983540797233582

critic loss 42.08330767046213

score 479.18
score 479.18

actor loss -0.004482112753391265

critic loss 45.65139442677349

score 479.18
score 479.18

actor loss -0.004626268577575683

critic loss 44.0028854991734

score 480.88
score 480.88
score 477.38

actor loss -0.003295356869697571

critic loss 63.88401552899778

score 477.38
score 472.88

actor loss -0.004975854909420013

critic loss 39.27122297576666

score 472.88
score 472.88

actor loss 8.402891159057617e-05

critic loss 40.0582694

critic loss 37.38849088466168

score 443.26
score 443.26

actor loss -0.0027286978185176855

critic loss 20.19748313258439

score 437.02
score 437.02
score 434.28

actor loss 0.00789618679434061

critic loss 30.987230160045623

score 435.48
score 435.48

actor loss -0.0010835671722888949

critic loss 27.579317712193728

score 435.48
score 435.48

actor loss -0.002226857178285718

critic loss 18.029659866987167

score 440.32
score 443.88

actor loss -0.005140532569214701

critic loss 22.47043762907162

score 448.14
score 446.6
score 447.48

actor loss -0.0054448771595954895

critic loss 25.200836782340705

score 451.48
score 448.56

actor loss -0.002768069413304329

critic loss 17.39638844574615

score 448.56
score 448.56

actor loss -0.0018760402739048006

critic loss 17.75372348955795

score 448.56
score 448.56

actor loss -0.002840978713473305

critic loss 20.365507944005728

score 456.26
score 456.26

actor loss -0.0068015736818313605

critic loss 18.146186459904907

score 457.44
sc

score 385.46

actor loss -4.6249258518219056e-05

critic loss 33.57486975981742

score 389.36
score 390.12

actor loss -0.005774826864898205

critic loss 20.967345146161318

score 391.6
score 385.06
score 390.0
score 385.72

actor loss -0.004787802483513952

critic loss 35.84990894652903

score 385.8
score 386.4

actor loss -0.0043646363615989685

critic loss 0.7650743801793084

score 381.44
score 371.66
score 369.2
score 372.88
score 369.62
score 364.8
score 361.46
score 353.94

actor loss -0.0120058198928833

critic loss 142.65743063649535

score 352.68
score 348.92
score 345.44
score 344.08
score 341.08
score 332.7

actor loss -0.012379825401306154

critic loss 101.42113698825837

score 332.7
score 336.06

actor loss -0.007296597017347813

critic loss 21.15347876005173

score 337.98
score 337.78

actor loss -0.004954336303472519

critic loss 19.299641656053065

score 340.04
score 340.32

actor loss 0.0004972738411277532

critic loss 22.689972087210414

score 344.6
score 341.84

acto

score 490.22

actor loss -0.0017192118644714354

critic loss 42.58970723838508

score 490.22
score 490.22

actor loss 0.0013455964326858521

critic loss 43.9769645753324

score 490.22
score 490.22

actor loss -0.002424483382701874

critic loss 41.86744325109721

score 490.22
score 490.22

actor loss -0.0005948546051979066

critic loss 42.23085872579738

score 490.22
score 490.22

actor loss -0.0009553586363792421

critic loss 47.38969684987068

score 490.22
score 490.22

actor loss -0.001027418005466461

critic loss 41.8304060264796

score 490.22
score 492.48

actor loss -0.002147184157371521

critic loss 42.323770453763004

score 493.38
score 495.24

actor loss -0.0014385684728622436

critic loss 43.10019578111768

score 495.24
score 495.24

actor loss -0.0030164661740884184

critic loss 41.49931102537512

score 495.24
score 495.24

actor loss -0.0013394294261932372

critic loss 41.517651214230064

score 495.24
score 495.24

actor loss 0.001247307002544403

critic loss 44.801948299252


actor loss 0.000537060105800629

critic loss 40.47487166995406

score 385.52
score 383.74
score 379.66
score 372.82

actor loss -0.00656105260848999

critic loss 30.429378473854065

score 372.82
score 372.82

actor loss -0.003993276071548461

critic loss 38.70761352171898

score 377.8
score 371.04

actor loss -0.0054404358625411995

critic loss 21.03575039542317

score 370.22
score 366.52
score 359.9
score 353.42

actor loss -0.007697459483146667

critic loss 20.81550432650372

score 353.42
score 347.92
score 345.0
score 341.62

actor loss -0.0066219211474061014

critic loss 28.272427034306524

score 341.06
score 339.52
score 336.82
score 338.46

actor loss -0.008716334056854248

critic loss 37.64892074693293

score 337.38
score 336.56
score 332.0
score 332.26

actor loss -0.012055282807350158

critic loss 25.648357951594885

score 339.28
score 339.28
score 333.18

actor loss -0.006094860923290253

critic loss 55.36115388317704

score 331.76
score 333.32

actor loss -0.006412425571866

score 463.82

actor loss -0.005367463234066964

critic loss 42.563201363015175

score 463.82
score 463.82

actor loss -0.00013780536986887455

critic loss 46.619231954079865

score 472.8
score 481.58

actor loss -0.007342383372783662

critic loss 44.29942628581524

score 481.58
score 481.58

actor loss -0.005256608289480209

critic loss 43.35204343931079

score 481.58
score 481.58

actor loss -0.006273972176015377

critic loss 42.8547455829978

score 481.58
score 481.58

actor loss -0.0058237189412117

critic loss 43.41438352923989

score 481.58
score 481.58

actor loss -0.008425304925441742

critic loss 40.96659262065292

score 481.58
score 481.58

actor loss -0.002069935470819473

critic loss 42.7230529865116

score 481.58
score 482.98

actor loss -0.004218030750751495

critic loss 42.64576726686954

score 482.98
score 482.98

actor loss -0.002226863944530487

critic loss 42.40406232635975

score 482.98
score 481.36
score 480.1

actor loss -0.005663033032417298

critic loss 62.071530

critic loss 36.77378851255178

score 460.32
score 465.5

actor loss -0.003911300814151765

critic loss 42.58832702271938

score 465.5
score 470.3

actor loss -0.0025816246688365936

critic loss 40.555002744430304

score 474.0
score 478.4

actor loss -0.008466890025138854

critic loss 33.64618252754509

score 478.4
score 481.56

actor loss -0.0022510609971359372

critic loss 35.75594286504984

score 484.74
score 489.18

actor loss -0.0018632492303848266

critic loss 39.77357286714315

score 491.26
score 495.5

actor loss -0.006947768664360046

critic loss 37.468574817585946

score 495.5
score 495.5

actor loss -0.0005908312082290648

critic loss 36.34696895354391

score 495.5
score 495.5

actor loss -0.003210654768720269

critic loss 35.581122967580704

score 495.5
score 495.5

actor loss -0.0041637756884098055

critic loss 35.17292100383044

score 495.5
score 495.5

actor loss -0.0028645818650722505

critic loss 33.72581583598852

score 495.5
score 495.5

actor loss -0.0004936044931411

score 361.58
score 357.54
score 356.56

actor loss -0.0002029047966003417

critic loss 72.47931898200662

score 352.14
score 354.84

actor loss -0.0036176965475082402

critic loss 52.76064877743721

score 352.18
score 354.08
score 356.86

actor loss -0.003719772469997406

critic loss 71.1988140088439

score 363.74
score 359.52
score 359.52

actor loss -0.005237530279159546

critic loss 71.16938564546406

score 354.24
score 348.82
score 343.96
score 339.3

actor loss -0.00068301512748003

critic loss 71.61006868714318

score 334.6
score 329.96
score 330.98
score 326.46

actor loss -0.005230438947677612

critic loss 54.05277774627954

score 329.48
score 324.22
score 319.54
score 318.14

actor loss -0.004184993296861649

critic loss 74.3621657537222

score 316.74
score 311.1
score 310.46

actor loss -0.009466211128234862

critic loss 65.85929501030445

score 311.28
score 314.22
score 308.88

actor loss -0.0009517278850078583

critic loss 54.83788061531186

score 307.48
score 304.68
score 

score 415.26
score 409.64
score 403.7

actor loss -0.0033724611520767208

critic loss 51.59086931439042

score 398.08
score 392.44
score 386.58
score 383.9
score 378.04

actor loss -0.0038271733760833746

critic loss 64.80777949721664

score 372.28
score 366.68
score 361.02
score 355.12

actor loss -0.001394885468482971

critic loss 53.6164313201964

score 355.12
score 349.28
score 343.36
score 337.42

actor loss -0.0030706999778747556

critic loss 47.48690839109421

score 337.1
score 331.2
score 325.3
score 319.48

actor loss -0.0005219918280839921

critic loss 43.389418044638624

score 319.48
score 313.5
score 308.0
score 302.12

actor loss -0.0017448536872863769

critic loss 42.09474811085463

score 302.12
score 296.82

actor loss -0.0021902382820844653

critic loss 31.713963029772042

score 297.36
score 297.36
score 297.72

actor loss -0.0012173068523406983

critic loss 47.992793238997464

score 291.98
score 292.48

actor loss -0.0013276207447052001

critic loss 21.78089982100129



critic loss 37.15234344925285

score 470.48
score 470.48

actor loss 0.025535429227352142

critic loss 37.130360344831644

score 470.48
score 470.48

actor loss -0.0006640777945518493

critic loss 40.360856830638646

score 476.82
score 476.82

actor loss 0.0006860924720764161

critic loss 37.64144561923742

score 476.82
score 476.82

actor loss -0.0011801067113876343

critic loss 39.75538889710009

score 476.82
score 476.82

actor loss 0.0024633681654930113

critic loss 36.83083394796998

score 476.82
score 476.82

actor loss 0.0010275945961475369

critic loss 38.45508456858396

score 476.82
score 476.82

actor loss 0.004196546110510826

critic loss 34.9363089869678

score 476.82
score 476.82

actor loss -0.0001760843634605408

critic loss 38.555936647912866

score 476.82
score 482.48

actor loss 0.003581132185459137

critic loss 38.049574351096155

score 488.68
score 488.68

actor loss -0.0005701646785251796

critic loss 36.87634986031354

score 488.68
score 488.68

actor loss -0.0019

score 419.08
score 421.26

actor loss -0.0019729859944432973

critic loss 27.174512031453105

score 423.68
score 426.28

actor loss -0.0023222474575042723

critic loss 23.211567491731046

score 429.24
score 432.36

actor loss -0.0051245410323143

critic loss 25.55386445836388

score 435.24
score 437.78

actor loss -0.0025641339257359503

critic loss 24.478199216218478

score 439.84
score 442.48

actor loss -0.001833795535564423

critic loss 22.346443982949857

score 445.1
score 447.6

actor loss -0.0026938736677169796

critic loss 26.112807381360977

score 451.64
score 453.7

actor loss -0.003208114993572235

critic loss 31.22013083376755

score 457.72
score 459.44

actor loss -0.007799643218517303

critic loss 31.263149953241644

score 462.76
score 465.14

actor loss -0.0046154725193977356

critic loss 27.491677883089704

score 466.02
score 469.74

actor loss 0.0013435251235961916

critic loss 28.42919887328651

score 471.42
score 474.6

actor loss 0.0017201572060585018

critic loss 2

score 496.92

actor loss 0.0009534182310104368

critic loss 27.714156738971177

score 497.18
score 498.04
score 496.88

actor loss 0.0032064831256866455

critic loss 40.373339801129696

score 496.18
score 494.14

actor loss -0.0018296448826789855

critic loss 17.545426748125628

score 492.86
score 489.68

actor loss -0.001465784138441086

critic loss 11.88931543787569

score 487.2
score 484.22
score 480.92

actor loss -0.00014520031213760396

critic loss 25.759095382872225

score 477.96
score 473.54
score 473.44

actor loss -0.0014936651229858402

critic loss 29.726445587866756

score 472.26
score 470.74

actor loss 0.011132758581638336

critic loss 20.823268625993656

score 469.28
score 467.92
score 464.86

actor loss -0.0007779562860727309

critic loss 16.655273049713646

score 462.46
score 462.02

actor loss -0.0023474279284477232

critic loss 14.687170351459457

score 457.8
score 454.64
score 454.64

actor loss 0.009778389430046082

critic loss 29.72555567519553

score 453.4
score 

critic loss 44.30035414081216

score 489.66
score 489.66

actor loss 0.00031219955682754516

critic loss 42.607973690355195

score 489.66
score 489.66

actor loss 0.007734485340118409

critic loss 44.89617181409597

score 489.66
score 489.66

actor loss -0.00038451672792434694

critic loss 43.9638845825702

score 489.66
score 487.92

actor loss 0.0012775285124778748

critic loss 23.38767873652726

score 487.92
score 487.92

actor loss -0.0012395554900169372

critic loss 41.977585213345286

score 487.92
score 487.92
score 484.92

actor loss -0.0004888226747512818

critic loss 45.753059479268266

score 481.96
score 480.4

actor loss -0.003416091980785131

critic loss 3.21324535650909

score 480.4
score 478.36
score 477.08

actor loss -0.007944401513040066

critic loss 12.371917435444892

score 476.44
score 475.28

actor loss -0.003237883742817212

critic loss 4.133812319621443

score 475.28
score 475.28

actor loss -0.003126561951637268

critic loss 46.54083060336113

score 475.28
score 

actor loss 0.0018763178348541261

critic loss 32.997527432930475

score 500.0
score 500.0

actor loss -0.0015457352093420922

critic loss 32.270071394383905

score 500.0
score 500.0

actor loss 0.0012465720996260642

critic loss 33.98971447075307

score 500.0
score 500.0

actor loss 8.99845004081726e-05

critic loss 31.746490862584114

score 500.0
score 500.0

actor loss 0.0012073047839105129

critic loss 28.0056975220263

score 500.0
score 500.0

actor loss 0.0003965075120329857

critic loss 27.822469125607608

score 500.0
score 500.0

actor loss -0.0002034157839603722

critic loss 35.11894147487878

score 500.0
score 500.0

actor loss 0.002000622418522835

critic loss 27.51477688333988

score 500.0
score 500.0

actor loss -0.0023315294936299322

critic loss 32.64209239381925

score 500.0
score 500.0

actor loss -0.0011416076123714448

critic loss 31.987864195616538

score 500.0
score 500.0

actor loss -0.001057053571939468

critic loss 37.44932369872164

score 500.0
score 496.84
scor

critic loss 31.389504315483567

score 487.04
score 487.04

actor loss -0.004236281257867814

critic loss 38.531180418586736

score 487.04
score 487.04

actor loss -0.005891335570812225

critic loss 29.537959764301775

score 487.04
score 487.04

actor loss -0.0033569288820028305

critic loss 33.93284988987447

score 487.04
score 487.04

actor loss -0.006021698969602585

critic loss 33.2714721317172

score 487.04
score 487.04

actor loss -0.0032908140182495117

critic loss 31.30505076377392

score 487.04
score 487.04

actor loss -0.0035141389578580854

critic loss 16.531059715360406

score 487.04
score 487.04

actor loss -0.0035687746763229367

critic loss 28.977875374650957

score 487.04
score 487.04

actor loss -0.005806668245792389

critic loss 24.478018688520788

score 487.04
score 487.04

actor loss -0.003822054660320283

critic loss 25.853148387363554

score 487.04
score 487.04

actor loss -0.003898083299398423

critic loss 31.01038535917997

score 487.04
score 487.04

actor loss -

score 490.34

actor loss -0.005294306102395058

critic loss 29.803498354002834

score 490.34
score 490.34

actor loss -0.002547740215808153

critic loss 30.034518445658684

score 490.34
score 490.34

actor loss -0.004890017667040229

critic loss 29.932229612141846

score 490.34
score 490.34

actor loss 0.0028701790302060543

critic loss 39.2057537535727

score 490.34
score 491.58

actor loss -0.00446273504793644

critic loss 31.1994138977617

score 491.58
score 491.58

actor loss -0.003724671772681176

critic loss 35.20335066544414

score 495.88
score 495.88

actor loss -6.061542034149423e-06

critic loss 31.929843975934382

score 495.88
score 495.88

actor loss -0.004576867467164993

critic loss 32.80626356847286

score 495.88
score 495.88

actor loss -0.004261035639047622

critic loss 34.456614188337326

score 495.88
score 495.88

actor loss -0.004717298150062561

critic loss 33.33289775836467

score 496.72
score 496.72

actor loss -0.0041705093562603

critic loss 34.44372709329725



score 430.4

actor loss -0.004885690462589264

critic loss 33.64497219681739

score 430.4
score 437.12

actor loss -0.0052989474490284915

critic loss 33.191788422536845

score 444.34
score 450.96

actor loss -0.004226495432108641

critic loss 33.42047869644165

score 454.9
score 454.9

actor loss -0.0062407767653465274

critic loss 32.74599676953554

score 459.9
score 464.66

actor loss -0.004432849053293467

critic loss 32.59854522899687

score 466.4
score 474.6

actor loss -0.0064065239503979686

critic loss 31.840080029669405

score 479.42
score 485.16

actor loss -0.007429737836122513

critic loss 32.48627915315628

score 490.08
score 490.08

actor loss -0.000940740031003952

critic loss 33.97209825580121

score 493.84
score 500.0

actor loss -0.0057703681290149685

critic loss 31.594253184294693

score 498.62
score 498.62

actor loss -0.005786589312553407

critic loss 29.95543652479649

score 498.62
score 498.62

actor loss -0.0030931200847029686

critic loss 31.954243804782628



score 409.58

actor loss -0.004234762543439865

critic loss 30.126484015239775

score 409.58
score 409.58

actor loss -0.0035214407920837404

critic loss 27.973248127481337

score 409.58
score 409.58

actor loss -0.0005523397862911225

critic loss 34.16791343049108

score 409.58
score 409.58

actor loss -0.0034782125234603884

critic loss 37.891701155123116

score 409.58
score 409.58

actor loss -0.001538649719953537

critic loss 29.18264904997349

score 409.58
score 409.58

actor loss -0.0013327062487602233

critic loss 35.95553388122842

score 409.58
score 410.58

actor loss -0.003682867670059204

critic loss 39.3663859219253

score 410.84
score 411.74

actor loss -0.0023324801206588744

critic loss 39.88668222894669

score 412.54
score 415.92

actor loss -0.0033457247912883755

critic loss 38.02879928724468

score 418.04
score 418.2

actor loss -0.0040743592381477355

critic loss 37.91555690331757

score 419.02
score 419.02

actor loss -0.004867330896854401

critic loss 39.313476988

score 488.04
score 488.04

actor loss -0.002863245487213135

critic loss 42.43525474222302

score 488.04
score 488.04

actor loss 0.0005996103584766388

critic loss 43.51116233167201

score 492.14
score 492.14

actor loss -0.0003304288387298584

critic loss 42.4730404865861

score 489.72
score 489.72

actor loss -0.002670064625144005

critic loss 40.91197865186929

score 489.72
score 489.72

actor loss -0.0008711101293563842

critic loss 39.45947876351178

score 489.72
score 489.72

actor loss -0.005964173278212547

critic loss 39.936525005885954

score 489.72
score 489.72

actor loss -0.0013170778393745421

critic loss 38.89542532868087

score 489.72
score 489.72

actor loss -0.004667638391256333

critic loss 38.23131357180476

score 489.72
score 489.72

actor loss -0.0008603120803833006

critic loss 38.73811497449279

score 489.72
score 489.72

actor loss 0.0005407588481903076

critic loss 41.65487412951812

score 489.72
score 489.72

actor loss -0.0029040321588516237

critic loss 42

critic loss 39.61840799593031

score 477.76
score 477.76

actor loss -0.0005342073500156404

critic loss 34.63398009073436

score 477.76
score 477.76

actor loss -0.0017801822535693645

critic loss 38.16212772010714

score 477.76
score 477.76

actor loss -0.002729583501815796

critic loss 41.614789361649756

score 477.76
score 482.46

actor loss -0.0027055103957653046

critic loss 38.161631137922406

score 482.46
score 482.46

actor loss -0.0008103303626179696

critic loss 38.9004875942234

score 482.46
score 485.5

actor loss -0.0032626559972763064

critic loss 40.2338335999161

score 485.5
score 485.5

actor loss -0.003325767385959625

critic loss 42.355615450374785

score 485.5
score 485.5

actor loss -0.0041288220167160035

critic loss 38.127339216652516

score 489.44
score 489.44

actor loss 0.0018889917373657225

critic loss 44.521634164069965

score 489.44
score 489.44

actor loss -0.0025197385430336

critic loss 40.3193525443621

score 489.44
score 489.44

actor loss 0.00784932

score 428.26
score 428.26

actor loss -0.0009753090351819992

critic loss 38.14914794718028

score 421.88
score 421.88

actor loss -0.0025756579995155336

critic loss 36.32159608368874

score 421.88
score 421.88

actor loss -0.003229953002929687

critic loss 39.84419096671343

score 421.88
score 421.88

actor loss -0.004786599779129029

critic loss 41.61159819133282

score 421.88
score 421.88
score 418.3

actor loss -0.003004438257217407

critic loss 56.26507530493736

score 418.3
score 418.3

actor loss -0.003801248207688332

critic loss 39.299663492792845

score 421.14
score 421.14

actor loss -0.0030888302981853487

critic loss 39.525669438928375

score 421.14
score 421.14

actor loss -0.0034573997378349306

critic loss 45.659659247535465

score 421.14
score 421.14

actor loss -0.003082993066310882

critic loss 43.49577416968346

score 420.68
score 420.68

actor loss -0.0009938111662864686

critic loss 38.10998147528768

score 426.46
score 430.92

actor loss -0.0035171272516250607



critic loss 28.401732205865535

score 484.26
score 483.7
score 474.72

actor loss -0.001249803525209427

critic loss 62.01019732190372

score 470.86
score 470.86

actor loss -0.002322814607620239

critic loss 41.147763818275926

score 470.86
score 463.36
score 458.18
score 457.18

actor loss -0.004705515480041503

critic loss 80.58611216448843

score 457.18
score 457.18
score 450.12

actor loss -1.3063076138496426e-05

critic loss 58.677998728635906

score 445.08
score 445.08

actor loss -0.0033118030309677122

critic loss 40.350855697575206

score 445.08
score 440.92
score 439.52

actor loss -0.006263927364349366

critic loss 45.264664121589064

score 441.76
score 441.08
score 432.76

actor loss -0.003265673100948334

critic loss 49.5236558732152

score 434.5
score 434.5

actor loss -0.004990978395938874

critic loss 44.019703684964774

score 434.5
score 434.5

actor loss 0.0015159222960472105

critic loss 28.585342611062526

score 434.5
score 434.5

actor loss 0.0029873786807060243



score 496.66

actor loss -0.0022959448456764224

critic loss 38.53362267030477

score 496.66
score 496.66

actor loss -0.0034308012306690215

critic loss 39.76110239826441

score 496.66
score 496.66

actor loss -0.003370905525237322

critic loss 39.672702991305286

score 496.66
score 496.66

actor loss -0.00321846774071455

critic loss 38.94950663996264

score 496.66
score 496.66

actor loss -0.007948155084252357

critic loss 39.78360596117973

score 496.66
score 496.66

actor loss -0.007942548429965973

critic loss 45.393187987786526

score 496.66
score 496.66
score 488.46

actor loss -0.004555722707509995

critic loss 58.442159342774005

score 486.9
score 483.12
score 479.7

actor loss -0.005397745156288147

critic loss 45.12482888842486

score 479.7
score 479.7

actor loss -0.00470142188668251

critic loss 41.09335449704155

score 477.1
score 477.1

actor loss -0.0019609615087509157

critic loss 39.61906661486923

score 477.1
score 477.1

actor loss -0.0021342408537864685

critic lo

critic loss 41.11655993489623

score 480.28
score 480.28

actor loss -0.0019879327893257146

critic loss 41.54893407102675

score 480.28
score 475.04

actor loss -0.00025746520161628727

critic loss 38.65909634299278

score 476.76
score 476.76

actor loss -0.003948489320278169

critic loss 45.766707945500315

score 476.76
score 476.76

actor loss 0.001122805380821228

critic loss 43.7979592586562

score 476.76
score 479.14

actor loss -0.002261807060241699

critic loss 42.54811117176115

score 479.14
score 478.1
score 473.1

actor loss -0.0023993911385536194

critic loss 55.44454020154923

score 472.22
score 472.22
score 467.54

actor loss -0.0029719357013702394

critic loss 58.72997367512286

score 469.98
score 469.98

actor loss -0.002229914343357086

critic loss 43.396043133455514

score 468.88
score 468.88

actor loss 0.0013130741357803347

critic loss 39.962775800518685

score 468.88
score 468.88

actor loss -0.0004310261607170105

critic loss 43.20655846491428

score 468.88
score

score 458.66

actor loss -0.002200601625442505

critic loss 43.87409631890505

score 458.66
score 458.66

actor loss 0.0005129897713661196

critic loss 41.472938430532814

score 458.66
score 458.66

actor loss -0.002168767464160919

critic loss 45.64070968408585

score 462.4
score 462.4

actor loss -0.0007428478240966796

critic loss 45.046909052453934

score 466.02
score 466.02

actor loss 0.0014212633848190309

critic loss 44.52594870724082

score 470.88
score 475.52

actor loss 0.0019479441642761234

critic loss 42.18877200964688

score 479.34
score 483.18

actor loss -0.0010397358655929564

critic loss 44.442289035972955

score 486.26
score 486.26

actor loss 0.010784891283512114

critic loss 42.64938405380546

score 486.26
score 486.26

actor loss 0.00258647564649582

critic loss 43.23598534207046

score 487.96
score 487.96

actor loss -0.0032772753596305845

critic loss 41.927705960361656

score 487.96
score 490.24

actor loss -0.002030401480197906

critic loss 39.41010577918739


critic loss 1.092521987547353

score 456.08
score 457.7

actor loss -0.003069225025177002

critic loss 3.8818917466595773

score 457.7
score 459.72

actor loss 0.0007289807736873627

critic loss 12.087897751276195

score 459.72
score 459.14

actor loss -0.00505318835452199

critic loss 15.731408037880808

score 459.14
score 460.22

actor loss -0.0025314247369766234

critic loss 40.342640640053524

score 463.92
score 464.28

actor loss -0.0027391733472235504

critic loss 17.20712204561159

score 463.16
score 463.58

actor loss -0.007113008585572243

critic loss 16.316309445820004

score 463.58
score 465.34

actor loss 0.00477292063832283

critic loss 43.548587222725146

score 467.86
score 467.86
score 464.48

actor loss -0.003990750586986542

critic loss 55.80156184045821

score 461.28
score 457.32
score 452.6
score 447.56

actor loss 0.006221907663159072

critic loss 41.07067098586559

score 442.98
score 441.44
score 441.48

actor loss 0.0015806970179080963

critic loss 47.706106732552

score 494.68

actor loss -0.0013142924070358275

critic loss 34.69289187199772

score 496.98
score 498.74

actor loss -0.0010117697894573212

critic loss 34.46306800910681

score 499.52
score 499.52

actor loss -0.0006162091791629791

critic loss 33.77491391381621

score 499.52
score 499.52

actor loss -0.0009308810353279113

critic loss 34.9426893786233

score 499.52
score 499.52

actor loss -0.003827932953834534

critic loss 33.8235017091319

score 499.52
score 499.52

actor loss -0.0012369217693805694

critic loss 34.54946290660538

score 499.52
score 499.52

actor loss -0.005724332827329636

critic loss 35.016117551682896

score 499.52
score 499.52

actor loss -0.001700742816925049

critic loss 33.562010676416016

score 499.52
score 499.52

actor loss -0.0014777442455291747

critic loss 33.50136870114841

score 499.52
score 499.52

actor loss -0.0006692167758941649

critic loss 32.57279713976682

score 499.52
score 499.52

actor loss 0.0005065930485725403

critic loss 32.2323351506

critic loss 34.66697744672969

score 417.9
score 420.84

actor loss -0.0016501362442970274

critic loss 26.82621653722972

score 421.08
score 422.58

actor loss -0.0038065806746482847

critic loss 25.209989482320843

score 424.82
score 423.2
score 426.04

actor loss -0.0029516922712326055

critic loss 41.923348991164566

score 428.0
score 430.24

actor loss -0.0031869896531105044

critic loss 30.26403402422061

score 430.96
score 432.74

actor loss -0.0039241957426071165

critic loss 45.379681385894116

score 433.14
score 435.78

actor loss -0.002436513638496399

critic loss 35.14428797304332

score 437.82
score 441.54

actor loss -0.001956421446800232

critic loss 30.84857571953945

score 442.42
score 444.32

actor loss -0.003631573033332825

critic loss 34.61391373286341

score 447.42
score 450.16

actor loss -0.002095486783981323

critic loss 33.636206621147686

score 452.06
score 456.08

actor loss -0.004240752547979355

critic loss 30.94466582199335

score 457.96
score 457.72

act

actor loss -0.0009950839817523959

critic loss 18.51018042852548

score 476.46
score 472.84
score 470.08

actor loss -0.005622146797180176

critic loss 37.011231374587865

score 470.08
score 469.46

actor loss -0.005366319417953491

critic loss 19.73640315934736

score 468.32
score 464.98

actor loss 0.008442897325754166

critic loss 11.020475852891057

score 462.0
score 462.88
score 459.72

actor loss -0.0037336565136909484

critic loss 26.536655902472138

score 461.02
score 460.3

actor loss 0.005005077719688415

critic loss 8.853670086978376

score 460.3
score 460.3

actor loss 0.00403228381872177

critic loss 23.60729540667087

score 460.3
score 460.84

actor loss -0.0034857306361198424

critic loss 32.354919863336534

score 460.84
score 457.42

actor loss -0.003777642595767975

critic loss 24.051574498723447

score 457.42
score 455.94
score 455.94

actor loss 0.003931037521362304

critic loss 40.87212354861274

score 454.22
score 455.42

actor loss -0.0031304461002349855

critic l

score 489.28
score 489.28

actor loss -0.003715732169151306

critic loss 31.024774144675394

score 489.28
score 489.28

actor loss -0.0048485417723655696

critic loss 30.410935256976636

score 489.28
score 487.38

actor loss -0.004962538242340088

critic loss 26.347335058209303

score 487.94
score 485.74

actor loss -0.003309093070030212

critic loss 26.312714832641184

score 484.74
score 482.36

actor loss -0.003631617951393127

critic loss 22.55046357397139

score 482.36
score 482.36

actor loss -0.003924122357368469

critic loss 29.329533874324703

score 482.36
score 482.36
score 480.36

actor loss -0.003175077509880066

critic loss 40.07948832996189

score 482.46
score 482.46

actor loss -0.002017189672589302

critic loss 30.221097058662775

score 483.86
score 483.86

actor loss 0.0029387233614921572

critic loss 29.277558552018736

score 483.82
score 484.62

actor loss -0.0009891055941581726

critic loss 20.206234397302193

score 484.62
score 484.62

actor loss -0.0001354653835296

score 482.82
score 482.82

actor loss -0.0004371922433376313

critic loss 35.24863357591629

score 485.56
score 486.32

actor loss -0.0029250383237376812

critic loss 13.461543775622545

score 486.92
score 486.94

actor loss -0.0051006880402565

critic loss 27.6328219836548

score 487.38
score 488.38

actor loss 0.0005583559989929198

critic loss 21.490062159926072

score 488.38
score 488.38

actor loss -0.003602517464756966

critic loss 22.175367844058577

score 488.38
score 486.72

actor loss -0.004735893446207047

critic loss 32.49535366524011

score 486.72
score 486.72

actor loss -0.002243415975570679

critic loss 31.5995364966102

score 486.34
score 485.6

actor loss -0.006204921805858612

critic loss 25.27630832968168

score 485.6
score 485.6

actor loss -0.0024693318128585816

critic loss 32.10700597038492

score 485.6
score 485.6

actor loss -0.002483660793304443

critic loss 35.24054251058847

score 485.6
score 485.6

actor loss -0.0027452898502349854

critic loss 34.85046737

score 492.18

actor loss -0.0031864609327167275

critic loss 19.809545098825545

score 492.18
score 492.18

actor loss -0.0035004152536392214

critic loss 17.473229580424725

score 492.18
score 492.18

actor loss -0.005961431492865086

critic loss 17.04299413597733

score 492.18
score 492.18

actor loss -0.0034634508490562444

critic loss 14.722053756264646

score 492.18
score 492.18

actor loss -0.00726799508035183

critic loss 12.253704311141371

score 492.18
score 492.18

actor loss -0.003963580429553986

critic loss 27.070526370206473

score 489.54
score 489.54

actor loss -0.003985032331943512

critic loss 31.49942122650445

score 486.6
score 486.6

actor loss -0.002968973582983017

critic loss 23.496379609675706

score 488.12
score 488.12

actor loss -0.0041568296194076535

critic loss 19.091656152332575

score 488.12
score 488.12

actor loss -0.003770601141452789

critic loss 28.989638103170694

score 487.82
score 487.82

actor loss -0.0025687299966812138

critic loss 17.1839463

score 472.96
score 472.96

actor loss -0.0011432849317556247

critic loss 22.175337863574505

score 472.96
score 472.96

actor loss -0.0008206054262816906

critic loss 2.700227621070296

score 472.96
score 472.96

actor loss -0.004554430435597897

critic loss 11.14833595161289

score 472.96
score 472.96

actor loss -0.0028918599367141725

critic loss 13.4150973051887

score 472.96
score 472.96

actor loss -0.0009474180966615676

critic loss 9.360418487704731

score 474.68
score 474.68

actor loss -0.0030180655776872295

critic loss 22.4206086749997

score 474.68
score 476.64

actor loss -0.0045326745986938475

critic loss 26.895486553712185

score 480.36
score 480.36

actor loss -0.003070679140090942

critic loss 21.841845079570636

score 480.36
score 480.36

actor loss 0.0029777817010879512

critic loss 41.7452099104926

score 480.36
score 480.36

actor loss 0.0007325389146804811

critic loss 39.87217256016135

score 480.36
score 480.36

actor loss 0.0014755245804786681

critic loss 4

score 488.14

actor loss 0.0006880613327026367

critic loss 26.995965952575023

score 488.14
score 488.14

actor loss 0.0014802585840225219

critic loss 35.11453589615971

score 488.14
score 486.12

actor loss 0.0031493965864181515

critic loss 25.209099029183573

score 481.08
score 481.08

actor loss -0.0015888969063758852

critic loss 32.032131994281336

score 479.98
score 479.98

actor loss -0.0042814084172248836

critic loss 20.26308655493036

score 479.78
score 476.72
score 476.72

actor loss -0.0025620122373104103

critic loss 20.328337593775615

score 472.46
score 472.46

actor loss -0.0060468031525611875

critic loss 23.33298480568491

score 472.46
score 473.8

actor loss 0.0002578045725822449

critic loss 31.714265851926058

score 471.6
score 471.6

actor loss -0.005733970582485199

critic loss 20.24696472528502

score 471.6
score 471.6

actor loss -0.005000606620311737

critic loss 39.84728149653077

score 471.6
score 471.6

actor loss -0.0007070532321929932

critic loss 44.7


actor loss -0.00389050806760788

critic loss 33.01349415791258

score 433.8
score 433.8

actor loss -0.006378820610046387

critic loss 35.05746676081121

score 438.4
score 438.4

actor loss -0.003656658887863159

critic loss 35.363000942984215

score 438.4
score 438.4

actor loss -0.003023226475715637

critic loss 33.85069672451467

score 440.04
score 442.88

actor loss -0.0024267244756221774

critic loss 36.88761837126612

score 448.3
score 446.2
score 444.96

actor loss -0.004237946572899818

critic loss 42.218437963894004

score 444.96
score 447.8

actor loss -0.005604681634902954

critic loss 36.01825417643115

score 447.92
score 445.36

actor loss 0.0005535688400268553

critic loss 35.234840054048604

score 445.36
score 450.24

actor loss -0.003598298877477646

critic loss 33.34806552035212

score 453.24
score 453.24

actor loss -0.002684383526444435

critic loss 37.45614324288387

score 453.24
score 453.24

actor loss -0.005645991885662079

critic loss 30.161416683948413

score 


actor loss -0.0017628805041313173

critic loss 15.937327569421381

score 494.52
score 494.52

actor loss -0.002624040989432251

critic loss 23.148289753475783

score 494.52
score 494.52

actor loss -0.002686288229050115

critic loss 19.559532552194597

score 494.52
score 494.52

actor loss -0.002663346719369292

critic loss 21.725638292440024

score 494.52
score 494.52

actor loss -0.0019023478826507925

critic loss 15.531375244032592

score 494.52
score 494.52

actor loss -0.00015848552435636528

critic loss 20.012553695985677

score 494.52
score 494.52

actor loss -0.0033225317582488063

critic loss 20.343329881684486

score 494.52
score 494.52

actor loss -0.0015837192416191103

critic loss 19.575806981523336

score 494.52
score 498.68

actor loss -0.005641933554410935

critic loss 20.490477193713932

score 498.68
score 498.68

actor loss -0.0014370811104774475

critic loss 20.064866375756264

score 498.68
score 498.86

actor loss -0.004921867618709802

critic loss 21.9862505145713

critic loss 21.92512451489568

score 447.74
score 447.74

actor loss -0.004371383571624756

critic loss 25.158424290379884

score 447.74
score 447.74

actor loss -0.003954701726976782

critic loss 21.612335278451443

score 455.16
score 454.66

actor loss -0.007246704351902009

critic loss 24.80412469294071

score 454.66
score 462.62

actor loss -0.00451079823449254

critic loss 20.418351506179572

score 471.18
score 471.18

actor loss -0.004118640202283859

critic loss 23.668105937188862

score 471.18
score 470.04
score 469.58

actor loss -0.00489850460588932

critic loss 28.063882369720936

score 469.58
score 476.86

actor loss -0.00451256445646286

critic loss 25.98993812765777

score 476.86
score 477.18

actor loss -0.002450181403756142

critic loss 27.447626080036162

score 484.42
score 484.42

actor loss -0.0034493512123823173

critic loss 23.10932325352132

score 490.36
score 490.36

actor loss -0.004212540757656097

critic loss 28.43514428189993

score 490.36
score 490.36

actor


actor loss -0.0039855585932731625

critic loss 36.0737777107358

score 490.72
score 490.72

actor loss -0.0006930541038513184

critic loss 33.703843820858005

score 490.72
score 490.72

actor loss -0.0008516416430473326

critic loss 34.88545137878061

score 490.72
score 490.72

actor loss -0.0023306042075157164

critic loss 26.85922155587673

score 490.72
score 490.72

actor loss -0.002594143497943878

critic loss 27.092455156208576

score 492.26
score 492.12

actor loss -0.004397275590896607

critic loss 21.630075477238

score 491.4
score 491.4

actor loss -0.002588889238238335

critic loss 25.898199306886646

score 491.4
score 491.4

actor loss -0.0031487457334995273

critic loss 29.22192620649189

score 491.4
score 491.4

actor loss -0.0010102562308311463

critic loss 26.01645520177782

score 491.4
score 491.3
score 489.46

actor loss -0.0033426633358001707

critic loss 30.095527240069952

score 489.46
score 489.46

actor loss -0.003128717242181301

critic loss 35.535187142408084



score 484.44

actor loss 0.00012359226346015948

critic loss 26.868043942208583

score 484.44
score 483.28

actor loss -0.0002446771204471589

critic loss 31.188593148426712

score 483.28
score 483.28

actor loss 0.001064309448003769

critic loss 39.0045034408547

score 483.28
score 482.76

actor loss -0.0012207658767700194

critic loss 33.839095493118464

score 482.76
score 482.76

actor loss 0.003564141058921813

critic loss 33.99114759887159

score 481.78
score 481.78

actor loss 0.002130974090099335

critic loss 22.074399646259845

score 481.78
score 481.76

actor loss 0.0009062974810600279

critic loss 24.917824101802708

score 481.76
score 481.76

actor loss -0.002888789115101099

critic loss 29.389474774152042

score 480.92
score 479.12
score 478.06

actor loss -0.0015170273184776306

critic loss 26.61032310949303

score 478.06
score 480.12

actor loss -0.003493410873413086

critic loss 30.331382630622386

score 480.12
score 480.12

actor loss -0.0024820600986480714

critic loss

actor loss -0.003320883917808533

critic loss 7.066433054295554

score 483.52
score 480.52

actor loss -0.004668897223472595

critic loss 8.167744113683515

score 480.52
score 480.52

actor loss -0.0024899185828864577

critic loss 7.962855274240672

score 480.52
score 480.52

actor loss 0.0002933161318302155

critic loss 25.206690292849764

score 480.16
score 480.16

actor loss -0.001343023270368576

critic loss 2.78869587308988

score 478.3
score 478.24

actor loss -0.004661747431755066

critic loss 5.403240037836507

score 478.22
score 477.44

actor loss -0.005506946033239365

critic loss 5.204336736471205

score 477.44
score 477.44

actor loss -0.005382176530361176

critic loss 7.791361620626598

score 477.44
score 474.12
score 471.9

actor loss -0.003947670710086822

critic loss 23.35506216389537

score 471.9
score 471.9

actor loss -0.003248342323303223

critic loss 14.47636158023216

score 471.9
score 471.9

actor loss -0.006713943290710449

critic loss 22.767705641311778

score 

critic loss 25.1138189142175

score 485.16
score 485.16

actor loss -0.0015452000021934508

critic loss 37.02931575501263

score 485.16
score 482.36

actor loss -0.0011951577842235566

critic loss 23.50156833052337

score 482.36
score 482.36

actor loss -0.001897891807556152

critic loss 37.75355330883637

score 482.36
score 482.36

actor loss 5.7818287611007704e-05

critic loss 23.570933001582326

score 482.36
score 482.36

actor loss -0.0015102888569235803

critic loss 11.210980332155527

score 482.36
score 482.36

actor loss 0.0002199613213539123

critic loss 43.036411294184624

score 482.74
score 482.74

actor loss 0.0028616188287734984

critic loss 37.358580407830324

score 482.74
score 486.4

actor loss 0.002435239219665527

critic loss 23.6191486171633

score 487.5
score 489.44

actor loss -0.0012138565301895142

critic loss 9.956731476663798

score 489.44
score 489.44

actor loss -0.0007608462393283844

critic loss 22.405082261045276

score 490.38
score 490.38

actor loss 0.002

score 440.52
score 441.22

actor loss -0.004221631827950477

critic loss 22.019887059369683

score 441.22
score 441.22

actor loss -0.004134710371494293

critic loss 25.871238683047892

score 441.22
score 441.22

actor loss -0.000773321497440338

critic loss 28.553790326364332

score 441.22
score 441.22

actor loss -0.0008071445941925049

critic loss 36.382760668759786

score 441.22
score 441.22

actor loss -0.003485830402374268

critic loss 29.460423403207955

score 441.22
score 441.22

actor loss -0.003093350765109062

critic loss 30.05838682500422

score 441.22
score 441.22

actor loss -0.0014202193349599841

critic loss 33.502293520507216

score 448.92
score 455.6

actor loss -0.0011245633840560913

critic loss 31.479373204752807

score 456.82
score 456.82

actor loss -0.0023351036190986637

critic loss 30.250618595159057

score 456.82
score 459.8

actor loss -0.0025704521894454957

critic loss 30.393923198902606

score 459.8
score 462.94

actor loss -0.002264833064377308

critic l

score 386.9
score 386.9

actor loss -0.00047839535176753996

critic loss 35.6286150621891

score 386.9
score 386.9

actor loss -0.0045580774143338205

critic loss 35.348570187163354

score 386.9
score 386.9

actor loss -0.0004660113632678985

critic loss 40.784767965960505

score 386.9
score 386.9

actor loss 0.0008038594961166382

critic loss 32.183500640222434

score 386.9
score 386.9

actor loss -0.001374033695459366

critic loss 36.949214769274

score 385.82
score 387.96
score 387.9

actor loss 0.004722031259536743

critic loss 38.030148226642616

score 391.0
score 393.98

actor loss 0.005528090670704842

critic loss 30.094216458314655

score 397.42
score 405.52

actor loss 0.0012814741760492324

critic loss 41.930747897225615

score 407.88
score 415.58

actor loss -0.0017555035471916198

critic loss 36.90586134030819

score 422.44
score 424.84

actor loss -0.0008416871309280397

critic loss 36.94010729255676

score 433.12
score 441.06

actor loss -0.0014192827373743057

critic los

score 472.66
score 472.66

actor loss -0.0022922948956489563

critic loss 55.886851627580825

score 472.66
score 472.66

actor loss -0.0034413225501775746

critic loss 37.879612315677846

score 472.66
score 469.74

actor loss -0.0040130704760551455

critic loss 39.00969211153985

score 469.74
score 469.74

actor loss -0.0028915260791778563

critic loss 43.02844897915124

score 469.74
score 469.74

actor loss -0.001677837145328522

critic loss 40.86052609848827

score 469.08
score 469.08
score 464.66

actor loss -0.0046375197172164925

critic loss 52.695614168059834

score 464.66
score 464.66

actor loss -0.0019177336633205415

critic loss 40.30799456005693

score 464.66
score 464.66

actor loss -0.0012700253129005433

critic loss 39.92142340002433

score 464.66
score 464.66

actor loss -0.002589234882593155

critic loss 42.01107118245066

score 464.66
score 459.7

actor loss -0.0005270694881677627

critic loss 40.69750267100036

score 459.7
score 459.7

actor loss -0.000692555713653564

score 484.96
score 484.08

actor loss 0.0026092070102691645

critic loss 44.09166034922675

score 484.08
score 484.08

actor loss 0.013860909128189085

critic loss 40.74202607977539

score 481.96
score 483.5
score 480.06

actor loss -0.00030418209135532376

critic loss 64.44268832934797

score 476.82
score 472.22
score 468.62

actor loss 0.000250000011920929

critic loss 56.860313943830135

score 464.0
score 461.2
score 457.38

actor loss -0.0005325267195701599

critic loss 55.16456248248816

score 453.3
score 449.3
score 448.7

actor loss -8.065292835235595e-05

critic loss 55.46366179575771

score 444.84
score 440.68
score 440.26

actor loss -4.989147186279298e-05

critic loss 53.338626554588224

score 434.6
score 428.08
score 424.46
score 420.56

actor loss 0.0014679531097412113

critic loss 73.06332624915838

score 417.3
score 414.12
score 410.3

actor loss -0.0037771290302276604

critic loss 52.24627369111404

score 405.96
score 402.12
score 398.44

actor loss -0.00284346226453781

critic loss 12.150558467870951

score 481.9
score 481.9

actor loss 0.01982669443488121

critic loss 12.8857382881552

score 476.2
score 470.32
score 470.32

actor loss 0.003923224548622966

critic loss 24.478738112190364

score 470.32
score 470.32

actor loss 0.021880827450752257

critic loss 13.361974860575796

score 470.32
score 469.08

actor loss 0.01778064329624176

critic loss 7.730475267779826

score 468.68
score 465.88
score 459.42
score 454.84

actor loss 0.01946212862730026

critic loss 5.1347520150780674

score 450.82
score 444.44
score 437.88
score 432.74

actor loss 0.0015870026171207429

critic loss 4.184067021465301

score 425.68
score 422.58
score 417.76
score 412.26

actor loss 0.0007108245670795442

critic loss 3.259558057948947

score 408.8
score 403.54
score 399.58

actor loss 0.012875588369369506

critic loss 0.8771189509637655

score 395.9
score 390.52
score 385.46
score 383.14

actor loss 0.01731093973144889

critic loss 1.5695805805414913

score 381.48
score 381

score 334.8

actor loss 0.0014888299465179442

critic loss 10.003066374567151

score 338.3
score 341.88

actor loss 0.004528905673418193

critic loss 9.32098937585354

score 345.4
score 349.9

actor loss 0.002353140741959214

critic loss 8.300078028547764

score 354.22
score 358.54

actor loss 0.0017393132448196408

critic loss 10.000532776679098

score 362.56
score 365.56

actor loss 0.002363408315181732

critic loss 10.927337845613064

score 368.92
score 373.8

actor loss 0.002262704050540924

critic loss 17.62735381180793

score 378.04
score 381.88

actor loss 0.0001724137343466281

critic loss 15.21647298642248

score 385.0
score 388.46

actor loss 0.000760043179988861

critic loss 18.657961905200782

score 391.86
score 395.38

actor loss 0.0009011699438095093

critic loss 20.483803695496913

score 398.96
score 402.16

actor loss 0.0006426054477691649

critic loss 18.752785399854183

score 406.08
score 410.16

actor loss 0.009153662705421449

critic loss 16.196726959711317

score 4


actor loss 0.004326067399978637

critic loss 0.18887769522033632

score 463.92
score 462.76

actor loss 0.0026363467454910278

critic loss 0.2706735446594655

score 460.76
score 459.3
score 459.02

actor loss 0.0030540219509974124

critic loss 1.9354992020368578

score 458.22
score 457.6

actor loss 0.004572709390614182

critic loss 0.5620068561602384

score 456.68
score 455.78

actor loss 0.006755309799313545

critic loss 0.5676276204474269

score 454.98
score 453.38

actor loss 0.02108170828567818

critic loss 0.41573008066862815

score 451.5
score 449.64
score 448.3

actor loss -0.00178929318189621

critic loss 0.6094029770120979

score 446.6
score 444.36

actor loss -0.0018542224735021591

critic loss 0.5759868503749371

score 442.02
score 440.6

actor loss 0.0036737200140953075

critic loss 0.1688082833468914

score 439.72
score 437.44
score 435.82

actor loss -0.0026829456984996795

critic loss 0.08858275716491046

score 435.7
score 435.44

actor loss 0.005516854186588898

criti

critic loss 17.976972481158377

score 487.12
score 487.12

actor loss -0.005127015680074691

critic loss 21.383314272453266

score 487.12
score 487.12

actor loss -0.0021528126120567317

critic loss 15.000107211200893

score 487.12
score 487.12

actor loss -0.003628954589366913

critic loss 22.913991051689347

score 487.12
score 487.12

actor loss 0.008624459362030028

critic loss 34.938279367334765

score 487.12
score 487.12

actor loss -0.0006710207462310791

critic loss 26.752408823285993

score 487.12
score 489.52

actor loss -0.007395188900828362

critic loss 32.07712152662948

score 490.78
score 492.12

actor loss -0.0027557032287120822

critic loss 39.62814997347929

score 492.12
score 492.12

actor loss -0.0028784061193466185

critic loss 26.944264983016257

score 492.12
score 492.5

actor loss 0.0017117379441857338

critic loss 13.472388394277544

score 494.2
score 494.52

actor loss -0.002104052019119263

critic loss 25.24366112055555

score 494.52
score 496.0

actor loss -0.

critic loss 35.86910278374701

score 500.0
score 500.0

actor loss -0.001565406060218811

critic loss 38.79076383199693

score 500.0
score 500.0

actor loss -0.0006592664241790771

critic loss 36.45763189128041

score 500.0
score 500.0

actor loss -0.004231661295890808

critic loss 23.462782824951407

score 500.0
score 500.0

actor loss -0.00026129351854324334

critic loss 37.369429198193544

score 500.0
score 500.0

actor loss -0.000371114057302475

critic loss 30.21521508206129

score 500.0
score 500.0

actor loss -0.0024697948202490804

critic loss 35.59623317098841

score 500.0
score 500.0

actor loss 0.00440630407333374

critic loss 23.26073683100939

score 500.0
score 500.0

actor loss 0.004374129629135132

critic loss 27.870390957483647

score 500.0
score 500.0

actor loss 0.0025840553402900696

critic loss 26.29827570819259

score 500.0
score 500.0

actor loss 0.0023108743906021115

critic loss 38.05053273607492

score 500.0
score 500.0

actor loss 0.00239630465079099

critic l


actor loss -0.0039928128421306604

critic loss 23.54896927828863

score 444.06
score 453.8

actor loss -0.004888961875438689

critic loss 39.61421872808934

score 453.8
score 453.8

actor loss -0.0015914812505245211

critic loss 40.168839906764035

score 453.8
score 458.66

actor loss 0.02140813391804695

critic loss 39.76117640830278

score 458.66
score 458.66

actor loss -0.00037436015605926513

critic loss 38.8251344553709

score 462.38
score 466.22

actor loss 0.002414119757560548

critic loss 33.69211813237668

score 466.22
score 475.78

actor loss 0.0015311837941408154

critic loss 29.064966550350185

score 480.0
score 482.32

actor loss 0.006674608955159783

critic loss 30.838519308638574

score 482.32
score 482.32

actor loss -0.0010252897918224333

critic loss 38.05665153474808

score 482.32
score 473.42
score 473.42

actor loss -0.0009148414164781571

critic loss 55.062252113223074

score 473.42
score 473.42

actor loss -0.0009875748336315156

critic loss 39.31898253464401



critic loss 20.25979000489712

score 367.36
score 374.82

actor loss 0.006138336437940599

critic loss 19.22824078035355

score 383.04
score 391.76

actor loss -0.0007564717270433903

critic loss 6.999974347400665

score 398.94
score 408.2

actor loss 0.008152737957239151

critic loss 4.84067121796012

score 416.72
score 418.28
score 427.46

actor loss -0.0018492228388786315

critic loss 40.24221441960335

score 434.0
score 440.86

actor loss 5.321848560124635e-05

critic loss 5.104608310222625

score 444.76
score 453.44

actor loss -0.00034764727503061295

critic loss 18.565978528160606

score 457.84
score 464.42

actor loss -0.00018272670209407808

critic loss 10.87861107978821

score 472.22
score 474.96

actor loss 0.0070179462981410316

critic loss 3.544849450649321

score 475.04
score 481.28

actor loss 0.00342501423060894

critic loss 18.921233550670742

score 481.28
score 481.28

actor loss 0.00033591758832335464

critic loss 16.304790610709787

score 481.28
score 481.28

actor 

score 495.46

actor loss -0.0018039761900901792

critic loss 41.71498121539354

score 495.46
score 495.46

actor loss -0.001596578735113144

critic loss 38.76840151533783

score 495.46
score 495.46

actor loss -0.0019065836846828461

critic loss 39.28803358534575

score 495.46
score 495.46

actor loss -0.0019368939965963363

critic loss 37.82078864924311

score 495.46
score 495.46

actor loss -0.002020047450065613

critic loss 33.78922585386037

score 495.46
score 495.46

actor loss -0.005875581585615873

critic loss 31.903393624527745

score 495.46
score 495.46

actor loss -0.0015277754426002504

critic loss 37.172072417765854

score 493.44
score 484.26
score 477.16
score 470.1
score 460.88
score 457.6
score 451.4
score 441.96

actor loss 0.00035242681503295896

critic loss 142.5398458459854

score 435.0
score 435.0
score 426.62
score 418.92
score 410.3

actor loss -0.0029942973256111144

critic loss 92.17293765707015

score 410.3
score 410.3

actor loss -0.0018700564086437225

critic


actor loss 0.00030031872242689125

critic loss 33.98093729227781

score 500.0
score 500.0

actor loss 0.008007947242259979

critic loss 35.029311310166115

score 500.0
score 500.0

actor loss -0.00011315441131591797

critic loss 32.89365652680397

score 500.0
score 500.0

actor loss -0.0011383233964443206

critic loss 33.4197972512424

score 500.0
score 500.0

actor loss 0.0018893880788236853

critic loss 34.24153888967335

score 500.0
score 500.0

actor loss -0.0006572304544039069

critic loss 33.1750108996272

score 500.0
score 500.0

actor loss 0.00035866029858589175

critic loss 32.59979473522305

score 500.0
score 500.0

actor loss 0.0006958356738090516

critic loss 33.31271326838136

score 500.0
score 500.0

actor loss -0.0011371000975370408

critic loss 33.72034315853715

score 500.0
score 500.0

actor loss 0.0003543764233589172

critic loss 31.96967911533117

score 500.0
score 500.0

actor loss 0.0001544227719306946

critic loss 33.484270798057324

score 500.0
score 500.0

act

critic loss 27.90723638781309

score 500.0
score 500.0

actor loss 0.0006395201802253723

critic loss 36.85106071946323

score 500.0
score 500.0

actor loss 0.0015807607457041743

critic loss 31.03187016470283

score 500.0
score 500.0

actor loss 0.006272837185859681

critic loss 16.085838192147015

score 500.0
score 500.0

actor loss 0.00015248592495918273

critic loss 16.37624663097858

score 500.0
score 500.0

actor loss 0.006209738955646754

critic loss 16.23967725660205

score 500.0
score 500.0

actor loss -0.0006749230118468404

critic loss 15.386751354908942

score 500.0
score 500.0

actor loss -0.0009626066267490387

critic loss 14.332575093403458

score 500.0
score 500.0

actor loss 0.00463703973442316

critic loss 15.299399263241886

score 500.0
score 496.42
score 492.98

actor loss 0.0008651524782180786

critic loss 59.61403221199363

score 492.98
score 492.98

actor loss -0.00017418079376220705

critic loss 20.558693414668735

score 492.98
score 492.98

actor loss 0.0034016

score 468.68

actor loss 0.0012479205798823386

critic loss 12.684115787005425

score 469.68
score 470.4

actor loss 0.0027181342136580492

critic loss 15.191343216905

score 471.82
score 474.86

actor loss 0.0262485149666667

critic loss 18.79424159913957

score 476.72
score 477.88

actor loss 0.011762527215480803

critic loss 12.463726107676326

score 478.66
score 481.24

actor loss -8.617162704467772e-05

critic loss 19.085375507724287

score 482.58
score 482.58

actor loss 0.0007241821318864823

critic loss 19.328954029351472

score 483.46
score 484.48

actor loss 0.0012791234493255616

critic loss 14.228517346286774

score 486.06
score 489.26
score 481.88

actor loss -0.0016523623615503312

critic loss 38.983785366308695

score 477.8
score 472.28
score 468.82
score 460.54
score 452.64
score 444.68

actor loss 0.12106251616477967

critic loss 113.53009676028492

score 444.68
score 444.68

actor loss 0.0008733553139958532

critic loss 13.763548216855526

score 444.68
score 444.68

a

score 476.84
score 471.66
score 465.2
score 458.72

actor loss -0.006855523049831391

critic loss 113.80638550736903

score 458.72
score 465.44

actor loss 0.0023131510682404045

critic loss 51.152548280844094

score 458.66
score 452.24
score 453.16
score 446.18
score 440.08
score 433.22

actor loss -0.010924043920636176

critic loss 108.34273181978763

score 426.66
score 419.86
score 414.62
score 407.72
score 401.2
score 394.7

actor loss -0.0015416268467903136

critic loss 90.06987667912841

score 388.28
score 381.98
score 377.0
score 370.52
score 364.68

actor loss -0.004560238718986512

critic loss 73.27162049435375

score 357.82
score 351.56
score 345.48
score 339.34
score 332.76
score 326.36

actor loss 0.009358364415168761

critic loss 77.54499936597645

score 320.22
score 313.5
score 307.34
score 301.58
score 295.34

actor loss -0.011368269699811934

critic loss 45.464566949748985

score 289.04
score 282.78
score 276.82
score 270.68
score 264.94

actor loss -0.00485768957138061

critic loss 17.07389224165529

score 500.0
score 500.0

actor loss 0.00011828008890151977

critic loss 25.12993199105486

score 500.0
score 500.0

actor loss 0.0023468172550201415

critic loss 26.07215422331951

score 500.0
score 500.0

actor loss -0.0005549184322357178

critic loss 16.441253945871814

score 500.0
score 500.0

actor loss 0.001927603244781494

critic loss 14.503254049904644

score 500.0
score 500.0

actor loss 0.003635729396343231

critic loss 15.620948509988187

score 500.0
score 500.0

actor loss 0.004700257223844527

critic loss 13.913034703449904

score 500.0
score 500.0

actor loss -0.0007030243873596192

critic loss 13.011917856243064

score 500.0
score 500.0

actor loss -0.0011803131192922591

critic loss 9.473427545374632

score 500.0
score 500.0

actor loss 0.0007758160829544067

critic loss 12.112998747068644

score 500.0
score 500.0

actor loss 0.00041316378712654117

critic loss 6.992092138814925

score 500.0
score 500.0

actor loss 0.000914030995965004

cri

critic loss 15.95318259601891

score 500.0
score 500.0

actor loss 0.012833075535297393

critic loss 12.521695695820451

score 500.0
score 500.0

actor loss 0.004885757541656494

critic loss 28.220895518794656

score 500.0
score 500.0

actor loss -6.081690788269043e-05

critic loss 28.08359229310751

score 500.0
score 500.0

actor loss 0.005756000113487244

critic loss 35.88666733201444

score 500.0
score 500.0

actor loss 0.008467297732830049

critic loss 42.53113812012226

score 500.0
score 500.0

actor loss 0.000510003650188446

critic loss 31.30594232539237

score 500.0
score 500.0

actor loss 0.0003594886302947998

critic loss 23.597463410919907

score 500.0
score 500.0

actor loss 2.6249098777770992e-05

critic loss 26.721395659446717

score 500.0
score 500.0

actor loss 0.001291020476818085

critic loss 27.470212843271717

score 500.0
score 500.0

actor loss 0.000988321316242218

critic loss 29.726751515720785

score 500.0
score 500.0

actor loss 0.0001675194263458252

critic lo

critic loss 37.14904368610679

score 500.0
score 500.0

actor loss -8.244239091873167e-05

critic loss 40.19301360436678

score 500.0
score 500.0

actor loss 0.0012594601869583132

critic loss 33.510149717879294

score 500.0
score 500.0

actor loss 3.232725858688351e-05

critic loss 34.15289694500863

score 500.0
score 500.0

actor loss 4.0720611810684196e-05

critic loss 38.64421237502694

score 500.0
score 500.0

actor loss 0.0013751930654048918

critic loss 33.51834381298422

score 500.0
score 500.0

actor loss 0.0003805495321750641

critic loss 17.13058975686431

score 500.0
score 500.0

actor loss -0.0010311065793037414

critic loss 30.32785051879883

score 500.0
score 500.0

actor loss 0.002098578119277954

critic loss 34.45151330320239

score 500.0
score 500.0

actor loss 0.0004085143268108368

critic loss 29.03779741157293

score 500.0
score 500.0

actor loss 2.0546644926071117e-05

critic loss 34.18142685257793

score 500.0
score 500.0

actor loss -0.0002746071815490723

criti

score 500.0

actor loss 0.0011887200474739075

critic loss 34.702153727984424

score 500.0
score 500.0

actor loss 0.03778240219950675

critic loss 43.88724877638817

score 500.0
score 500.0

actor loss -0.0002949815392494201

critic loss 47.412373999568814

score 500.0
score 500.0

actor loss 0.0001568289279937744

critic loss 32.620503861254456

score 500.0
score 500.0

actor loss -0.0020120023787021635

critic loss 33.03349642485678

score 500.0
score 500.0

actor loss 2.175199985504151e-06

critic loss 34.93976158634722

score 500.0
score 500.0

actor loss 0.0002549044072628022

critic loss 30.185787536650896

score 500.0
score 500.0

actor loss 2.601292729377748e-05

critic loss 32.131649480751165

score 500.0
score 500.0

actor loss 0.00019308158159255981

critic loss 39.36608220190406

score 500.0
score 500.0

actor loss -0.00125654786080122

critic loss 35.38134816613793

score 500.0
score 500.0

actor loss -0.00022116672992706296

critic loss 40.01118660084307

score 500.0
sco

score 327.74
score 327.46

actor loss -0.0010294623643159868

critic loss 4.81902964732796

score 328.38
score 327.98
score 326.88

actor loss -0.0020627673141658306

critic loss 2.8546800289362664

score 325.48
score 325.34
score 325.88

actor loss -0.0005236551642417908

critic loss 4.260878084430098

score 326.84
score 327.42
score 329.38

actor loss -0.006790733948780689

critic loss 2.6607242981258783

score 329.98
score 330.72

actor loss -0.0007872382700443269

critic loss 4.397832791155577

score 331.0
score 333.08
score 334.48

actor loss -0.0007365689784288407

critic loss 5.5850966038271785

score 334.66
score 336.94

actor loss 0.004556332951784134

critic loss 4.407981987064332

score 338.94
score 340.18
score 340.98

actor loss -0.004501442605257034

critic loss 2.0443045108512043

score 342.66
score 344.58

actor loss 0.002591690582036972

critic loss 6.829066689114273

score 348.06
score 350.38

actor loss -0.001006306618452072

critic loss 16.568467686516044

score 353

critic loss 30.423018278374524

score 477.2
score 477.2

actor loss 0.0016601444244384762

critic loss 22.774824539728463

score 479.38
score 479.38

actor loss 0.0003138895593583584

critic loss 19.33601366333961

score 479.38
score 479.38

actor loss 0.0015778910160064697

critic loss 20.709108640760185

score 479.38
score 480.48

actor loss 0.0006178768992424011

critic loss 22.172331010466813

score 482.66
score 484.44

actor loss 0.002664692234992981

critic loss 26.577593647332485

score 484.56
score 483.38

actor loss -0.00037649803161621086

critic loss 20.987896663590522

score 483.24
score 481.52

actor loss 3.6224424839019714e-06

critic loss 20.591007912677526

score 481.0
score 478.56
score 476.14

actor loss -0.00046940698623657224

critic loss 30.27659843168035

score 474.3
score 472.22

actor loss 0.004450602853298187

critic loss 18.403261527743933

score 470.62
score 470.62

actor loss 0.003035770094394684

critic loss 21.143957431763415

score 470.62
score 470.62

ac

score 358.74
score 358.88

actor loss 0.002251342010498047

critic loss 1.7137897452771664

score 358.38
score 358.92
score 359.4

actor loss 0.00659672673419118

critic loss 1.2754499363318086

score 359.22
score 360.28
score 359.96

actor loss 0.00725372059494257

critic loss 0.4860143672654405

score 362.1
score 363.18

actor loss 0.01583307124376297

critic loss 1.4133235484093427

score 364.38
score 366.14

actor loss 0.003445557184889912

critic loss 7.388841143316031

score 368.6
score 372.44

actor loss 0.010346703553199768

critic loss 2.2845382974565025

score 375.48
score 377.74

actor loss 0.02167645902633667

critic loss 5.0506363104052845

score 380.06
score 381.18
score 380.08

actor loss 0.0005618480086326599

critic loss 1.7183931446790695

score 378.22
score 377.74
score 377.0

actor loss 8.802947998046873e-05

critic loss 1.476448328104615

score 375.58
score 373.88
score 373.06

actor loss 0.001921232557296753

critic loss 0.9007308644410223

score 371.16
score 367.

critic loss 5.796911106225848

score 357.66
score 351.9
score 347.22
score 342.1

actor loss 7.005786895751954e-05

critic loss 4.827489016014338

score 338.7
score 334.3
score 329.68

actor loss 0.0050758917272090915

critic loss 2.223456732672453

score 325.0
score 319.3
score 314.38
score 308.66

actor loss 0.0009013457179069519

critic loss 4.493788382256031

score 303.1
score 298.28
score 292.78
score 287.52
score 281.9

actor loss 0.00144702787399292

critic loss 4.389597209677101

score 277.4
score 272.24
score 267.02
score 262.04

actor loss -0.0001627182312309742

critic loss 2.681831859754026

score 257.06
score 251.62
score 246.64
score 246.56

actor loss 0.0016365633308887482

critic loss 2.4432839882791044

score 242.3
score 238.48
score 234.88

actor loss 0.012563267576089129

critic loss 2.4528045036792756

score 235.98
score 238.12
score 240.64
score 243.08

actor loss 0.001061588108539581

critic loss 2.0610173837587236

score 245.04
score 246.52
score 248.18

actor lo


actor loss 0.012589392852783205

critic loss 1.1091842480927707

score 241.68
score 241.58
score 241.28
score 241.08
score 240.98

actor loss 0.026266338016092777

critic loss 1.942395421375334

score 241.08
score 241.14
score 241.36
score 241.42
score 241.66

actor loss 0.02360970428586006

critic loss 0.5805567164495588

score 241.74
score 241.68
score 242.04
score 242.2

actor loss 0.0017440897017717363

critic loss 0.205499105155468

score 242.7
score 242.62
score 242.42
score 241.98
score 241.66

actor loss 0.0013684810250997543

critic loss 0.7687049848452211

score 241.14
score 240.34
score 239.46
score 238.36

actor loss 0.008172218906879424

critic loss 0.12337626146823169

score 237.94
score 237.38
score 236.28
score 235.48

actor loss -0.001327036001905799

critic loss 0.13062019571214917

score 234.56
score 233.5
score 233.36
score 232.68

actor loss 0.0013924688994884492

critic loss 0.3706106752768159

score 231.12
score 230.28
score 228.7
score 226.96

actor loss 0.0019

critic loss 17.18780729894042

score 377.04
score 379.6
score 381.04
score 382.66
score 384.58

actor loss 0.0013762716829776767

critic loss 16.412262644900384

score 386.24
score 388.8
score 389.22
score 390.76

actor loss 0.0008792325284332035

critic loss 11.188207121288032

score 385.3
score 388.0
score 382.9
score 383.56

actor loss -0.00012058144807815552

critic loss 12.551781423851477

score 385.14
score 385.46
score 380.24
score 375.46

actor loss 0.00027025719881057736

critic loss 10.652999140186607

score 370.58
score 365.7
score 361.7

actor loss 0.0003586196437478066

critic loss 6.473716112299263

score 356.9
score 352.58
score 348.54
score 344.5

actor loss 0.007713070677220822

critic loss 8.210645486491547

score 344.5
score 344.5

actor loss 0.007988540172576906

critic loss 10.743553178036214

score 344.5
score 344.5

actor loss 0.007372122740745545

critic loss 12.158753152644636

score 344.5
score 344.5

actor loss 0.009732217979989946

critic loss 12.32400354869

critic loss 0.7686173961620777

score 216.48
score 216.68
score 216.86
score 217.02

actor loss 0.005582317551970482

critic loss 1.4944562364026903

score 217.06
score 217.12
score 217.32
score 217.1
score 217.36

actor loss 0.005863287552446127

critic loss 0.8156576212763786

score 217.48
score 217.56
score 217.68
score 217.58
score 217.58

actor loss -0.0015808821856975555

critic loss 1.7904875738829376

score 217.6
score 217.46
score 217.3
score 217.42
score 217.3

actor loss 0.00311356703042984

critic loss 2.4943443089276554

score 217.38
score 217.58
score 217.58
score 217.74
score 217.64

actor loss -0.00038569076582789416

critic loss 1.5374906858572273

score 217.1
score 216.7
score 216.42
score 216.2
score 215.9

actor loss 0.015393766352534293

critic loss 2.077121730667353

score 215.58
score 215.18
score 214.66
score 214.58
score 213.88

actor loss 0.007971943867206573

critic loss 2.859291788902879

score 213.3
score 212.84
score 212.26
score 211.82
score 210.9

actor 

score 370.3

actor loss 0.004678452967107296

critic loss 12.260885899373891

score 366.56
score 363.08
score 359.78

actor loss 9.562061429023742e-05

critic loss 12.826158133783935

score 356.68
score 353.16
score 349.42

actor loss 0.0008717337131500245

critic loss 12.0202384765774

score 346.04
score 345.66
score 345.54

actor loss -0.0014009272813796997

critic loss 11.441135376944766

score 345.04
score 344.52
score 344.42

actor loss 0.0005084499716758728

critic loss 11.093812058436125

score 343.06
score 342.52
score 338.6

actor loss 0.0021888136148452758

critic loss 11.048067210603506

score 338.12
score 336.04
score 335.24
score 333.88

actor loss 0.0012205649375915525

critic loss 16.660187601247987

score 332.32
score 329.86
score 328.98

actor loss 6.104709403589363e-05

critic loss 12.652230945735193

score 327.1
score 326.1
score 324.42

actor loss -0.0012750787980854513

critic loss 12.922612753461673

score 322.08
score 320.28
score 317.64
score 316.34

actor loss 

critic loss 0.668777466288954

score 303.14
score 304.14
score 305.86

actor loss 0.0023301901683211324

critic loss 0.7184599697167054

score 305.56
score 304.3
score 303.24

actor loss 0.0018676476418972017

critic loss 0.4118741879858076

score 302.7
score 303.34
score 303.44

actor loss 0.0017771911263465886

critic loss 1.3982082076728344

score 302.26
score 301.5
score 301.4

actor loss 0.006984492325037719

critic loss 0.16269156705625357

score 301.42
score 300.76
score 300.2
score 300.14

actor loss 0.005893333303928374

critic loss 0.25059568230174484

score 300.46
score 300.16
score 300.02

actor loss 0.00657446282505989

critic loss 0.13721044431626797

score 299.6
score 299.34
score 299.68
score 300.06

actor loss 0.00211858976483345

critic loss 0.11204755913205444

score 300.36
score 300.98
score 301.5

actor loss 0.00314447039142251

critic loss 0.1092111504200846

score 301.7
score 302.3
score 301.66
score 302.12

actor loss 0.0061288125932216645

critic loss 0.3120185

critic loss 0.5616322915084659

score 379.5
score 379.84
score 380.62

actor loss 0.011855719321966171

critic loss 0.33115215276628734

score 381.82
score 383.0

actor loss 0.010048212172091005

critic loss 0.678123193506524

score 385.54
score 387.66

actor loss 0.00987924497127533

critic loss 0.8875493149414659

score 389.72
score 391.14

actor loss 0.026336409172415736

critic loss 0.8648889766119421

score 392.42
score 391.52
score 389.72
score 388.7

actor loss 0.0010195673376321795

critic loss 0.62428761315234

score 388.14
score 387.38
score 386.96

actor loss 0.00044308679252862934

critic loss 0.9393400231666863

score 386.72
score 386.44
score 385.92

actor loss 0.0038207071095705037

critic loss 0.3605912026390433

score 385.38
score 384.78
score 383.7

actor loss 0.004813606190681457

critic loss 0.2746896051116288

score 382.7
score 380.68
score 378.76

actor loss 0.0005721111536026

critic loss 0.14989379645772277

score 377.18
score 375.46
score 373.9

actor loss 0.00

score 418.24

actor loss -0.00012889957427978516

critic loss 19.175712586939333

score 420.82
score 423.48

actor loss -6.531121730804444e-05

critic loss 19.402522455370427

score 426.3
score 429.12

actor loss 0.002230457925796509

critic loss 16.40257829120755

score 431.38
score 433.48

actor loss -0.0002261693060398102

critic loss 19.36223972104192

score 436.1
score 438.6

actor loss 0.0005176416635513305

critic loss 16.487004892867805

score 440.84
score 443.9

actor loss 5.598275661468505e-05

critic loss 15.10794106536135

score 446.96
score 449.5

actor loss 0.002269044780731201

critic loss 16.382989741294086

score 451.36
score 453.88

actor loss -7.619258165359499e-05

critic loss 14.514239052870124

score 456.02
score 457.66

actor loss 0.0011948567628860475

critic loss 15.584427897153796

score 460.08
score 462.3

actor loss 0.00016708091497421267

critic loss 17.289717517802863

score 464.32
score 465.86

actor loss 2.9945665597915643e-05

critic loss 12.54251794985

score 438.84

actor loss 0.000891972180455923

critic loss 0.30141968765333294

score 439.2
score 438.84
score 438.9

actor loss 0.0017466651499271392

critic loss 0.07145022912677376

score 440.34
score 440.94

actor loss 0.0008143392622470856

critic loss 0.8058134008619934

score 442.14
score 443.46

actor loss 0.021909167566895486

critic loss 0.7358621813960373

score 443.88
score 443.84

actor loss 0.0031656714558601375

critic loss 0.15501691029630604

score 442.96
score 442.36
score 441.78

actor loss 0.0050584931015968315

critic loss 0.648903529060632

score 440.26
score 440.62

actor loss 0.0066647269248962405

critic loss 0.03364133138768375

score 441.76
score 441.56
score 440.62

actor loss 0.018743502324819562

critic loss 0.687102602750808

score 438.82
score 438.02

actor loss 0.00439876454770565

critic loss 0.037596388528309765

score 435.4
score 433.18
score 431.34

actor loss 0.006888391388207673

critic loss 0.38531449989415706

score 430.28
score 429.52

actor lo

critic loss 3.4387350502386687

score 344.94
score 349.12

actor loss 0.001280831752717495

critic loss 2.760215411257744

score 353.02
score 356.96

actor loss 0.020997656377498057

critic loss 1.4276532671958206

score 360.64
score 363.6

actor loss 0.007584409311413766

critic loss 0.23255882642865178

score 366.76
score 367.72

actor loss 0.02972390441894531

critic loss 0.5424853379786014

score 369.4
score 371.54

actor loss 0.002024871981143951

critic loss 0.5652701493009925

score 379.62
score 387.4

actor loss -0.00029311225712299346

critic loss 4.956059025031328

score 396.28
score 404.4

actor loss -3.8470590114593505e-05

critic loss 7.475289062575996

score 411.28
score 413.84

actor loss -5.9593725204467784e-05

critic loss 7.471675606250763

score 421.28
score 428.9

actor loss -0.0001660089433193207

critic loss 3.8424296421840785

score 431.48
score 433.76

actor loss -0.000929937356710434

critic loss 3.1206868919968604

score 434.48
score 437.32

actor loss 0.00216

score 458.86
score 456.08

actor loss 0.019155222302675246

critic loss 1.3466308747068048

score 453.02
score 450.7
score 447.22

actor loss -0.0017356649547815323

critic loss 1.0028985751722008

score 442.82
score 438.14
score 433.46
score 428.46

actor loss -0.001215529102087021

critic loss 1.5884875007681551

score 425.04
score 421.38
score 418.58

actor loss 0.028704181826114655

critic loss 0.9749900788694621

score 415.5
score 413.1

actor loss 0.001882642126083374

critic loss 0.7163038669198751

score 410.56
score 409.52
score 407.64

actor loss 0.005360520747303962

critic loss 1.336316735753417

score 407.5
score 406.2

actor loss 0.007544035744667052

critic loss 1.308131414631009

score 405.76
score 405.68

actor loss 0.015003569102287295

critic loss 1.9666666106648745

score 404.9
score 404.12

actor loss 0.007775356668233871

critic loss 0.4675897167161107

score 402.66
score 402.56

actor loss 0.0032933708906173705

critic loss 1.6326942427888511

score 401.7
score 4

score 498.82
score 498.82

actor loss 0.00333807315826416

critic loss 4.521863609679043

score 498.82
score 498.82

actor loss 0.00017005487084388734

critic loss 3.1008387440931053

score 498.82
score 498.82

actor loss 0.0004471570611000061

critic loss 10.671549990374036

score 498.82
score 498.82

actor loss -2.075498104095459e-05

critic loss 9.560480314512176

score 498.82
score 498.82

actor loss 0.000132184636592865

critic loss 6.676988351564203

score 498.82
score 498.82

actor loss 0.0006413501612842082

critic loss 7.4116575510948906

score 498.82
score 498.82

actor loss 0.00015076583623886109

critic loss 11.547253191636875

score 498.82
score 498.82

actor loss 0.002655910181999207

critic loss 9.082486646169052

score 498.82
score 498.82

actor loss 0.0009034525394439698

critic loss 12.383201826679706

score 498.82
score 498.82

actor loss 0.00016715803295373917

critic loss 13.612966621753387

score 498.82
score 498.82

actor loss 0.0008169477462768554

critic loss 7

score 496.46

actor loss -0.0003148430109024047

critic loss 37.992152336391804

score 496.46
score 496.46

actor loss 0.0012009153246879578

critic loss 10.484770614543558

score 496.46
score 496.46

actor loss 0.0002689145773649216

critic loss 37.311620543622965

score 496.46
score 496.46

actor loss 0.00037007389068603513

critic loss 17.83888618456423

score 496.46
score 496.46

actor loss 0.001800493100937456

critic loss 18.56474103255868

score 496.46
score 496.46

actor loss 0.017363607668876645

critic loss 3.5311556023538118

score 496.46
score 496.72

actor loss 8.838481456041336e-05

critic loss 16.77616423254609

score 496.9
score 496.9

actor loss 0.0016432496786117554

critic loss 28.821143148608506

score 496.94
score 498.84

actor loss -0.0004781728863716125

critic loss 14.1445596306324

score 500.0
score 500.0

actor loss 0.0033292966615408653

critic loss 1.9454666220545764

score 500.0
score 500.0

actor loss -0.00010962443351745606

critic loss 13.208718644066156

critic loss 44.286480809187886

score 500.0
score 500.0

actor loss -7.133690565824509e-05

critic loss 43.6409899332881

score 500.0
score 500.0

actor loss 0.0010032704412937163

critic loss 42.17933505194187

score 500.0
score 500.0

actor loss 0.00015931731462478637

critic loss 42.35778659119606

score 500.0
score 500.0

actor loss 0.0007430809199810027

critic loss 43.21112073577642

score 500.0
score 500.0

actor loss 7.593977451324447e-06

critic loss 42.763931858878586

score 500.0
score 500.0

actor loss 0.0003109265565872192

critic loss 41.71504268542975

score 500.0
score 500.0

actor loss -0.0008116481840610504

critic loss 42.739434471623596

score 500.0
score 500.0

actor loss 0.00019055090546607972

critic loss 41.993099011534454

score 500.0
score 500.0

actor loss 0.0005038747549057007

critic loss 42.50320239254236

score 500.0
score 500.0

actor loss 0.0003414820045232773

critic loss 41.63240156565905

score 500.0
score 500.0

actor loss 0.0016541745126247404

cri

score 500.0
score 500.0

actor loss 0.00025238854587078096

critic loss 36.460473280125846

score 500.0
score 500.0

actor loss 0.000592555856704712

critic loss 33.531613583609456

score 500.0
score 500.0

actor loss -3.275007605552673e-05

critic loss 15.035870220653715

score 500.0
score 500.0

actor loss 0.0012255320623517038

critic loss 9.76337650600374

score 500.0
score 500.0

actor loss 0.016543646907806398

critic loss 4.283503716212511

score 500.0
score 500.0

actor loss 0.0001121811866760254

critic loss 33.74360528225451

score 500.0
score 500.0

actor loss -2.3436343669891353e-05

critic loss 28.4621590389993

score 500.0
score 500.0

actor loss 0.00014950375556945801

critic loss 27.536988238847254

score 500.0
score 500.0

actor loss 4.035865068435669e-05

critic loss 21.66958778448291

score 500.0
score 500.0

actor loss -0.0002402898550033569

critic loss 33.552283214503156

score 500.0
score 500.0

actor loss 0.0007920126438140868

critic loss 30.02051843431294

sco

critic loss 11.65794418294765

score 499.8
score 499.66

actor loss 0.006385963467881084

critic loss 8.137783709579704

score 499.66
score 499.66

actor loss 0.0036565013885498042

critic loss 5.84039617976956

score 499.66
score 499.66

actor loss 0.005316099399328232

critic loss 6.406193610256911

score 499.66
score 499.66

actor loss 0.0011238304734230038

critic loss 6.383941071610152

score 499.66
score 499.48

actor loss 0.007771063616871833

critic loss 7.2725230365484945

score 499.48
score 498.84

actor loss 0.00293688155412674

critic loss 8.066018765521049

score 497.78
score 497.08

actor loss 0.011165702986717225

critic loss 8.072637650012968

score 497.0
score 497.0

actor loss 0.008047226965427397

critic loss 6.98812004778385

score 496.66
score 496.66

actor loss 0.007326715959608555

critic loss 5.971951279753446

score 495.86
score 495.58

actor loss 0.005359541290998459

critic loss 6.537685280814768

score 494.58
score 494.58

actor loss 0.006790146771073341

cr

score 309.14

actor loss -0.0005377624332904816

critic loss 0.14829802287854252

score 311.36
score 312.5
score 313.54

actor loss 0.003329541802406311

critic loss 0.07085215595439076

score 314.66
score 315.46
score 315.76

actor loss 0.001059123945236206

critic loss 0.21067426599208267

score 316.22
score 317.52
score 319.16

actor loss 0.0015646204054355621

critic loss 0.47931975930631154

score 319.34
score 320.42
score 321.52

actor loss 0.001007241719961166

critic loss 0.07319091079663484

score 322.12
score 322.48
score 323.22

actor loss 0.015478596614301204

critic loss 0.07297159475665539

score 324.36
score 325.0
score 325.66

actor loss -1.3019335269927964e-05

critic loss 0.44579370069252333

score 326.2
score 326.62
score 327.16

actor loss 0.0009996378606185318

critic loss 0.7090060178195127

score 327.86
score 329.46
score 329.68

actor loss 0.00036372205466032035

critic loss 0.1010970602271147

score 330.56
score 331.0
score 331.44

actor loss 0.0106753860473632


actor loss 0.0009682889938354494

critic loss 0.14178803531229497

score 305.78
score 305.14
score 304.74

actor loss 0.006218689390271902

critic loss 0.15268410075204447

score 304.8
score 304.78
score 304.82
score 305.2

actor loss 0.015130079405568538

critic loss 0.309295116943866

score 305.36
score 305.04
score 305.86

actor loss 0.027774061387777334

critic loss 0.7554546782121062

score 305.6
score 305.46
score 304.74

actor loss 0.0024683426856994626

critic loss 0.13107068892791865

score 303.98
score 304.94
score 305.98

actor loss 0.003250646495819092

critic loss 0.12018434378504754

score 305.8
score 306.52
score 307.02

actor loss 0.007476498109102249

critic loss 0.12447555365748701

score 307.08
score 308.68

actor loss 0.0005851514577865599

critic loss 0.27115703774988653

score 310.64
score 312.66
score 315.16

actor loss 0.0016112618207931519

critic loss 0.3896932801309973

score 316.84
score 318.3
score 319.42

actor loss 0.004015192174911499

critic loss 0.109

critic loss 0.01751579689690843

score 428.96
score 429.86

actor loss 0.006160786764323712

critic loss 0.8713219153933226

score 429.88
score 431.94

actor loss 0.0035123557567596437

critic loss 0.3853710101741831

score 432.18
score 433.68

actor loss 0.0009695219457149504

critic loss 0.38995740760751074

score 434.56
score 433.72
score 434.64

actor loss 0.001025108915567398

critic loss 0.2702128295789473

score 436.62
score 438.26

actor loss -2.5314295291900634e-05

critic loss 1.9911945821005852

score 439.0
score 440.04

actor loss 0.0021023191392421725

critic loss 2.1300658155284817

score 441.78
score 443.42

actor loss 0.0008293417155742645

critic loss 0.03500382020547986

score 444.14
score 445.44

actor loss 0.0018803506925702095

critic loss 3.055697165867128

score 446.36
score 447.14

actor loss -1.7079198360443085e-05

critic loss 0.1385921912387013

score 448.92
score 451.02
score 451.32

actor loss 0.0011549937665462494

critic loss 0.0885530366643332

score 450

critic loss 23.886632038786264

score 500.0
score 500.0

actor loss 5.466032028198238e-06

critic loss 7.882310286103842

score 500.0
score 500.0

actor loss 0.000276352196931839

critic loss 8.161755649253726

score 500.0
score 500.0

actor loss -0.0006878172159194946

critic loss 7.485669328442496

score 500.0
score 500.0

actor loss 0.000544302561879158

critic loss 2.898014036758803

score 500.0
score 500.0

actor loss 0.0015800366863608362

critic loss 6.946779345769341

score 500.0
score 500.0

actor loss -4.581792354583739e-05

critic loss 8.588264888226615

score 500.0
score 500.0

actor loss 8.836361169815062e-05

critic loss 13.653666802429408

score 500.0
score 500.0

actor loss -6.686220169067384e-05

critic loss 24.83942510834634

score 500.0
score 500.0

actor loss -0.0002966066360473633

critic loss 20.74307983605862

score 500.0
score 500.0

actor loss -0.0002932274580001831

critic loss 22.64958426172398

score 500.0
score 500.0

actor loss 0.00028745182752609255

crit

critic loss 1.8466227394522168

score 472.0
score 470.42

actor loss 0.00733974437713623

critic loss 1.709508681011759

score 468.6
score 467.1

actor loss 0.009524039563164114

critic loss 1.9584721578855067

score 466.32
score 464.94
score 463.22

actor loss 0.007194064879417421

critic loss 1.783717120599933

score 461.1
score 459.36

actor loss 0.01696307544708252

critic loss 1.2414790130451323

score 458.6
score 456.58
score 454.64

actor loss 0.008912290182709693

critic loss 1.2269441441165283

score 451.96
score 450.62

actor loss 0.006836509144306183

critic loss 0.8210844915710389

score 447.58
score 444.78
score 442.28

actor loss 0.007318428981304169

critic loss 0.665903927925229

score 440.54
score 438.56

actor loss 0.001569923546910286

critic loss 0.5810458891929128

score 437.4
score 435.42
score 434.08

actor loss -0.001316282892227173

critic loss 0.5104714783961884

score 432.96
score 431.64

actor loss 0.007820096588134765

critic loss 0.3940999480202794

score 

critic loss 3.5690854248687627

score 497.48
score 498.58

actor loss 0.001317870280891657

critic loss 9.933965043220297

score 500.0
score 499.98

actor loss -0.0006635860115289688

critic loss 4.307755440297723

score 499.98
score 499.98

actor loss 0.00537615118920803

critic loss 3.6687711851418023

score 499.98
score 499.04
score 498.26

actor loss 0.0023977009296417234

critic loss 4.272293464550376

score 497.94
score 497.94

actor loss -0.00032104137986898424

critic loss 2.855942800857127

score 497.94
score 497.94

actor loss 5.186645984649658e-05

critic loss 3.0443790391966705

score 497.66
score 496.92

actor loss 0.0017266246929764748

critic loss 0.23021047513782977

score 496.54
score 496.54

actor loss 0.003969009113311767

critic loss 1.65468696359843

score 496.32
score 495.34

actor loss 0.0035578270465135577

critic loss 0.2490573342703283

score 494.16
score 494.16

actor loss -0.0023001986145973208

critic loss 6.849269661446661

score 494.16
score 494.16

actor

score 500.0
score 500.0

actor loss 0.015040563076734542

critic loss 1.3369691842139233

score 500.0
score 500.0

actor loss 0.002907242965698242

critic loss 30.6796323649697

score 500.0
score 500.0

actor loss 0.0003921894550323486

critic loss 40.67911888929643

score 500.0
score 500.0

actor loss 0.0004996900558471679

critic loss 20.25037511943467

score 500.0
score 500.0

actor loss -0.0007179974794387818

critic loss 14.42651359745525

score 500.0
score 500.0

actor loss 0.005925065475702286

critic loss 14.233338237100842

score 500.0
score 500.0

actor loss -0.0005059359550476075

critic loss 25.44820920290053

score 500.0
score 500.0

actor loss 0.001258146905899048

critic loss 31.37171634098366

score 500.0
score 500.0

actor loss 3.82633924484253e-05

critic loss 38.305538322247564

score 500.0
score 500.0

actor loss 0.0005959276914596557

critic loss 42.02776755634174

score 500.0
score 500.0

actor loss 0.0002935849685221911

critic loss 39.0413578754887

score 500.0


critic loss 10.344415173682572

score 500.0
score 500.0

actor loss 0.003243375644087791

critic loss 2.909633004489541

score 500.0
score 500.0

actor loss 0.014645716631412505

critic loss 3.8585423382818704

score 500.0
score 500.0

actor loss -1.0372385382652266e-06

critic loss 16.745961040335892

score 500.0
score 500.0

actor loss 0.00030106118768453597

critic loss 18.25528026497662

score 500.0
score 500.0

actor loss 0.00021955768764019015

critic loss 10.022315710407495

score 500.0
score 500.0

actor loss 0.001388567715883255

critic loss 26.24842603901923

score 500.0
score 500.0

actor loss 0.002525975823402405

critic loss 35.001368424791096

score 500.0
score 500.0

actor loss 5.261042416095734e-05

critic loss 20.50858052680045

score 500.0
score 500.0

actor loss 0.0003110427513718605

critic loss 17.0869572934866

score 500.0
score 500.0

actor loss 0.0008729586601257325

critic loss 19.687177264511586

score 500.0
score 500.0

actor loss 0.0002357723712921143

criti


actor loss 0.0009820120003074407

critic loss 34.246938569629194

score 500.0
score 500.0

actor loss -1.941848993301391e-05

critic loss 34.561431723137204

score 500.0
score 500.0

actor loss 0.0024669628888368605

critic loss 34.88561185379028

score 500.0
score 500.0

actor loss 0.0006308394551277161

critic loss 34.23580686199666

score 500.0
score 500.0

actor loss 0.000257567709684372

critic loss 33.58098332749604

score 500.0
score 500.0

actor loss 0.0004459386765956879

critic loss 32.45686753590107

score 500.0
score 500.0

actor loss 0.0005183205008506775

critic loss 32.452879914760594

score 500.0
score 500.0

actor loss -5.769055783748627e-05

critic loss 31.55691246267557

score 500.0
score 500.0

actor loss 0.0009660943150520326

critic loss 30.56715508161485

score 500.0
score 500.0

actor loss 0.0009792896389961244

critic loss 31.420975883150096

score 500.0
score 500.0

actor loss 0.0007313169956207274

critic loss 31.360230095601082

score 500.0
score 500.0

act

score 500.0
score 500.0

actor loss 0.0002451653480529785

critic loss 32.13971829971895

score 500.0
score 500.0

actor loss 0.0031932367008179426

critic loss 33.52264193071425

score 500.0
score 500.0

actor loss 0.0002869520425796509

critic loss 29.941870751249787

score 500.0
score 500.0

actor loss 0.00040042344331741334

critic loss 29.30212063900232

score 500.0
score 500.0

actor loss 0.000716937880218029

critic loss 26.06256414551437

score 500.0
score 500.0

actor loss 0.00014072729349136353

critic loss 29.41835999195576

score 500.0
score 500.0

actor loss 0.0010173964500427245

critic loss 27.65683422119916

score 500.0
score 500.0

actor loss 0.0005012897849082946

critic loss 26.8012899724558

score 500.0
score 500.0

actor loss 0.001955878272652626

critic loss 23.228132018107175

score 500.0
score 500.0

actor loss 0.009560454916954042

critic loss 27.050210443496706

score 500.0
score 500.0

actor loss 0.0002653094172477723

critic loss 39.21768346289695

score 500

score 500.0
score 500.0

actor loss 0.0008113425582647323

critic loss 27.69029142751694

score 500.0
score 500.0

actor loss 0.00034693415462970734

critic loss 24.32597885541916

score 500.0
score 500.0

actor loss 0.0008347387830726803

critic loss 28.159957642281057

score 500.0
score 500.0

actor loss 0.0004235199451446533

critic loss 34.542224427723895

score 500.0
score 500.0

actor loss 0.0004907981276512147

critic loss 35.562707905972005

score 500.0
score 500.0

actor loss 0.0003394815295934677

critic loss 34.80775123467147

score 500.0
score 500.0

actor loss 0.0005561981109902263

critic loss 36.14205176922083

score 500.0
score 500.0

actor loss 0.002084988653659821

critic loss 36.362445656108854

score 500.0
score 500.0

actor loss 0.0006663871765136719

critic loss 40.253877992129325

score 500.0
score 500.0

actor loss 0.005292098939418793

critic loss 41.162791239988806

score 500.0
score 500.0

actor loss -0.0005549493342638016

critic loss 29.166527663850786

sco

critic loss 18.804085390987993

score 500.0
score 500.0

actor loss 0.0002694488525390625

critic loss 22.47996078580469

score 500.0
score 500.0

actor loss 0.002448595213890076

critic loss 22.129790201726557

score 500.0
score 500.0

actor loss 0.0007180046439170838

critic loss 10.737880274367331

score 500.0
score 500.0

actor loss -0.00012672058343887328

critic loss 13.619603249269721

score 500.0
score 500.0

actor loss 0.0045628268420696266

critic loss 14.24008193655014

score 500.0
score 500.0

actor loss 0.003723250333964824

critic loss 7.2663756095528615

score 500.0
score 500.0

actor loss 0.015856504559516905

critic loss 4.77517447398901

score 500.0
score 500.0

actor loss 0.0038090822488069534

critic loss 7.040609952443839

score 500.0
score 500.0

actor loss 0.0014800388753414152

critic loss 7.735617193298042

score 500.0
score 500.0

actor loss 0.0018674304932355882

critic loss 4.938398193535209

score 500.0
score 500.0

actor loss 0.014859170791506768

critic l

critic loss 20.427993141400815

score 500.0
score 500.0

actor loss 0.0007373259305953979

critic loss 16.008712393212317

score 500.0
score 500.0

actor loss 0.001188701444864273

critic loss 27.351001627564433

score 500.0
score 500.0

actor loss 0.0008944370090961456

critic loss 25.636978774142268

score 500.0
score 500.0

actor loss 0.0007300808787345886

critic loss 26.662399729704855

score 500.0
score 500.0

actor loss 0.0015736101001501083

critic loss 22.07603893698454

score 500.0
score 500.0

actor loss 0.00013057987391948699

critic loss 24.540251457649468

score 500.0
score 500.0

actor loss 0.0021305307149887083

critic loss 24.44962760334015

score 500.0
score 500.0

actor loss 0.00038875201456248763

critic loss 9.603905888783931

score 500.0
score 500.0

actor loss 0.0077785282373428345

critic loss 6.723186485099792

score 500.0
score 500.0

actor loss 0.0074126984119415274

critic loss 9.379218608796595

score 500.0
score 500.0

actor loss 0.005433495140075683

crit

critic loss 1.7024506150104106

score 500.0
score 500.0

actor loss 4.386901855465302e-09

critic loss 4.799415116035194

score 500.0
score 500.0

actor loss 0.0013948618561029434

critic loss 3.459605355091393

score 500.0
score 500.0

actor loss -0.0020008715331554412

critic loss 6.424648690280319

score 500.0
score 500.0

actor loss 0.00013469667434692383

critic loss 5.200144060763717

score 500.0
score 500.0

actor loss 0.0009923483788967132

critic loss 9.807652162465454

score 500.0
score 500.0

actor loss -0.001045877194404602

critic loss 19.092163582473994

score 500.0
score 500.0

actor loss 0.0006447383642196654

critic loss 17.809036605935916

score 500.0
score 500.0

actor loss -0.001648553991317749

critic loss 20.310547393336897

score 500.0
score 500.0

actor loss 8.970370292663577e-05

critic loss 25.942674682581423

score 500.0
score 500.0

actor loss 0.00028505274057388303

critic loss 21.234418776565786

score 500.0
score 500.0

actor loss 0.0007701020121574402

c


actor loss -0.0006247340083122253

critic loss 15.656507900226117

score 500.0
score 500.0

actor loss -0.001194222855567932

critic loss 17.678197770230476

score 500.0
score 500.0

actor loss -0.0006693987369537353

critic loss 14.622071375644207

score 500.0
score 500.0

actor loss 0.002002315878868103

critic loss 7.380918466037512

score 500.0
score 500.0

actor loss 0.0009160525321960449

critic loss 5.788468568827211

score 500.0
score 500.0

actor loss 0.0009586112260818481

critic loss 5.742339699874818

score 500.0
score 500.0

actor loss 7.6772141456604e-05

critic loss 8.746380874559284

score 500.0
score 500.0

actor loss 0.001963656044006348

critic loss 10.510849783450364

score 500.0
score 500.0

actor loss 3.7949705123901364e-05

critic loss 5.785986771064996

score 500.0
score 500.0

actor loss -0.000433550214767456

critic loss 10.28232144662477

score 500.0
score 500.0

actor loss 0.001508000287413597

critic loss 14.369768982498348

score 500.0
score 500.0

actor 

critic loss 2.680423773112893

score 500.0
score 500.0

actor loss 0.002748422503471375

critic loss 3.139862287151814

score 500.0
score 500.0

actor loss 0.00475100927731255

critic loss 4.762703762802482

score 500.0
score 500.0

actor loss -0.00047884337902069093

critic loss 5.613357997043431

score 500.0
score 500.0

actor loss 0.0059826500892639165

critic loss 2.9357500496387487

score 500.0
score 500.0

actor loss 0.003552775144577026

critic loss 1.6295214814811945

score 500.0
score 500.0

actor loss 0.001953992825746536

critic loss 2.2573317855596544

score 500.0
score 500.0

actor loss 0.00829076531678438

critic loss 4.718161220599338

score 500.0
score 500.0

actor loss -0.001092201691865921

critic loss 8.97349233595282

score 500.0
score 500.0

actor loss 0.004684673927724361

critic loss 5.778313994778692

score 500.0
score 500.0

actor loss 0.0006735615342855453

critic loss 5.130795967932046

score 500.0
score 500.0

actor loss 0.002292627435922623

critic loss 3.4

score 500.0
score 500.0

actor loss 0.0007940902590751647

critic loss 30.57545044466257

score 500.0
score 500.0

actor loss 4.105081260204315e-05

critic loss 32.99956356058269

score 500.0
score 500.0

actor loss 0.00046677786558866507

critic loss 34.55252270112485

score 500.0
score 500.0

actor loss 0.00015458247661590576

critic loss 42.722944371990856

score 500.0
score 500.0

actor loss -4.5536430180072776e-05

critic loss 40.4064600225091

score 500.0
score 500.0

actor loss 0.0003643987417221069

critic loss 42.381466899365186

score 500.0
score 500.0

actor loss 0.0010995223760604856

critic loss 43.14037073978782

score 500.0
score 500.0

actor loss 0.0001314862489700317

critic loss 42.47194753746986

score 500.0
score 500.0

actor loss 0.00016362035274505616

critic loss 44.93250597007871

score 500.0
score 500.0

actor loss 0.00038542118072509764

critic loss 45.84625272520184

score 500.0
score 500.0

actor loss 0.00010074764490127564

critic loss 45.09892484716475

sc

critic loss 3.054432066088915

score 500.0
score 498.94

actor loss 0.007531803870201111

critic loss 6.972701324833929

score 498.0
score 497.38

actor loss 0.009772273441404102

critic loss 7.166402188679575

score 494.82
score 491.28
score 488.5

actor loss 0.008102201652526857

critic loss 7.890243960750103

score 484.72
score 481.42
score 478.5

actor loss 0.0034043973803520207

critic loss 5.1860430234745145

score 475.98
score 473.64
score 471.36

actor loss 0.012998434042930603

critic loss 3.695226845785976

score 470.32
score 469.6

actor loss 0.0034995941430330272

critic loss 3.1330021276421847

score 468.04
score 465.6

actor loss 0.003612672185897827

critic loss 2.4516141909360885

score 464.26
score 462.02
score 459.16

actor loss 0.009869404023885727

critic loss 1.700369341826439

score 457.44
score 457.44

actor loss 0.00497847146987915

critic loss 1.214916468244791

score 457.44
score 455.46

actor loss 0.004814914594590664

critic loss 1.211333771339059

score 455

actor loss 0.009854034340381623

critic loss 2.3467896738052363

score 490.4
score 490.4

actor loss 0.002924017110271962

critic loss 22.144659498000145

score 491.5
score 492.02

actor loss 0.00017588670551776884

critic loss 24.432108225625008

score 492.02
score 492.9

actor loss 0.003474245262145996

critic loss 25.343417979119344

score 495.32
score 497.48

actor loss 2.099312543869019e-05

critic loss 25.17570513224155

score 497.48
score 499.36

actor loss 0.01112825677394867

critic loss 2.545886771170423

score 499.94
score 499.7

actor loss 0.012888234567642213

critic loss 4.125467837262899

score 499.7
score 499.7

actor loss -0.0006602732758969068

critic loss 3.88361013572365

score 499.7
score 499.7

actor loss 0.00032427225112915037

critic loss 7.62099498324357

score 499.7
score 499.7

actor loss 4.828030318021774e-05

critic loss 3.029282025797851

score 499.7
score 499.7

actor loss 0.002831990221142769

critic loss 3.220139939871431

score 499.7
score 499.7

actor

critic loss 3.7384069797798993

score 495.28
score 495.28

actor loss -0.0005216331720352173

critic loss 14.636012310996652

score 495.28
score 495.28

actor loss 9.538873434066777e-05

critic loss 14.777050970402362

score 495.28
score 495.28

actor loss 8.79931926727295e-05

critic loss 16.94890479308069

score 495.28
score 495.28

actor loss -0.0005348371267318725

critic loss 21.512743108350037

score 495.28
score 495.28

actor loss -0.0006532004028558731

critic loss 6.419814079369606

score 495.28
score 495.28

actor loss -0.0006912378668785096

critic loss 21.037066108045913

score 495.28
score 495.28

actor loss 0.0011363293655216693

critic loss 11.379233374902608

score 495.28
score 495.28

actor loss 0.0001261461853981018

critic loss 18.49821022363603

score 495.28
score 495.28

actor loss -0.0004715236663818359

critic loss 26.565665149929373

score 495.28
score 495.28

actor loss 0.00043526260256767274

critic loss 19.59484711245298

score 495.28
score 495.28

actor loss

score 473.22

actor loss 8.266199827194212e-05

critic loss 16.720328549542465

score 475.18
score 476.38

actor loss 0.004376661587506533

critic loss 0.33484164018742735

score 479.02
score 481.46

actor loss -0.00014473819434642792

critic loss 34.482698468890035

score 483.78
score 486.06

actor loss -0.0030661270737648008

critic loss 15.204860637373477

score 487.9
score 488.8

actor loss -0.0002489461064338684

critic loss 37.883232657280566

score 490.46
score 491.78

actor loss 8.900527954101561e-05

critic loss 45.6729373913154

score 491.78
score 492.76

actor loss -0.0005176616430282593

critic loss 43.32081355002224

score 492.96
score 493.98

actor loss -0.00016789176464080812

critic loss 9.646052774639054

score 493.98
score 494.16

actor loss 0.001523773992061615

critic loss 43.390649319523575

score 494.16
score 494.84

actor loss -1.293469667434692e-05

critic loss 43.244478313411776

score 494.84
score 494.84

actor loss 0.00038536617755889895

critic loss 44.05635

score 500.0
score 500.0

actor loss 0.0010806073904037477

critic loss 40.290763690459734

score 500.0
score 500.0

actor loss -5.480690002441402e-05

critic loss 40.74632841457278

score 500.0
score 500.0

actor loss 4.622006416320803e-06

critic loss 38.29524778600931

score 500.0
score 500.0

actor loss 0.00014074261188507078

critic loss 38.64757126467227

score 500.0
score 500.0

actor loss -3.85224461555481e-05

critic loss 39.22429474321007

score 500.0
score 500.0

actor loss 0.00023669182062149055

critic loss 38.54575652503371

score 500.0
score 500.0

actor loss 0.0011340250730514528

critic loss 37.8903502843976

score 500.0
score 500.0

actor loss -0.0008464493632316589

critic loss 37.816488932180405

score 500.0
score 500.0

actor loss 7.6095581054687505e-06

critic loss 37.35739951614738

score 500.0
score 500.0

actor loss 4.4579219818115236e-05

critic loss 36.51410261887311

score 500.0
score 500.0

actor loss 0.0026363684773445134

critic loss 36.52855267838835

sco

critic loss 29.085063093018533

score 500.0
score 500.0

actor loss -0.00026917492747306824

critic loss 32.71462153254747

score 500.0
score 500.0

actor loss -3.1347799301147456e-05

critic loss 32.590674589586264

score 500.0
score 500.0

actor loss 0.00046150585561990736

critic loss 32.621403173303605

score 500.0
score 500.0

actor loss 0.0001056420922279358

critic loss 33.67598744354248

score 500.0
score 500.0

actor loss 0.00511875835955143

critic loss 32.54342854012251

score 500.0
score 500.0

actor loss -0.0010457355231046675

critic loss 37.05957189365402

score 500.0
score 500.0

actor loss 0.003917209587991239

critic loss 23.696176822149752

score 500.0
score 500.0

actor loss -3.635716438293457e-05

critic loss 35.81442779456377

score 500.0
score 500.0

actor loss 0.0005682165265083313

critic loss 36.19681954874992

score 500.0
score 500.0

actor loss 0.0023354999065399165

critic loss 35.0848539860487

score 500.0
score 500.0

actor loss -0.0001667018294334412

cr

score 500.0

actor loss -0.0002791476249694824

critic loss 42.234455757573244

score 500.0
score 500.0

actor loss -5.0378084182739255e-05

critic loss 42.58220361504554

score 500.0
score 500.0

actor loss -3.481173515319825e-05

critic loss 42.53135587773919

score 500.0
score 500.0

actor loss -0.0006453025102615358

critic loss 42.832546415030954

score 500.0
score 500.0

actor loss -2.0021605491638186e-05

critic loss 40.958996576279404

score 500.0
score 500.0

actor loss -0.0008625030994415283

critic loss 40.61188821659386

score 500.0
score 500.0

actor loss -0.00043827705383300787

critic loss 42.81605137314499

score 500.0
score 500.0

actor loss -2.6155710220336907e-05

critic loss 42.17627931667268

score 500.0
score 500.0

actor loss -2.1198248863220216e-05

critic loss 40.93940255006552

score 500.0
score 500.0

actor loss 0.0001369457960128784

critic loss 43.05534245162606

score 500.0
score 500.0

actor loss 0.0004173794984817504

critic loss 41.708585593998436

scor

critic loss 39.58028189676479

score 498.32
score 498.32

actor loss -0.0008295381307601927

critic loss 39.189234184086324

score 498.32
score 498.32

actor loss 0.00163478946685791

critic loss 39.06274471304416

score 498.32
score 498.32

actor loss 0.0001401260554790497

critic loss 41.90907727996782

score 498.32
score 498.32

actor loss -0.00022305311560630797

critic loss 39.18609090006426

score 498.32
score 498.32

actor loss 0.00013069390058517455

critic loss 39.84080805485248

score 498.32
score 498.32

actor loss -1.5592193603515627e-05

critic loss 36.08677711374611

score 498.32
score 498.32

actor loss 0.002045118165016174

critic loss 34.973653874954586

score 498.32
score 498.32

actor loss 0.008677990394830703

critic loss 25.358312002268434

score 498.32
score 498.32

actor loss -4.109787940979004e-06

critic loss 38.907183526188085

score 498.32
score 498.32

actor loss 0.0005949018836021423

critic loss 38.2665100301601

score 498.32
score 498.32

actor loss 7.056

critic loss 40.569684065699576

score 500.0
score 500.0

actor loss -3.362438678741455e-05

critic loss 39.31503255180418

score 498.3
score 498.3

actor loss 0.00011362421512603757

critic loss 43.77207353301328

score 498.3
score 498.3
score 491.92

actor loss -0.00013707957267761233

critic loss 64.94974432713687

score 486.86
score 486.86

actor loss -0.00026482903063297273

critic loss 43.075533723126355

score 486.86
score 486.86

actor loss 0.00012030889540910721

critic loss 41.13101880628392

score 486.86
score 486.86

actor loss 0.0006857921499642544

critic loss 43.35169814538359

score 486.86
score 486.86

actor loss -6.805452108383177e-05

critic loss 42.3582253949523

score 486.86
score 486.86

actor loss -5.7775616645812986e-05

critic loss 41.62630680110455

score 486.86
score 486.86

actor loss 0.00013412150740623474

critic loss 41.26035498172343

score 486.86
score 486.86

actor loss 0.0010367509603500364

critic loss 38.63071291353703

score 486.86
score 486.86

act

score 500.0
score 500.0

actor loss -7.410343885421754e-05

critic loss 39.61411150292159

score 500.0
score 500.0

actor loss -0.0007076508939266205

critic loss 38.319359734678265

score 500.0
score 500.0

actor loss -0.00017387357354164124

critic loss 38.94935246109963

score 500.0
score 500.0

actor loss 0.0018491254180669787

critic loss 38.64732089646161

score 500.0
score 500.0

actor loss 0.00033554173707962034

critic loss 39.7572740624398

score 500.0
score 500.0

actor loss -0.0008369360208511352

critic loss 39.792796214982864

score 500.0
score 500.0
score 495.0

actor loss 8.175582587718964e-05

critic loss 58.28094547080398

score 495.0
score 495.0

actor loss 0.0007580214500427247

critic loss 39.617236271136996

score 495.0
score 488.22

actor loss 0.0005116033315658569

critic loss 36.6787804038927

score 488.22
score 488.22

actor loss 0.0022236013382673264

critic loss 36.99598558635414

score 488.22
score 488.22

actor loss 0.0006938730180263519

critic loss 37.09

critic loss 36.479244182646276

score 500.0
score 500.0

actor loss 0.00010056252479553223

critic loss 38.95803985976577

score 500.0
score 500.0

actor loss 0.0002618062734603882

critic loss 38.90757684281171

score 500.0
score 500.0

actor loss 0.000761023211479187

critic loss 38.0834534936227

score 500.0
score 500.0

actor loss 0.002277930438518524

critic loss 40.60310494038909

score 500.0
score 500.0

actor loss 0.0008390925407409667

critic loss 38.197277074348925

score 500.0
score 500.0

actor loss -0.0001254910230636597

critic loss 36.95237329339087

score 500.0
score 500.0

actor loss 0.001081404972076416

critic loss 38.155555579102035

score 500.0
score 500.0

actor loss 0.00339834771156311

critic loss 38.565889306241274

score 500.0
score 500.0

actor loss -5.5737900733947754e-05

critic loss 38.86481500868797

score 500.0
score 500.0

actor loss -2.254927158355713e-05

critic loss 37.093838120624426

score 500.0
score 500.0

actor loss 0.0008577221512794496

critic

score 500.0

actor loss 0.0006062416076660156

critic loss 41.16500029280186

score 500.0
score 500.0

actor loss -3.1608200073242214e-05

critic loss 41.380266180222485

score 500.0
score 500.0

actor loss 0.0008355119347572326

critic loss 41.00593654309362

score 500.0
score 500.0

actor loss -3.730003833770752e-05

critic loss 43.94669240486026

score 500.0
score 500.0

actor loss 0.0006520366430282593

critic loss 41.424383300048106

score 500.0
score 500.0

actor loss 1.5763425827026365e-05

critic loss 45.294343230974675

score 500.0
score 500.0

actor loss -2.2608232498168942e-05

critic loss 42.65735730356276

score 500.0
score 500.0

actor loss 0.00045157878398895265

critic loss 43.398435863498975

score 500.0
score 500.0

actor loss 0.0011368844270706177

critic loss 42.52944102132618

score 500.0
score 500.0

actor loss 0.0002224318027496338

critic loss 40.353913753198086

score 500.0
score 500.0

actor loss -0.0002136002063751221

critic loss 41.29410523155034

score 500

actor loss 0.0014967981338500976

critic loss 65.14563837978841

score 383.04
score 373.28
score 373.28

actor loss 0.0021623010396957395

critic loss 47.40402119088769

score 373.28
score 373.28

actor loss 0.003963877975940704

critic loss 34.324730115282534

score 373.28
score 363.52
score 363.56
score 363.56

actor loss 0.002506742024421692

critic loss 61.00908281419278

score 363.56
score 373.32

actor loss 9.981347322463988e-05

critic loss 36.24943234678507

score 373.32
score 373.32
score 373.32
score 363.54
score 353.76
score 343.98
score 334.22

actor loss 0.0033075775146484375

critic loss 96.55859380133151

score 343.98
score 343.98
score 343.88

actor loss 0.00041653112173080446

critic loss 42.68846467780471

score 343.88
score 334.1

actor loss 0.0011651447772979737

critic loss 23.53050718635321

score 343.84
score 343.84
score 334.1

actor loss 0.0008215506374835967

critic loss 43.15740514673888

score 334.1
score 334.28
score 324.5
score 314.82
score 305.06
score 30

score 500.0
score 500.0

actor loss 0.00041729300022125244

critic loss 32.470159345789256

score 500.0
score 500.0

actor loss 0.00019666463136672972

critic loss 29.10951808231771

score 500.0
score 500.0

actor loss 0.0026275686502456666

critic loss 31.460652628326415

score 500.0
score 500.0

actor loss 0.0003687424778938294

critic loss 22.787097946065664

score 500.0
score 500.0

actor loss 0.0008657516717910767

critic loss 33.20503415911794

score 500.0
score 500.0

actor loss 0.00011686091423034669

critic loss 24.588189199585468

score 500.0
score 500.0

actor loss 0.0001329814553260803

critic loss 21.10171739976294

score 500.0
score 500.0

actor loss 0.0016457596376538274

critic loss 10.305292598609626

score 500.0
score 500.0

actor loss 0.004438533377647399

critic loss 29.58131135047451

score 500.0
score 500.0

actor loss 0.0007004023194313049

critic loss 31.231474492213135

score 500.0
score 500.0

actor loss 0.0005625132620334626

critic loss 31.229023749768736

s


actor loss 0.0004444414734840393

critic loss 25.519383123244346

score 470.42
score 470.42

actor loss -4.427535533905029e-05

critic loss 32.16412167324424

score 470.42
score 470.42

actor loss 0.0022391402721405025

critic loss 33.97682547263206

score 470.42
score 480.18

actor loss 0.00045037412643432614

critic loss 30.689181901484726

score 489.96
score 490.16

actor loss 0.001752717661857605

critic loss 35.97634999742135

score 490.16
score 490.24

actor loss 0.0006689775362610816

critic loss 23.154683501674604

score 490.24
score 490.24

actor loss 0.00018835527896881102

critic loss 19.39655117686838

score 490.24
score 490.24

actor loss 0.0006032137870788574

critic loss 24.265524866020677

score 490.24
score 490.24

actor loss 0.0009815436005592346

critic loss 23.705794954448937

score 490.24
score 490.24

actor loss 0.005824021960794926

critic loss 14.396534816224875

score 490.24
score 490.24

actor loss 0.0006584401607513427

critic loss 28.50303874842524

score 4

score 498.14
score 498.14

actor loss -6.599831581115722e-06

critic loss 18.269065861096607

score 498.08
score 498.66

actor loss 0.01905319412946701

critic loss 3.524114311417937

score 499.76
score 498.74

actor loss 0.0036481767207384107

critic loss 0.7686874897181987

score 498.08
score 497.54

actor loss -1.4956772327423095e-06

critic loss 0.6613296962302179

score 496.6
score 494.98
score 493.82

actor loss 0.01069178641885519

critic loss 1.082772447898984

score 493.82
score 493.82

actor loss 1.406886577606201e-05

critic loss 8.540031532756053

score 493.82
score 493.82

actor loss 0.004904518914222717

critic loss 0.9589243619713932

score 493.82
score 493.82

actor loss -1.4245405793190002e-06

critic loss 1.435472253068164

score 493.82
score 493.8

actor loss 0.0012096626102924344

critic loss 2.7052353190541267

score 493.06
score 492.74

actor loss -0.0003985201299190521

critic loss 0.702170684787631

score 492.74
score 492.74

actor loss 0.00852508182525635

crit

critic loss 0.1285504982173443

score 407.18
score 407.7

actor loss 0.0035193039085716004

critic loss 1.3966817694444207

score 406.38
score 406.4

actor loss 0.004089924025535584

critic loss 0.1725325997762382

score 407.02
score 407.7

actor loss -1.5405392646789552e-05

critic loss 0.7014750991482288

score 408.46
score 410.0
score 410.16

actor loss -9.958809614181518e-06

critic loss 0.6491165237031877

score 412.16
score 412.52

actor loss -8.049454689025879e-05

critic loss 0.6810110528565942

score 413.08
score 415.02

actor loss 0.005401468276977539

critic loss 0.18329501260221004

score 416.6
score 416.72
score 417.34

actor loss 0.014367554485797884

critic loss 1.4752723319023846

score 418.08
score 421.72

actor loss 0.00026287999600172043

critic loss 7.462271249631047

score 423.66
score 423.04

actor loss 0.009620290660858153

critic loss 2.7443506077885624

score 423.94
score 425.78

actor loss -1.4558386802673338e-05

critic loss 7.858156884762645

score 426.98
sc

critic loss 3.5653668265614655

score 447.68
score 447.68

actor loss -1.3342738151550295e-05

critic loss 1.9907288083516061

score 446.3
score 446.1

actor loss 0.008278879404067994

critic loss 1.570349718561396

score 446.1
score 446.1

actor loss 0.004728871774673462

critic loss 2.5788804609730844

score 446.1
score 446.1

actor loss 0.0025824059009552

critic loss 3.993449800401554

score 446.1
score 446.1

actor loss 0.009776148343086244

critic loss 2.5207259571492675

score 446.1
score 446.1

actor loss 0.009461932031810285

critic loss 2.1005187669098375

score 446.1
score 446.1

actor loss 0.007166267383098603

critic loss 3.1479369083188473

score 446.1
score 446.1

actor loss 0.003066851208172739

critic loss 4.074399096295982

score 446.1
score 445.46

actor loss 0.05674031207561493

critic loss 3.2117306625388564

score 445.46
score 445.46

actor loss 0.0017212012984789908

critic loss 4.531361581254005

score 443.66
score 453.42

actor loss 0.0009109488546848296

criti

critic loss 2.368244713049382

score 494.42
score 494.42

actor loss -2.282273769378662e-05

critic loss 10.522062777478247

score 494.42
score 494.42

actor loss 4.5357644557952796e-07

critic loss 1.4016939401453827

score 494.42
score 493.24

actor loss -3.139655888080597e-05

critic loss 2.231660319904983

score 492.46
score 492.46

actor loss 0.0015957562148571016

critic loss 7.004575217816234

score 490.9
score 487.76
score 486.4

actor loss 0.005989841182529926

critic loss 0.2340233024279587

score 486.52
score 485.02

actor loss -6.80685043334961e-09

critic loss 0.14630477923825386

score 483.16
score 482.66

actor loss 0.009422026109695435

critic loss 0.22321198312677443

score 482.8
score 481.58

actor loss 3.15585732460022e-05

critic loss 0.7316428603887558

score 481.36
score 480.92
score 481.0

actor loss 0.01781176798939705

critic loss 0.22754447901844982

score 481.58
score 481.12

actor loss 0.0044956400930881504

critic loss 0.7458092716172338

score 478.48
score

score 384.02
score 376.82
score 377.6

actor loss 0.0009575469017028809

critic loss 15.297923029544577

score 374.78
score 373.34
score 372.72

actor loss 0.013704176509380338

critic loss 0.29619879512451586

score 372.72
score 372.56

actor loss 0.00863651076555252

critic loss 2.604499471011013

score 375.04
score 376.06

actor loss 0.00967038258612156

critic loss 2.6518008948490026

score 377.24
score 378.42

actor loss 0.005855043622851372

critic loss 2.3920616322454067

score 380.26
score 382.54

actor loss 0.018005544888973237

critic loss 2.705842474400625

score 382.16
score 385.6

actor loss -8.868753910064711e-07

critic loss 10.41076061950773

score 389.1
score 392.16

actor loss 0.002340026503801346

critic loss 10.218007160262019

score 396.04
score 397.22

actor loss -0.00012278831005096434

critic loss 18.77972800173238

score 400.66
score 404.54

actor loss 0.00024782993793487547

critic loss 13.817487477785349

score 406.26
score 410.88

actor loss 0.00857107493057

score 425.82

actor loss 0.0010245041966438291

critic loss 0.7147905339863151

score 426.6
score 427.4

actor loss -0.0003822652347327676

critic loss 0.07087218583039939

score 430.42
score 432.56

actor loss 0.0013324921607971191

critic loss 0.4406700833827257

score 433.32
score 433.26
score 433.32

actor loss 0.0005326892886310815

critic loss 0.1933624816558324

score 433.96
score 433.88

actor loss 0.0011735694468021393

critic loss 1.1989550565987828

score 436.3
score 435.38
score 433.0

actor loss 0.006579364725202322

critic loss 0.09562499040104448

score 432.92
score 432.48

actor loss 0.003798525238037109

critic loss 0.1528699609486386

score 431.72
score 430.66
score 429.86

actor loss 0.0006896673202514648

critic loss 0.24094621260678398

score 429.42
score 429.7

actor loss 0.0008973213672637941

critic loss 0.19269132260978222

score 428.98
score 426.84
score 425.58

actor loss 0.0010083640694618225

critic loss 0.18238068932723256

score 423.62
score 422.52

actor

score 499.66

actor loss 5.924934148788452e-06

critic loss 7.898342557442189

score 499.66
score 499.66

actor loss 0.0031986331939697263

critic loss 3.2752853749597444

score 499.66
score 499.78

actor loss 0.0009071262072771789

critic loss 3.8630743441604074

score 499.78
score 499.78

actor loss 0.014520742321014407

critic loss 0.660887120115757

score 499.78
score 499.78

actor loss 0.0008454881072044373

critic loss 6.32519180631116

score 499.78
score 499.78

actor loss 0.004689177346229553

critic loss 2.962343131642044

score 499.78
score 499.78

actor loss 0.0024459016516804695

critic loss 4.621288466045261

score 499.78
score 499.78

actor loss -7.54569560289383e-05

critic loss 2.5698574645660814

score 500.0
score 500.0

actor loss 0.0007754040658473968

critic loss 11.730757413657756

score 500.0
score 500.0

actor loss 0.004532288841903211

critic loss 3.3385103762667625

score 500.0
score 500.0

actor loss 0.0006643427699804305

critic loss 7.4316544735591865

score

critic loss 0.3380437937043607

score 460.5
score 457.42

actor loss 0.01661729247570038

critic loss 0.35563529822677376

score 455.56
score 453.58
score 452.18

actor loss 0.00063095520734787

critic loss 0.13306677848510445

score 450.58
score 449.58

actor loss 0.0037499632358551026

critic loss 0.9515404619239269

score 447.94
score 445.52
score 444.04

actor loss 0.0015078243255615231

critic loss 0.12659742575362326

score 444.74
score 443.12

actor loss 0.0014967007398605345

critic loss 0.15139312722943724

score 441.78
score 443.38
score 443.76

actor loss -3.2845497131347654e-06

critic loss 0.07199638782590627

score 445.62
score 445.16

actor loss 0.002944052982330322

critic loss 0.5457690896034241

score 446.92
score 445.9
score 444.58

actor loss 0.01052138161212206

critic loss 0.06918324795775115

score 442.98
score 441.96

actor loss 0.015673648381233217

critic loss 0.1321013340082951

score 440.98
score 440.46

actor loss 0.0008640961021184921

critic loss 0.620403

score 409.48
score 409.74

actor loss 0.0034239290714263917

critic loss 2.1059901829600336

score 410.3
score 410.98

actor loss 0.006666336531937123

critic loss 0.09033709708750248

score 411.64
score 411.68
score 411.7

actor loss 0.0010620121121406555

critic loss 0.14189205205496397

score 412.32
score 412.9

actor loss 5.5039489269256585e-05

critic loss 0.1369952091321349

score 412.74
score 412.06
score 411.28

actor loss -0.0003938966989517212

critic loss 0.19040583736151456

score 411.1
score 413.04

actor loss 0.00721254848241806

critic loss 0.12383389966897666

score 412.9
score 414.5

actor loss 0.0018953212141990662

critic loss 3.118907176525891

score 415.88
score 417.12
score 418.58

actor loss 0.01112912788391113

critic loss 0.29553515196293595

score 420.2
score 421.96

actor loss 0.0034430736631155014

critic loss 6.5838158209931095

score 423.84
score 426.16

actor loss 0.01138498158454895

critic loss 1.4809529859993606

score 427.18
score 428.72

actor loss -

score 499.56
score 499.56

actor loss -0.0005611806273460388

critic loss 5.2342708634868265

score 499.56
score 499.56

actor loss -3.244421482086181e-05

critic loss 15.030268199373406

score 499.3
score 499.3

actor loss 0.0012215250007808207

critic loss 0.8451382994028739

score 499.22
score 499.14

actor loss 0.00983274759054184

critic loss 1.3332107348920776

score 499.14
score 496.8

actor loss 0.002956715738773346

critic loss 14.309583172818273

score 495.38
score 495.38
score 493.98

actor loss 0.0005378988139331341

critic loss 1.1184307399880142

score 493.88
score 491.04

actor loss 0.002059820385277271

critic loss 0.8414302655730397

score 490.64
score 489.02

actor loss 0.003080154395103454

critic loss 0.7188256610291079

score 489.02
score 488.94

actor loss 2.3677194118499755e-05

critic loss 4.576183077331632

score 488.94
score 488.94

actor loss 1.396633982658386e-05

critic loss 19.703560493683444

score 487.22
score 487.22

actor loss -8.026421070098877e-06

c

score 498.16
score 499.54

actor loss 0.0006315458774566651

critic loss 23.87037184320092

score 499.54
score 499.54

actor loss -0.0002963952302932739

critic loss 33.59643964797259

score 499.54
score 499.54

actor loss 0.00013860380649566653

critic loss 27.899694465954603

score 499.54
score 499.54

actor loss 2.3209473490715028e-05

critic loss 32.16845051883608

score 499.54
score 499.54

actor loss -1.1011433601379396e-05

critic loss 41.18974803789556

score 499.54
score 499.54

actor loss 0.0013223736047744752

critic loss 39.04002297267765

score 499.54
score 499.54

actor loss 0.0022984317660331727

critic loss 43.75867110472321

score 499.54
score 499.54

actor loss -0.00023025437146425242

critic loss 11.787616594068707

score 500.0
score 500.0

actor loss 0.0004585192441940307

critic loss 41.38846582369804

score 500.0
score 500.0

actor loss 0.002617807847261429

critic loss 40.294465853753685

score 500.0
score 500.0

actor loss 0.0010405645370483397

critic loss 35.1

critic loss 25.24719614800364

score 500.0
score 500.0

actor loss 0.0004919267654418946

critic loss 27.34691784814633

score 500.0
score 500.0

actor loss 0.000584494212269783

critic loss 38.079951370525364

score 500.0
score 500.0

actor loss 2.9985070228576658e-06

critic loss 15.694339917068183

score 500.0
score 500.0

actor loss 0.003716758976166602

critic loss 20.769631786400083

score 500.0
score 500.0

actor loss 0.003480416560173035

critic loss 25.171138485121723

score 500.0
score 500.0

actor loss 0.002957936227321625

critic loss 22.249736801800132

score 500.0
score 500.0

actor loss 0.0020538438513875005

critic loss 22.709512302350998

score 500.0
score 500.0

actor loss 0.0003106999337673187

critic loss 27.66031996767223

score 500.0
score 500.0

actor loss 0.0005262937545776366

critic loss 14.131455353188514

score 500.0
score 500.0

actor loss 0.00019952923059463504

critic loss 26.502516425779465

score 500.0
score 500.0

actor loss 7.249746322631837e-05

crit

score 500.0
score 500.0

actor loss 0.001832467743754387

critic loss 25.798233128891884

score 500.0
score 500.0

actor loss 0.00012161843776702882

critic loss 22.504379031953217

score 500.0
score 500.0

actor loss 0.00020469479560852053

critic loss 5.113038014559448

score 500.0
score 500.0

actor loss 0.0033209022760391236

critic loss 5.281892167620361

score 500.0
score 500.0

actor loss 0.005298981681466103

critic loss 5.214785012732445

score 500.0
score 500.0

actor loss 0.000920484232902527

critic loss 2.9845954995393753

score 500.0
score 500.0

actor loss -0.0004255500882863998

critic loss 4.221447555532307

score 500.0
score 500.0

actor loss 0.008581237986683844

critic loss 10.69986176841557

score 500.0
score 500.0

actor loss 0.00012247379124164583

critic loss 24.16633629170209

score 500.0
score 500.0

actor loss 6.833261251449585e-05

critic loss 26.56105506823659

score 500.0
score 500.0

actor loss -2.4141523987054827e-05

critic loss 12.063821493619681

scor

In [None]:
#%reload_ext tensorboard
#%tensorboard --logdir logs/ppo
