In [2]:
import os
import gym
from stable_baselines3 import PPO, TD3, DDPG, A2C , DQN, SAC
from stable_baselines3.common.vec_env import DummyVecEnv
from stable_baselines3.common.evaluation import evaluate_policy
import numpy as np
import time
algorithm_name = "PPO"
environment_name = 'MountainCar-v0'
#environment_names = ['CartPole-v1', 'Acrobot-v1',
#'MountainCar-v0', 'MountainCarContinuous-v0', 'LunarLander-v2', 
#'BipedalWalker-v3', 'CarRacing-v0', Pendulum-v1]
#"BipedalWalker-v3", hardcore=True to make bipedal hardcore environment
env = gym.make(environment_name)



def new_reward_function(state, action, next_state):
    # Extract the current position of the car
    current_position = state[0]

    next_position = next_state[0]

    if next_position >= 0.5:
        reward = 100
    else:
        reward = (next_position - current_position) * 10

    reward -= 1

    return reward



env.reward_func = new_reward_function


In [3]:
episodes = 5
scores = []

for episode in range(1, episodes+1):
    state = env.reset()
    done = False
    score = 0
    
    while not done:
        #env.render()
        action = env.action_space.sample()
        n_state, reward, done, info = env.step(action)
        score += reward
    
    scores.append(score)
    print('Episode:{} Score:{}'.format(episode, score))

env.close()

mean_score = np.mean(scores)
std_score = np.std(scores)
print('Mean Average Score: {:.2f}'.format(mean_score))
print('Standard Deviation: {:.2f}'.format(std_score))

Episode:1 Score:-200.0
Episode:2 Score:-200.0
Episode:3 Score:-200.0
Episode:4 Score:-200.0
Episode:5 Score:-200.0
Mean Average Score: -200.00
Standard Deviation: 0.00


In [4]:
log_path = os.path.join('Training', 'Logs')

if algorithm_name == 'PPO':
    model = PPO('MlpPolicy', env, verbose=1, tensorboard_log=log_path)
elif algorithm_name == 'TD3':
    model = TD3('MlpPolicy', env, verbose=1, tensorboard_log=log_path)
elif algorithm_name == 'DDPG':
    model = DDPG('MlpPolicy', env, verbose=1, tensorboard_log=log_path)
elif algorithm_name == 'A2C':
    model = A2C('MlpPolicy', env, verbose=1, tensorboard_log=log_path)
elif algorithm_name == 'DQN':
    model = DQN('MlpPolicy', env, verbose=1, tensorboard_log=log_path)
elif algorithm_name == 'SAC':
    model = SAC('MlpPolicy', env, verbose=1, tensorboard_log=log_path)
else:
    raise ValueError(f"Invalid algorithm name: {algorithm_name}")

env = gym.make(environment_name)
env = DummyVecEnv([lambda: env])

Using cpu device
Wrapping the env with a `Monitor` wrapper
Wrapping the env in a DummyVecEnv.


In [5]:
start_time = time.time()
number_of_episodes = 10000000


model.learn(total_timesteps=number_of_episodes)

end_time = time.time()
elapsed_time_ms = (end_time - start_time) * 1000
elapsed_time_sec = elapsed_time_ms / 1000

print("Training time: {:.3f} sec".format(elapsed_time_sec))

Logging to Training/Logs/PPO_95
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 200      |
|    ep_rew_mean     | -200     |
| time/              |          |
|    fps             | 2344     |
|    iterations      | 1        |
|    time_elapsed    | 0        |
|    total_timesteps | 2048     |
---------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 200         |
|    ep_rew_mean          | -200        |
| time/                   |             |
|    fps                  | 1733        |
|    iterations           | 2           |
|    time_elapsed         | 2           |
|    total_timesteps      | 4096        |
| train/                  |             |
|    approx_kl            | 0.009201912 |
|    clip_fraction        | 0.0041      |
|    clip_range           | 0.2         |
|    entropy_loss         | -1.1        |
|    explained_variance   | -6.15e-05   

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 200           |
|    ep_rew_mean          | -200          |
| time/                   |               |
|    fps                  | 1354          |
|    iterations           | 11            |
|    time_elapsed         | 16            |
|    total_timesteps      | 22528         |
| train/                  |               |
|    approx_kl            | 0.00079702365 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.08         |
|    explained_variance   | 0.00194       |
|    learning_rate        | 0.0003        |
|    loss                 | 0.508         |
|    n_updates            | 100           |
|    policy_gradient_loss | -4.33e-05     |
|    value_loss           | 9.16          |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 200          |
|    ep_rew_mean          | -200         |
| time/                   |              |
|    fps                  | 1301         |
|    iterations           | 21           |
|    time_elapsed         | 33           |
|    total_timesteps      | 43008        |
| train/                  |              |
|    approx_kl            | 0.0028038821 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.07        |
|    explained_variance   | 0.00302      |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0452       |
|    n_updates            | 200          |
|    policy_gradient_loss | -9.2e-05     |
|    value_loss           | 0.0976       |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 200         |
|    ep_rew_mean          | -200        |
| time/                   |             |
|    fps                  | 1300        |
|    iterations           | 31          |
|    time_elapsed         | 48          |
|    total_timesteps      | 63488       |
| train/                  |             |
|    approx_kl            | 0.008561455 |
|    clip_fraction        | 0.0437      |
|    clip_range           | 0.2         |
|    entropy_loss         | -1.07       |
|    explained_variance   | -0.00231    |
|    learning_rate        | 0.0003      |
|    loss                 | -0.0122     |
|    n_updates            | 300         |
|    policy_gradient_loss | -0.00298    |
|    value_loss           | 0.00204     |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 200   

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 200         |
|    ep_rew_mean          | -200        |
| time/                   |             |
|    fps                  | 1304        |
|    iterations           | 41          |
|    time_elapsed         | 64          |
|    total_timesteps      | 83968       |
| train/                  |             |
|    approx_kl            | 0.008688294 |
|    clip_fraction        | 0.0306      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.972      |
|    explained_variance   | -0.0509     |
|    learning_rate        | 0.0003      |
|    loss                 | -0.00691    |
|    n_updates            | 400         |
|    policy_gradient_loss | -0.00194    |
|    value_loss           | 7.08e-05    |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 200 

----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 200        |
|    ep_rew_mean          | -200       |
| time/                   |            |
|    fps                  | 1288       |
|    iterations           | 51         |
|    time_elapsed         | 81         |
|    total_timesteps      | 104448     |
| train/                  |            |
|    approx_kl            | 0.00689366 |
|    clip_fraction        | 0.0234     |
|    clip_range           | 0.2        |
|    entropy_loss         | -1.03      |
|    explained_variance   | -0.131     |
|    learning_rate        | 0.0003     |
|    loss                 | -0.0126    |
|    n_updates            | 500        |
|    policy_gradient_loss | -0.00214   |
|    value_loss           | 2.69e-06   |
----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 200          |
|    ep_re

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 200         |
|    ep_rew_mean          | -200        |
| time/                   |             |
|    fps                  | 1300        |
|    iterations           | 61          |
|    time_elapsed         | 96          |
|    total_timesteps      | 124928      |
| train/                  |             |
|    approx_kl            | 0.010612588 |
|    clip_fraction        | 0.174       |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.906      |
|    explained_variance   | 0.362       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0177      |
|    n_updates            | 600         |
|    policy_gradient_loss | -0.00716    |
|    value_loss           | 1.83e-06    |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 200   

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 200          |
|    ep_rew_mean          | -200         |
| time/                   |              |
|    fps                  | 1320         |
|    iterations           | 71           |
|    time_elapsed         | 110          |
|    total_timesteps      | 145408       |
| train/                  |              |
|    approx_kl            | 0.0012598654 |
|    clip_fraction        | 0.0135       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.293       |
|    explained_variance   | -0.381       |
|    learning_rate        | 0.0003       |
|    loss                 | -0.00312     |
|    n_updates            | 700          |
|    policy_gradient_loss | -0.000305    |
|    value_loss           | 9.54e-07     |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 200         |
|    ep_rew_mean          | -200        |
| time/                   |             |
|    fps                  | 1317        |
|    iterations           | 81          |
|    time_elapsed         | 125         |
|    total_timesteps      | 165888      |
| train/                  |             |
|    approx_kl            | 0.004034522 |
|    clip_fraction        | 0.0332      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.277      |
|    explained_variance   | -0.279      |
|    learning_rate        | 0.0003      |
|    loss                 | -0.00706    |
|    n_updates            | 800         |
|    policy_gradient_loss | -0.00544    |
|    value_loss           | 1.05e-06    |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 200 

----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 200        |
|    ep_rew_mean          | -200       |
| time/                   |            |
|    fps                  | 1305       |
|    iterations           | 91         |
|    time_elapsed         | 142        |
|    total_timesteps      | 186368     |
| train/                  |            |
|    approx_kl            | 0.00258982 |
|    clip_fraction        | 0.0373     |
|    clip_range           | 0.2        |
|    entropy_loss         | -0.285     |
|    explained_variance   | -1.81      |
|    learning_rate        | 0.0003     |
|    loss                 | -0.0178    |
|    n_updates            | 900        |
|    policy_gradient_loss | -0.00416   |
|    value_loss           | 5.09e-07   |
----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 200          |
|    ep_re

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 200         |
|    ep_rew_mean          | -200        |
| time/                   |             |
|    fps                  | 1293        |
|    iterations           | 101         |
|    time_elapsed         | 159         |
|    total_timesteps      | 206848      |
| train/                  |             |
|    approx_kl            | 0.002584319 |
|    clip_fraction        | 0.0285      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.291      |
|    explained_variance   | -1.83       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.035       |
|    n_updates            | 1000        |
|    policy_gradient_loss | -0.00178    |
|    value_loss           | 5.02e-07    |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 200 

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 200          |
|    ep_rew_mean          | -200         |
| time/                   |              |
|    fps                  | 1304         |
|    iterations           | 111          |
|    time_elapsed         | 174          |
|    total_timesteps      | 227328       |
| train/                  |              |
|    approx_kl            | 0.0019812118 |
|    clip_fraction        | 0.0235       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.173       |
|    explained_variance   | -0.93        |
|    learning_rate        | 0.0003       |
|    loss                 | -0.00276     |
|    n_updates            | 1100         |
|    policy_gradient_loss | -0.00149     |
|    value_loss           | 4.52e-07     |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 200          |
|    ep_rew_mean          | -200         |
| time/                   |              |
|    fps                  | 1309         |
|    iterations           | 121          |
|    time_elapsed         | 189          |
|    total_timesteps      | 247808       |
| train/                  |              |
|    approx_kl            | 0.0011652806 |
|    clip_fraction        | 0.0102       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.291       |
|    explained_variance   | -1.26        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.00064      |
|    n_updates            | 1200         |
|    policy_gradient_loss | 0.000162     |
|    value_loss           | 4.57e-07     |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 200         |
|    ep_rew_mean          | -200        |
| time/                   |             |
|    fps                  | 1308        |
|    iterations           | 131         |
|    time_elapsed         | 204         |
|    total_timesteps      | 268288      |
| train/                  |             |
|    approx_kl            | 0.004796696 |
|    clip_fraction        | 0.031       |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.36       |
|    explained_variance   | -0.388      |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0215      |
|    n_updates            | 1300        |
|    policy_gradient_loss | -0.00146    |
|    value_loss           | 4.52e-06    |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 200 

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 200          |
|    ep_rew_mean          | -200         |
| time/                   |              |
|    fps                  | 1305         |
|    iterations           | 141          |
|    time_elapsed         | 221          |
|    total_timesteps      | 288768       |
| train/                  |              |
|    approx_kl            | 0.0017211775 |
|    clip_fraction        | 0.0328       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.253       |
|    explained_variance   | 0.697        |
|    learning_rate        | 0.0003       |
|    loss                 | -0.0124      |
|    n_updates            | 1400         |
|    policy_gradient_loss | -0.00396     |
|    value_loss           | 8.78e-06     |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 200         |
|    ep_rew_mean          | -200        |
| time/                   |             |
|    fps                  | 1309        |
|    iterations           | 151         |
|    time_elapsed         | 236         |
|    total_timesteps      | 309248      |
| train/                  |             |
|    approx_kl            | 0.003503357 |
|    clip_fraction        | 0.0348      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.216      |
|    explained_variance   | -0.361      |
|    learning_rate        | 0.0003      |
|    loss                 | -0.00749    |
|    n_updates            | 1500        |
|    policy_gradient_loss | -0.00279    |
|    value_loss           | 0.0123      |
-----------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 20

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 200          |
|    ep_rew_mean          | -200         |
| time/                   |              |
|    fps                  | 1305         |
|    iterations           | 161          |
|    time_elapsed         | 252          |
|    total_timesteps      | 329728       |
| train/                  |              |
|    approx_kl            | 0.0004909203 |
|    clip_fraction        | 0.0042       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.217       |
|    explained_variance   | 0.125        |
|    learning_rate        | 0.0003       |
|    loss                 | -0.00474     |
|    n_updates            | 1600         |
|    policy_gradient_loss | -0.000841    |
|    value_loss           | 4.66e-05     |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 200          |
|    ep_rew_mean          | -200         |
| time/                   |              |
|    fps                  | 1310         |
|    iterations           | 171          |
|    time_elapsed         | 267          |
|    total_timesteps      | 350208       |
| train/                  |              |
|    approx_kl            | 0.0019890103 |
|    clip_fraction        | 0.0128       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.154       |
|    explained_variance   | 0.0689       |
|    learning_rate        | 0.0003       |
|    loss                 | -0.0118      |
|    n_updates            | 1700         |
|    policy_gradient_loss | -0.000804    |
|    value_loss           | 1.19e-05     |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 200          |
|    ep_rew_mean          | -200         |
| time/                   |              |
|    fps                  | 1314         |
|    iterations           | 181          |
|    time_elapsed         | 281          |
|    total_timesteps      | 370688       |
| train/                  |              |
|    approx_kl            | 0.0019322736 |
|    clip_fraction        | 0.00967      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.29        |
|    explained_variance   | 0.0511       |
|    learning_rate        | 0.0003       |
|    loss                 | 0.315        |
|    n_updates            | 1800         |
|    policy_gradient_loss | 0.000227     |
|    value_loss           | 0.411        |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 200          |
|    ep_rew_mean          | -200         |
| time/                   |              |
|    fps                  | 1315         |
|    iterations           | 191          |
|    time_elapsed         | 297          |
|    total_timesteps      | 391168       |
| train/                  |              |
|    approx_kl            | 0.0010329211 |
|    clip_fraction        | 0.0113       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.192       |
|    explained_variance   | -0.232       |
|    learning_rate        | 0.0003       |
|    loss                 | -0.0229      |
|    n_updates            | 1900         |
|    policy_gradient_loss | -0.00164     |
|    value_loss           | 0.000285     |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 200         |
|    ep_rew_mean          | -200        |
| time/                   |             |
|    fps                  | 1315        |
|    iterations           | 201         |
|    time_elapsed         | 312         |
|    total_timesteps      | 411648      |
| train/                  |             |
|    approx_kl            | 0.001636044 |
|    clip_fraction        | 0.0156      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.253      |
|    explained_variance   | -0.43       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.00305     |
|    n_updates            | 2000        |
|    policy_gradient_loss | -0.000908   |
|    value_loss           | 9.84e-06    |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 200 

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 200          |
|    ep_rew_mean          | -200         |
| time/                   |              |
|    fps                  | 1314         |
|    iterations           | 211          |
|    time_elapsed         | 328          |
|    total_timesteps      | 432128       |
| train/                  |              |
|    approx_kl            | 0.0013216918 |
|    clip_fraction        | 0.0116       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.251       |
|    explained_variance   | 0.0876       |
|    learning_rate        | 0.0003       |
|    loss                 | 0.00124      |
|    n_updates            | 2100         |
|    policy_gradient_loss | -0.000917    |
|    value_loss           | 2.46e-06     |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 200          |
|    ep_rew_mean          | -200         |
| time/                   |              |
|    fps                  | 1316         |
|    iterations           | 221          |
|    time_elapsed         | 343          |
|    total_timesteps      | 452608       |
| train/                  |              |
|    approx_kl            | 0.0041546845 |
|    clip_fraction        | 0.024        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.235       |
|    explained_variance   | 0.181        |
|    learning_rate        | 0.0003       |
|    loss                 | -0.0194      |
|    n_updates            | 2200         |
|    policy_gradient_loss | -0.00346     |
|    value_loss           | 1.76e-06     |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 200          |
|    ep_rew_mean          | -200         |
| time/                   |              |
|    fps                  | 1318         |
|    iterations           | 231          |
|    time_elapsed         | 358          |
|    total_timesteps      | 473088       |
| train/                  |              |
|    approx_kl            | 0.0007779846 |
|    clip_fraction        | 0.0108       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.184       |
|    explained_variance   | 0.325        |
|    learning_rate        | 0.0003       |
|    loss                 | -0.00427     |
|    n_updates            | 2300         |
|    policy_gradient_loss | -0.000552    |
|    value_loss           | 1.25e-05     |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 200         |
|    ep_rew_mean          | -200        |
| time/                   |             |
|    fps                  | 1319        |
|    iterations           | 241         |
|    time_elapsed         | 374         |
|    total_timesteps      | 493568      |
| train/                  |             |
|    approx_kl            | 0.001486085 |
|    clip_fraction        | 0.0108      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.297      |
|    explained_variance   | -1.32       |
|    learning_rate        | 0.0003      |
|    loss                 | -0.00336    |
|    n_updates            | 2400        |
|    policy_gradient_loss | -0.00107    |
|    value_loss           | 6.23e-07    |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 200 

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 200          |
|    ep_rew_mean          | -200         |
| time/                   |              |
|    fps                  | 1316         |
|    iterations           | 251          |
|    time_elapsed         | 390          |
|    total_timesteps      | 514048       |
| train/                  |              |
|    approx_kl            | 0.0047019473 |
|    clip_fraction        | 0.0383       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.293       |
|    explained_variance   | 0.718        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.032        |
|    n_updates            | 2500         |
|    policy_gradient_loss | -0.00154     |
|    value_loss           | 0.123        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 200          |
|    ep_rew_mean          | -200         |
| time/                   |              |
|    fps                  | 1317         |
|    iterations           | 261          |
|    time_elapsed         | 405          |
|    total_timesteps      | 534528       |
| train/                  |              |
|    approx_kl            | 8.399383e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.397       |
|    explained_variance   | 0.538        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.167        |
|    n_updates            | 2600         |
|    policy_gradient_loss | 2.63e-05     |
|    value_loss           | 11.3         |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 199          |
|    ep_rew_mean          | -199         |
| time/                   |              |
|    fps                  | 1321         |
|    iterations           | 271          |
|    time_elapsed         | 420          |
|    total_timesteps      | 555008       |
| train/                  |              |
|    approx_kl            | 0.0017119071 |
|    clip_fraction        | 0.0165       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.379       |
|    explained_variance   | 0.83         |
|    learning_rate        | 0.0003       |
|    loss                 | 2.25         |
|    n_updates            | 2700         |
|    policy_gradient_loss | -0.000396    |
|    value_loss           | 12.7         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 196          |
|    ep_rew_mean          | -196         |
| time/                   |              |
|    fps                  | 1320         |
|    iterations           | 281          |
|    time_elapsed         | 435          |
|    total_timesteps      | 575488       |
| train/                  |              |
|    approx_kl            | 0.0017474527 |
|    clip_fraction        | 0.00625      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.452       |
|    explained_variance   | 0.879        |
|    learning_rate        | 0.0003       |
|    loss                 | 18.7         |
|    n_updates            | 2800         |
|    policy_gradient_loss | -0.00152     |
|    value_loss           | 34.8         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 193          |
|    ep_rew_mean          | -193         |
| time/                   |              |
|    fps                  | 1323         |
|    iterations           | 291          |
|    time_elapsed         | 450          |
|    total_timesteps      | 595968       |
| train/                  |              |
|    approx_kl            | 0.0062871296 |
|    clip_fraction        | 0.0395       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.326       |
|    explained_variance   | 0.953        |
|    learning_rate        | 0.0003       |
|    loss                 | 7.3          |
|    n_updates            | 2900         |
|    policy_gradient_loss | -0.00631     |
|    value_loss           | 19           |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 171         |
|    ep_rew_mean          | -171        |
| time/                   |             |
|    fps                  | 1325        |
|    iterations           | 301         |
|    time_elapsed         | 464         |
|    total_timesteps      | 616448      |
| train/                  |             |
|    approx_kl            | 0.005606047 |
|    clip_fraction        | 0.0499      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.278      |
|    explained_variance   | 0.984       |
|    learning_rate        | 0.0003      |
|    loss                 | 4.32        |
|    n_updates            | 3000        |
|    policy_gradient_loss | -0.00354    |
|    value_loss           | 8.62        |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 167 

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 127           |
|    ep_rew_mean          | -127          |
| time/                   |               |
|    fps                  | 1327          |
|    iterations           | 311           |
|    time_elapsed         | 479           |
|    total_timesteps      | 636928        |
| train/                  |               |
|    approx_kl            | 0.00084639154 |
|    clip_fraction        | 0.0171        |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.181        |
|    explained_variance   | 0.989         |
|    learning_rate        | 0.0003        |
|    loss                 | 2.48          |
|    n_updates            | 3100          |
|    policy_gradient_loss | -0.00096      |
|    value_loss           | 4.43          |
-------------------------------------------
------------------------------------------
| rollout/                |      

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 117         |
|    ep_rew_mean          | -117        |
| time/                   |             |
|    fps                  | 1326        |
|    iterations           | 321         |
|    time_elapsed         | 495         |
|    total_timesteps      | 657408      |
| train/                  |             |
|    approx_kl            | 0.002676291 |
|    clip_fraction        | 0.0223      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.131      |
|    explained_variance   | 0.988       |
|    learning_rate        | 0.0003      |
|    loss                 | 2.48        |
|    n_updates            | 3200        |
|    policy_gradient_loss | -0.00177    |
|    value_loss           | 3.83        |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 117 

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 118           |
|    ep_rew_mean          | -118          |
| time/                   |               |
|    fps                  | 1325          |
|    iterations           | 331           |
|    time_elapsed         | 511           |
|    total_timesteps      | 677888        |
| train/                  |               |
|    approx_kl            | 0.00043310493 |
|    clip_fraction        | 0.0158        |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0926       |
|    explained_variance   | 0.989         |
|    learning_rate        | 0.0003        |
|    loss                 | 1.59          |
|    n_updates            | 3300          |
|    policy_gradient_loss | 0.00199       |
|    value_loss           | 3.02          |
-------------------------------------------
-----------------------------------------
| rollout/                |       

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 113          |
|    ep_rew_mean          | -113         |
| time/                   |              |
|    fps                  | 1326         |
|    iterations           | 341          |
|    time_elapsed         | 526          |
|    total_timesteps      | 698368       |
| train/                  |              |
|    approx_kl            | 0.0033912892 |
|    clip_fraction        | 0.0167       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.086       |
|    explained_variance   | 0.981        |
|    learning_rate        | 0.0003       |
|    loss                 | 1.07         |
|    n_updates            | 3400         |
|    policy_gradient_loss | -0.00024     |
|    value_loss           | 2.86         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 113         |
|    ep_rew_mean          | -113        |
| time/                   |             |
|    fps                  | 1326        |
|    iterations           | 351         |
|    time_elapsed         | 541         |
|    total_timesteps      | 718848      |
| train/                  |             |
|    approx_kl            | 0.003284119 |
|    clip_fraction        | 0.0257      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0725     |
|    explained_variance   | 0.991       |
|    learning_rate        | 0.0003      |
|    loss                 | 1.89        |
|    n_updates            | 3500        |
|    policy_gradient_loss | 0.000459    |
|    value_loss           | 3.03        |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 111 

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 112          |
|    ep_rew_mean          | -112         |
| time/                   |              |
|    fps                  | 1329         |
|    iterations           | 361          |
|    time_elapsed         | 556          |
|    total_timesteps      | 739328       |
| train/                  |              |
|    approx_kl            | 0.0024858662 |
|    clip_fraction        | 0.0206       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0732      |
|    explained_variance   | 0.985        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.744        |
|    n_updates            | 3600         |
|    policy_gradient_loss | 0.00232      |
|    value_loss           | 3.6          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 109         |
|    ep_rew_mean          | -109        |
| time/                   |             |
|    fps                  | 1331        |
|    iterations           | 371         |
|    time_elapsed         | 570         |
|    total_timesteps      | 759808      |
| train/                  |             |
|    approx_kl            | 0.000715032 |
|    clip_fraction        | 0.0154      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.065      |
|    explained_variance   | 0.989       |
|    learning_rate        | 0.0003      |
|    loss                 | 2.65        |
|    n_updates            | 3700        |
|    policy_gradient_loss | 0.000294    |
|    value_loss           | 3.47        |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 107   

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 114          |
|    ep_rew_mean          | -114         |
| time/                   |              |
|    fps                  | 1330         |
|    iterations           | 381          |
|    time_elapsed         | 586          |
|    total_timesteps      | 780288       |
| train/                  |              |
|    approx_kl            | 0.0019040093 |
|    clip_fraction        | 0.0197       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0643      |
|    explained_variance   | 0.965        |
|    learning_rate        | 0.0003       |
|    loss                 | 2.09         |
|    n_updates            | 3800         |
|    policy_gradient_loss | 0.0018       |
|    value_loss           | 4.35         |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 107         |
|    ep_rew_mean          | -107        |
| time/                   |             |
|    fps                  | 1327        |
|    iterations           | 391         |
|    time_elapsed         | 603         |
|    total_timesteps      | 800768      |
| train/                  |             |
|    approx_kl            | 0.000683604 |
|    clip_fraction        | 0.0187      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0535     |
|    explained_variance   | 0.998       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.154       |
|    n_updates            | 3900        |
|    policy_gradient_loss | -0.000284   |
|    value_loss           | 0.507       |
-----------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 10

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 115          |
|    ep_rew_mean          | -115         |
| time/                   |              |
|    fps                  | 1326         |
|    iterations           | 401          |
|    time_elapsed         | 619          |
|    total_timesteps      | 821248       |
| train/                  |              |
|    approx_kl            | 0.0070939055 |
|    clip_fraction        | 0.0305       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0587      |
|    explained_variance   | 0.981        |
|    learning_rate        | 0.0003       |
|    loss                 | 3.75         |
|    n_updates            | 4000         |
|    policy_gradient_loss | -0.00189     |
|    value_loss           | 5.84         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 106          |
|    ep_rew_mean          | -106         |
| time/                   |              |
|    fps                  | 1325         |
|    iterations           | 411          |
|    time_elapsed         | 634          |
|    total_timesteps      | 841728       |
| train/                  |              |
|    approx_kl            | 0.0013679587 |
|    clip_fraction        | 0.0163       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0514      |
|    explained_variance   | 0.997        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.197        |
|    n_updates            | 4100         |
|    policy_gradient_loss | 0.000655     |
|    value_loss           | 0.502        |
------------------------------------------
----------------------------------------
| rollout/                |            |
|    ep_len_mea

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 110           |
|    ep_rew_mean          | -110          |
| time/                   |               |
|    fps                  | 1328          |
|    iterations           | 421           |
|    time_elapsed         | 649           |
|    total_timesteps      | 862208        |
| train/                  |               |
|    approx_kl            | 0.00080697716 |
|    clip_fraction        | 0.00898       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0653       |
|    explained_variance   | 0.982         |
|    learning_rate        | 0.0003        |
|    loss                 | 3.02          |
|    n_updates            | 4200          |
|    policy_gradient_loss | -0.00104      |
|    value_loss           | 6.14          |
-------------------------------------------
------------------------------------------
| rollout/                |      

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 104         |
|    ep_rew_mean          | -104        |
| time/                   |             |
|    fps                  | 1330        |
|    iterations           | 431         |
|    time_elapsed         | 663         |
|    total_timesteps      | 882688      |
| train/                  |             |
|    approx_kl            | 0.013884405 |
|    clip_fraction        | 0.024       |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0528     |
|    explained_variance   | 0.994       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.777       |
|    n_updates            | 4300        |
|    policy_gradient_loss | -0.00486    |
|    value_loss           | 1.82        |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 103 

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 106          |
|    ep_rew_mean          | -106         |
| time/                   |              |
|    fps                  | 1332         |
|    iterations           | 441          |
|    time_elapsed         | 677          |
|    total_timesteps      | 903168       |
| train/                  |              |
|    approx_kl            | 0.0016099401 |
|    clip_fraction        | 0.00923      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0536      |
|    explained_variance   | 0.985        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.82         |
|    n_updates            | 4400         |
|    policy_gradient_loss | 0.000117     |
|    value_loss           | 3.36         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 105          |
|    ep_rew_mean          | -105         |
| time/                   |              |
|    fps                  | 1335         |
|    iterations           | 451          |
|    time_elapsed         | 691          |
|    total_timesteps      | 923648       |
| train/                  |              |
|    approx_kl            | 0.0025592349 |
|    clip_fraction        | 0.0195       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.061       |
|    explained_variance   | 0.994        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.812        |
|    n_updates            | 4500         |
|    policy_gradient_loss | -0.000681    |
|    value_loss           | 2.08         |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 114          |
|    ep_rew_mean          | -114         |
| time/                   |              |
|    fps                  | 1337         |
|    iterations           | 461          |
|    time_elapsed         | 706          |
|    total_timesteps      | 944128       |
| train/                  |              |
|    approx_kl            | 0.0015214409 |
|    clip_fraction        | 0.0189       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0566      |
|    explained_variance   | 0.994        |
|    learning_rate        | 0.0003       |
|    loss                 | 1.51         |
|    n_updates            | 4600         |
|    policy_gradient_loss | 0.000826     |
|    value_loss           | 2.08         |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 107          |
|    ep_rew_mean          | -107         |
| time/                   |              |
|    fps                  | 1339         |
|    iterations           | 471          |
|    time_elapsed         | 720          |
|    total_timesteps      | 964608       |
| train/                  |              |
|    approx_kl            | 0.0013172337 |
|    clip_fraction        | 0.0196       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0523      |
|    explained_variance   | 0.983        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.65         |
|    n_updates            | 4700         |
|    policy_gradient_loss | 0.000441     |
|    value_loss           | 2.94         |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 106          |
|    ep_rew_mean          | -106         |
| time/                   |              |
|    fps                  | 1341         |
|    iterations           | 481          |
|    time_elapsed         | 734          |
|    total_timesteps      | 985088       |
| train/                  |              |
|    approx_kl            | 0.0021263857 |
|    clip_fraction        | 0.019        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0712      |
|    explained_variance   | 0.985        |
|    learning_rate        | 0.0003       |
|    loss                 | 1.35         |
|    n_updates            | 4800         |
|    policy_gradient_loss | -0.000641    |
|    value_loss           | 2.42         |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 109         |
|    ep_rew_mean          | -109        |
| time/                   |             |
|    fps                  | 1342        |
|    iterations           | 491         |
|    time_elapsed         | 748         |
|    total_timesteps      | 1005568     |
| train/                  |             |
|    approx_kl            | 0.001792809 |
|    clip_fraction        | 0.0183      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0695     |
|    explained_variance   | 0.979       |
|    learning_rate        | 0.0003      |
|    loss                 | 4.61        |
|    n_updates            | 4900        |
|    policy_gradient_loss | -0.00129    |
|    value_loss           | 6.79        |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 106 

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 105          |
|    ep_rew_mean          | -105         |
| time/                   |              |
|    fps                  | 1344         |
|    iterations           | 501          |
|    time_elapsed         | 763          |
|    total_timesteps      | 1026048      |
| train/                  |              |
|    approx_kl            | 0.0020544133 |
|    clip_fraction        | 0.0261       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0711      |
|    explained_variance   | 0.995        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0636       |
|    n_updates            | 5000         |
|    policy_gradient_loss | -0.000259    |
|    value_loss           | 0.506        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 108          |
|    ep_rew_mean          | -108         |
| time/                   |              |
|    fps                  | 1346         |
|    iterations           | 511          |
|    time_elapsed         | 777          |
|    total_timesteps      | 1046528      |
| train/                  |              |
|    approx_kl            | 0.0006357593 |
|    clip_fraction        | 0.00576      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0692      |
|    explained_variance   | 0.956        |
|    learning_rate        | 0.0003       |
|    loss                 | 2.77         |
|    n_updates            | 5100         |
|    policy_gradient_loss | -0.000245    |
|    value_loss           | 7.43         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 118          |
|    ep_rew_mean          | -118         |
| time/                   |              |
|    fps                  | 1348         |
|    iterations           | 521          |
|    time_elapsed         | 791          |
|    total_timesteps      | 1067008      |
| train/                  |              |
|    approx_kl            | 0.0011929304 |
|    clip_fraction        | 0.0123       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0805      |
|    explained_variance   | 0.955        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.372        |
|    n_updates            | 5200         |
|    policy_gradient_loss | -0.00182     |
|    value_loss           | 6.96         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 102          |
|    ep_rew_mean          | -102         |
| time/                   |              |
|    fps                  | 1349         |
|    iterations           | 531          |
|    time_elapsed         | 805          |
|    total_timesteps      | 1087488      |
| train/                  |              |
|    approx_kl            | 0.0017215498 |
|    clip_fraction        | 0.0156       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0647      |
|    explained_variance   | 0.997        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0987       |
|    n_updates            | 5300         |
|    policy_gradient_loss | 0.000141     |
|    value_loss           | 0.383        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 107         |
|    ep_rew_mean          | -107        |
| time/                   |             |
|    fps                  | 1350        |
|    iterations           | 541         |
|    time_elapsed         | 820         |
|    total_timesteps      | 1107968     |
| train/                  |             |
|    approx_kl            | 0.007376973 |
|    clip_fraction        | 0.0214      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.071      |
|    explained_variance   | 0.988       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.93        |
|    n_updates            | 5400        |
|    policy_gradient_loss | -0.00211    |
|    value_loss           | 2.61        |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 107   

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 109          |
|    ep_rew_mean          | -109         |
| time/                   |              |
|    fps                  | 1351         |
|    iterations           | 551          |
|    time_elapsed         | 834          |
|    total_timesteps      | 1128448      |
| train/                  |              |
|    approx_kl            | 0.0015892212 |
|    clip_fraction        | 0.0224       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.073       |
|    explained_variance   | 0.989        |
|    learning_rate        | 0.0003       |
|    loss                 | 1.14         |
|    n_updates            | 5500         |
|    policy_gradient_loss | 5.96e-05     |
|    value_loss           | 3.23         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 106          |
|    ep_rew_mean          | -106         |
| time/                   |              |
|    fps                  | 1352         |
|    iterations           | 561          |
|    time_elapsed         | 849          |
|    total_timesteps      | 1148928      |
| train/                  |              |
|    approx_kl            | 0.0004974324 |
|    clip_fraction        | 0.00967      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0476      |
|    explained_variance   | 0.974        |
|    learning_rate        | 0.0003       |
|    loss                 | 2.09         |
|    n_updates            | 5600         |
|    policy_gradient_loss | -0.00224     |
|    value_loss           | 6.42         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 103          |
|    ep_rew_mean          | -103         |
| time/                   |              |
|    fps                  | 1349         |
|    iterations           | 571          |
|    time_elapsed         | 866          |
|    total_timesteps      | 1169408      |
| train/                  |              |
|    approx_kl            | 0.0047831344 |
|    clip_fraction        | 0.0216       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0559      |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0637       |
|    n_updates            | 5700         |
|    policy_gradient_loss | 0.00151      |
|    value_loss           | 0.217        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 104          |
|    ep_rew_mean          | -104         |
| time/                   |              |
|    fps                  | 1350         |
|    iterations           | 581          |
|    time_elapsed         | 881          |
|    total_timesteps      | 1189888      |
| train/                  |              |
|    approx_kl            | 0.0016029631 |
|    clip_fraction        | 0.013        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0582      |
|    explained_variance   | 0.984        |
|    learning_rate        | 0.0003       |
|    loss                 | 1.65         |
|    n_updates            | 5800         |
|    policy_gradient_loss | -0.00101     |
|    value_loss           | 3.29         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 109          |
|    ep_rew_mean          | -109         |
| time/                   |              |
|    fps                  | 1351         |
|    iterations           | 591          |
|    time_elapsed         | 895          |
|    total_timesteps      | 1210368      |
| train/                  |              |
|    approx_kl            | 0.0008829377 |
|    clip_fraction        | 0.0159       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.088       |
|    explained_variance   | 0.925        |
|    learning_rate        | 0.0003       |
|    loss                 | 2.56         |
|    n_updates            | 5900         |
|    policy_gradient_loss | 0.000529     |
|    value_loss           | 5.78         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 101         |
|    ep_rew_mean          | -101        |
| time/                   |             |
|    fps                  | 1353        |
|    iterations           | 601         |
|    time_elapsed         | 909         |
|    total_timesteps      | 1230848     |
| train/                  |             |
|    approx_kl            | 0.000891188 |
|    clip_fraction        | 0.00947     |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0691     |
|    explained_variance   | 0.995       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.348       |
|    n_updates            | 6000        |
|    policy_gradient_loss | 7.58e-07    |
|    value_loss           | 0.979       |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 102 

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 100         |
|    ep_rew_mean          | -100        |
| time/                   |             |
|    fps                  | 1354        |
|    iterations           | 611         |
|    time_elapsed         | 923         |
|    total_timesteps      | 1251328     |
| train/                  |             |
|    approx_kl            | 0.004586188 |
|    clip_fraction        | 0.019       |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0531     |
|    explained_variance   | 0.999       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0653      |
|    n_updates            | 6100        |
|    policy_gradient_loss | -0.000162   |
|    value_loss           | 0.13        |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 100 

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 99.7        |
|    ep_rew_mean          | -99.7       |
| time/                   |             |
|    fps                  | 1355        |
|    iterations           | 621         |
|    time_elapsed         | 938         |
|    total_timesteps      | 1271808     |
| train/                  |             |
|    approx_kl            | 0.014746558 |
|    clip_fraction        | 0.0115      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0631     |
|    explained_variance   | 0.988       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.423       |
|    n_updates            | 6200        |
|    policy_gradient_loss | -0.0047     |
|    value_loss           | 1.97        |
-----------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 10

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 101          |
|    ep_rew_mean          | -101         |
| time/                   |              |
|    fps                  | 1355         |
|    iterations           | 631          |
|    time_elapsed         | 953          |
|    total_timesteps      | 1292288      |
| train/                  |              |
|    approx_kl            | 0.0014664232 |
|    clip_fraction        | 0.0161       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0581      |
|    explained_variance   | 0.995        |
|    learning_rate        | 0.0003       |
|    loss                 | 1.18         |
|    n_updates            | 6300         |
|    policy_gradient_loss | -0.000344    |
|    value_loss           | 1.44         |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 102          |
|    ep_rew_mean          | -102         |
| time/                   |              |
|    fps                  | 1355         |
|    iterations           | 641          |
|    time_elapsed         | 968          |
|    total_timesteps      | 1312768      |
| train/                  |              |
|    approx_kl            | 0.0014882376 |
|    clip_fraction        | 0.014        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0485      |
|    explained_variance   | 0.985        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.209        |
|    n_updates            | 6400         |
|    policy_gradient_loss | -0.000787    |
|    value_loss           | 0.908        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 101          |
|    ep_rew_mean          | -101         |
| time/                   |              |
|    fps                  | 1352         |
|    iterations           | 651          |
|    time_elapsed         | 985          |
|    total_timesteps      | 1333248      |
| train/                  |              |
|    approx_kl            | 0.0019625884 |
|    clip_fraction        | 0.0178       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0648      |
|    explained_variance   | 0.989        |
|    learning_rate        | 0.0003       |
|    loss                 | 1.24         |
|    n_updates            | 6500         |
|    policy_gradient_loss | -0.00148     |
|    value_loss           | 1.45         |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 101          |
|    ep_rew_mean          | -101         |
| time/                   |              |
|    fps                  | 1351         |
|    iterations           | 661          |
|    time_elapsed         | 1001         |
|    total_timesteps      | 1353728      |
| train/                  |              |
|    approx_kl            | 0.0021647795 |
|    clip_fraction        | 0.0169       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0469      |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.116        |
|    n_updates            | 6600         |
|    policy_gradient_loss | 0.00142      |
|    value_loss           | 0.177        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 99.3        |
|    ep_rew_mean          | -99.3       |
| time/                   |             |
|    fps                  | 1351        |
|    iterations           | 671         |
|    time_elapsed         | 1016        |
|    total_timesteps      | 1374208     |
| train/                  |             |
|    approx_kl            | 0.002930522 |
|    clip_fraction        | 0.017       |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0434     |
|    explained_variance   | 0.999       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0606      |
|    n_updates            | 6700        |
|    policy_gradient_loss | -8.29e-05   |
|    value_loss           | 0.159       |
-----------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 98

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 100           |
|    ep_rew_mean          | -100          |
| time/                   |               |
|    fps                  | 1351          |
|    iterations           | 681           |
|    time_elapsed         | 1032          |
|    total_timesteps      | 1394688       |
| train/                  |               |
|    approx_kl            | 0.00096181687 |
|    clip_fraction        | 0.017         |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.051        |
|    explained_variance   | 0.992         |
|    learning_rate        | 0.0003        |
|    loss                 | 0.693         |
|    n_updates            | 6800          |
|    policy_gradient_loss | -0.000194     |
|    value_loss           | 1.41          |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 102          |
|    ep_rew_mean          | -102         |
| time/                   |              |
|    fps                  | 1350         |
|    iterations           | 691          |
|    time_elapsed         | 1048         |
|    total_timesteps      | 1415168      |
| train/                  |              |
|    approx_kl            | 0.0014381888 |
|    clip_fraction        | 0.0111       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0491      |
|    explained_variance   | 0.99         |
|    learning_rate        | 0.0003       |
|    loss                 | 0.564        |
|    n_updates            | 6900         |
|    policy_gradient_loss | 0.000669     |
|    value_loss           | 1.25         |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 100         |
|    ep_rew_mean          | -100        |
| time/                   |             |
|    fps                  | 1350        |
|    iterations           | 701         |
|    time_elapsed         | 1063        |
|    total_timesteps      | 1435648     |
| train/                  |             |
|    approx_kl            | 0.006482565 |
|    clip_fraction        | 0.0256      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0558     |
|    explained_variance   | 0.999       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0544      |
|    n_updates            | 7000        |
|    policy_gradient_loss | 0.00119     |
|    value_loss           | 0.103       |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 100 

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.2         |
|    ep_rew_mean          | -98.2        |
| time/                   |              |
|    fps                  | 1350         |
|    iterations           | 711          |
|    time_elapsed         | 1077         |
|    total_timesteps      | 1456128      |
| train/                  |              |
|    approx_kl            | 0.0008861753 |
|    clip_fraction        | 0.0144       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0479      |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0293       |
|    n_updates            | 7100         |
|    policy_gradient_loss | 0.000425     |
|    value_loss           | 0.144        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 102         |
|    ep_rew_mean          | -102        |
| time/                   |             |
|    fps                  | 1350        |
|    iterations           | 721         |
|    time_elapsed         | 1093        |
|    total_timesteps      | 1476608     |
| train/                  |             |
|    approx_kl            | 0.000821337 |
|    clip_fraction        | 0.0114      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0472     |
|    explained_variance   | 0.998       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.345       |
|    n_updates            | 7200        |
|    policy_gradient_loss | 0.000305    |
|    value_loss           | 0.745       |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 103 

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 100           |
|    ep_rew_mean          | -100          |
| time/                   |               |
|    fps                  | 1349          |
|    iterations           | 731           |
|    time_elapsed         | 1109          |
|    total_timesteps      | 1497088       |
| train/                  |               |
|    approx_kl            | 0.00024679827 |
|    clip_fraction        | 0.00308       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0494       |
|    explained_variance   | 0.987         |
|    learning_rate        | 0.0003        |
|    loss                 | 0.411         |
|    n_updates            | 7300          |
|    policy_gradient_loss | -0.000636     |
|    value_loss           | 2.25          |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 101          |
|    ep_rew_mean          | -101         |
| time/                   |              |
|    fps                  | 1349         |
|    iterations           | 741          |
|    time_elapsed         | 1124         |
|    total_timesteps      | 1517568      |
| train/                  |              |
|    approx_kl            | 0.0025104275 |
|    clip_fraction        | 0.0203       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0539      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0405       |
|    n_updates            | 7400         |
|    policy_gradient_loss | 0.000927     |
|    value_loss           | 0.0537       |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 101          |
|    ep_rew_mean          | -101         |
| time/                   |              |
|    fps                  | 1349         |
|    iterations           | 751          |
|    time_elapsed         | 1140         |
|    total_timesteps      | 1538048      |
| train/                  |              |
|    approx_kl            | 0.0075855916 |
|    clip_fraction        | 0.0277       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0582      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0339       |
|    n_updates            | 7500         |
|    policy_gradient_loss | 0.000581     |
|    value_loss           | 0.038        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 102           |
|    ep_rew_mean          | -102          |
| time/                   |               |
|    fps                  | 1348          |
|    iterations           | 761           |
|    time_elapsed         | 1155          |
|    total_timesteps      | 1558528       |
| train/                  |               |
|    approx_kl            | 0.00027071763 |
|    clip_fraction        | 0.00718       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0483       |
|    explained_variance   | 0.988         |
|    learning_rate        | 0.0003        |
|    loss                 | 0.63          |
|    n_updates            | 7600          |
|    policy_gradient_loss | -0.000303     |
|    value_loss           | 4.11          |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 101          |
|    ep_rew_mean          | -101         |
| time/                   |              |
|    fps                  | 1347         |
|    iterations           | 771          |
|    time_elapsed         | 1171         |
|    total_timesteps      | 1579008      |
| train/                  |              |
|    approx_kl            | 0.0010144463 |
|    clip_fraction        | 0.0191       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.05        |
|    explained_variance   | 0.998        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0464       |
|    n_updates            | 7700         |
|    policy_gradient_loss | 5.54e-05     |
|    value_loss           | 0.195        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99           |
|    ep_rew_mean          | -99          |
| time/                   |              |
|    fps                  | 1346         |
|    iterations           | 781          |
|    time_elapsed         | 1187         |
|    total_timesteps      | 1599488      |
| train/                  |              |
|    approx_kl            | 0.0048777373 |
|    clip_fraction        | 0.0251       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0649      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0128       |
|    n_updates            | 7800         |
|    policy_gradient_loss | 0.00681      |
|    value_loss           | 0.0535       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 100          |
|    ep_rew_mean          | -100         |
| time/                   |              |
|    fps                  | 1346         |
|    iterations           | 791          |
|    time_elapsed         | 1203         |
|    total_timesteps      | 1619968      |
| train/                  |              |
|    approx_kl            | 0.0024451087 |
|    clip_fraction        | 0.0225       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0506      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0154       |
|    n_updates            | 7900         |
|    policy_gradient_loss | -0.00395     |
|    value_loss           | 0.0289       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 100        |
|    ep_rew_mean          | -100       |
| time/                   |            |
|    fps                  | 1345       |
|    iterations           | 801        |
|    time_elapsed         | 1218       |
|    total_timesteps      | 1640448    |
| train/                  |            |
|    approx_kl            | 0.02984215 |
|    clip_fraction        | 0.0297     |
|    clip_range           | 0.2        |
|    entropy_loss         | -0.0447    |
|    explained_variance   | 1          |
|    learning_rate        | 0.0003     |
|    loss                 | 0.00583    |
|    n_updates            | 8000       |
|    policy_gradient_loss | -0.00155   |
|    value_loss           | 0.0243     |
----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 101          |
|    ep_re

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 101          |
|    ep_rew_mean          | -101         |
| time/                   |              |
|    fps                  | 1345         |
|    iterations           | 811          |
|    time_elapsed         | 1234         |
|    total_timesteps      | 1660928      |
| train/                  |              |
|    approx_kl            | 0.0018380292 |
|    clip_fraction        | 0.019        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.038       |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0277       |
|    n_updates            | 8100         |
|    policy_gradient_loss | 0.00212      |
|    value_loss           | 0.0534       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.4         |
|    ep_rew_mean          | -99.4        |
| time/                   |              |
|    fps                  | 1345         |
|    iterations           | 821          |
|    time_elapsed         | 1249         |
|    total_timesteps      | 1681408      |
| train/                  |              |
|    approx_kl            | 0.0024312735 |
|    clip_fraction        | 0.0157       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0443      |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0691       |
|    n_updates            | 8200         |
|    policy_gradient_loss | -7.73e-05    |
|    value_loss           | 0.329        |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.1         |
|    ep_rew_mean          | -98.1        |
| time/                   |              |
|    fps                  | 1344         |
|    iterations           | 831          |
|    time_elapsed         | 1265         |
|    total_timesteps      | 1701888      |
| train/                  |              |
|    approx_kl            | 0.0010245721 |
|    clip_fraction        | 0.00986      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0395      |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.49         |
|    n_updates            | 8300         |
|    policy_gradient_loss | -0.00106     |
|    value_loss           | 0.313        |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99           |
|    ep_rew_mean          | -99          |
| time/                   |              |
|    fps                  | 1345         |
|    iterations           | 841          |
|    time_elapsed         | 1280         |
|    total_timesteps      | 1722368      |
| train/                  |              |
|    approx_kl            | 0.0014000579 |
|    clip_fraction        | 0.0128       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.044       |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0704       |
|    n_updates            | 8400         |
|    policy_gradient_loss | 0.00121      |
|    value_loss           | 0.0905       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 99.5        |
|    ep_rew_mean          | -99.5       |
| time/                   |             |
|    fps                  | 1346        |
|    iterations           | 851         |
|    time_elapsed         | 1294        |
|    total_timesteps      | 1742848     |
| train/                  |             |
|    approx_kl            | 0.015801094 |
|    clip_fraction        | 0.0414      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0644     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0127      |
|    n_updates            | 8500        |
|    policy_gradient_loss | 0.00501     |
|    value_loss           | 0.0324      |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.7

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.4         |
|    ep_rew_mean          | -97.4        |
| time/                   |              |
|    fps                  | 1347         |
|    iterations           | 861          |
|    time_elapsed         | 1308         |
|    total_timesteps      | 1763328      |
| train/                  |              |
|    approx_kl            | 0.0040132697 |
|    clip_fraction        | 0.0187       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0366      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0307       |
|    n_updates            | 8600         |
|    policy_gradient_loss | 0.00348      |
|    value_loss           | 0.0249       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.7         |
|    ep_rew_mean          | -98.7        |
| time/                   |              |
|    fps                  | 1348         |
|    iterations           | 871          |
|    time_elapsed         | 1323         |
|    total_timesteps      | 1783808      |
| train/                  |              |
|    approx_kl            | 0.0029298556 |
|    clip_fraction        | 0.0144       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0433      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.00674      |
|    n_updates            | 8700         |
|    policy_gradient_loss | 0.00033      |
|    value_loss           | 0.0174       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 99          |
|    ep_rew_mean          | -99         |
| time/                   |             |
|    fps                  | 1347        |
|    iterations           | 881         |
|    time_elapsed         | 1339        |
|    total_timesteps      | 1804288     |
| train/                  |             |
|    approx_kl            | 0.005519688 |
|    clip_fraction        | 0.0262      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0415     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.115       |
|    n_updates            | 8800        |
|    policy_gradient_loss | -0.00125    |
|    value_loss           | 0.105       |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 97.2  

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 100         |
|    ep_rew_mean          | -100        |
| time/                   |             |
|    fps                  | 1346        |
|    iterations           | 891         |
|    time_elapsed         | 1355        |
|    total_timesteps      | 1824768     |
| train/                  |             |
|    approx_kl            | 0.017091302 |
|    clip_fraction        | 0.0513      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0642     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.00825     |
|    n_updates            | 8900        |
|    policy_gradient_loss | -0.000246   |
|    value_loss           | 0.0235      |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 101 

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 101          |
|    ep_rew_mean          | -101         |
| time/                   |              |
|    fps                  | 1345         |
|    iterations           | 901          |
|    time_elapsed         | 1371         |
|    total_timesteps      | 1845248      |
| train/                  |              |
|    approx_kl            | 0.0008516512 |
|    clip_fraction        | 0.00557      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0425      |
|    explained_variance   | 0.985        |
|    learning_rate        | 0.0003       |
|    loss                 | 2.57         |
|    n_updates            | 9000         |
|    policy_gradient_loss | -0.000319    |
|    value_loss           | 4.32         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 99          |
|    ep_rew_mean          | -99         |
| time/                   |             |
|    fps                  | 1344        |
|    iterations           | 911         |
|    time_elapsed         | 1387        |
|    total_timesteps      | 1865728     |
| train/                  |             |
|    approx_kl            | 0.001304907 |
|    clip_fraction        | 0.014       |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0505     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0198      |
|    n_updates            | 9100        |
|    policy_gradient_loss | 0.000283    |
|    value_loss           | 0.0507      |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.4

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 100         |
|    ep_rew_mean          | -100        |
| time/                   |             |
|    fps                  | 1344        |
|    iterations           | 921         |
|    time_elapsed         | 1402        |
|    total_timesteps      | 1886208     |
| train/                  |             |
|    approx_kl            | 0.122004725 |
|    clip_fraction        | 0.0139      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0387     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0522      |
|    n_updates            | 9200        |
|    policy_gradient_loss | -0.0014     |
|    value_loss           | 0.0692      |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 103 

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 103           |
|    ep_rew_mean          | -103          |
| time/                   |               |
|    fps                  | 1344          |
|    iterations           | 931           |
|    time_elapsed         | 1418          |
|    total_timesteps      | 1906688       |
| train/                  |               |
|    approx_kl            | 0.00065160065 |
|    clip_fraction        | 0.0118        |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0328       |
|    explained_variance   | 0.964         |
|    learning_rate        | 0.0003        |
|    loss                 | 3.07          |
|    n_updates            | 9300          |
|    policy_gradient_loss | -0.000697     |
|    value_loss           | 6.3           |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98           |
|    ep_rew_mean          | -98          |
| time/                   |              |
|    fps                  | 1345         |
|    iterations           | 941          |
|    time_elapsed         | 1432         |
|    total_timesteps      | 1927168      |
| train/                  |              |
|    approx_kl            | 0.0015916413 |
|    clip_fraction        | 0.018        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0578      |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0439       |
|    n_updates            | 9400         |
|    policy_gradient_loss | 0.00147      |
|    value_loss           | 0.0756       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.3         |
|    ep_rew_mean          | -98.3        |
| time/                   |              |
|    fps                  | 1345         |
|    iterations           | 951          |
|    time_elapsed         | 1447         |
|    total_timesteps      | 1947648      |
| train/                  |              |
|    approx_kl            | 0.0009713182 |
|    clip_fraction        | 0.011        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0481      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.00695      |
|    n_updates            | 9500         |
|    policy_gradient_loss | -5.41e-05    |
|    value_loss           | 0.0244       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 101          |
|    ep_rew_mean          | -101         |
| time/                   |              |
|    fps                  | 1346         |
|    iterations           | 961          |
|    time_elapsed         | 1462         |
|    total_timesteps      | 1968128      |
| train/                  |              |
|    approx_kl            | 0.0024942795 |
|    clip_fraction        | 0.0157       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0449      |
|    explained_variance   | 0.995        |
|    learning_rate        | 0.0003       |
|    loss                 | 1.08         |
|    n_updates            | 9600         |
|    policy_gradient_loss | -0.000772    |
|    value_loss           | 0.813        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 98.2        |
|    ep_rew_mean          | -98.2       |
| time/                   |             |
|    fps                  | 1345        |
|    iterations           | 971         |
|    time_elapsed         | 1477        |
|    total_timesteps      | 1988608     |
| train/                  |             |
|    approx_kl            | 0.003293166 |
|    clip_fraction        | 0.0163      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.04       |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.00875     |
|    n_updates            | 9700        |
|    policy_gradient_loss | -0.000375   |
|    value_loss           | 0.0235      |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.2

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.2         |
|    ep_rew_mean          | -99.2        |
| time/                   |              |
|    fps                  | 1344         |
|    iterations           | 981          |
|    time_elapsed         | 1494         |
|    total_timesteps      | 2009088      |
| train/                  |              |
|    approx_kl            | 0.0022954016 |
|    clip_fraction        | 0.0104       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0357      |
|    explained_variance   | 0.991        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0917       |
|    n_updates            | 9800         |
|    policy_gradient_loss | 0.000347     |
|    value_loss           | 0.632        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 105         |
|    ep_rew_mean          | -105        |
| time/                   |             |
|    fps                  | 1343        |
|    iterations           | 991         |
|    time_elapsed         | 1510        |
|    total_timesteps      | 2029568     |
| train/                  |             |
|    approx_kl            | 0.002832003 |
|    clip_fraction        | 0.0163      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0562     |
|    explained_variance   | 0.935       |
|    learning_rate        | 0.0003      |
|    loss                 | 14.3        |
|    n_updates            | 9900        |
|    policy_gradient_loss | -0.0051     |
|    value_loss           | 19.3        |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 102 

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 102          |
|    ep_rew_mean          | -102         |
| time/                   |              |
|    fps                  | 1343         |
|    iterations           | 1001         |
|    time_elapsed         | 1525         |
|    total_timesteps      | 2050048      |
| train/                  |              |
|    approx_kl            | 0.0043346174 |
|    clip_fraction        | 0.0143       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0399      |
|    explained_variance   | 0.99         |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0529       |
|    n_updates            | 10000        |
|    policy_gradient_loss | 0.000144     |
|    value_loss           | 0.628        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.8         |
|    ep_rew_mean          | -98.8        |
| time/                   |              |
|    fps                  | 1344         |
|    iterations           | 1011         |
|    time_elapsed         | 1540         |
|    total_timesteps      | 2070528      |
| train/                  |              |
|    approx_kl            | 0.0028180294 |
|    clip_fraction        | 0.0209       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0559      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0142       |
|    n_updates            | 10100        |
|    policy_gradient_loss | 0.00162      |
|    value_loss           | 0.0505       |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 96.9         |
|    ep_rew_mean          | -96.9        |
| time/                   |              |
|    fps                  | 1344         |
|    iterations           | 1021         |
|    time_elapsed         | 1555         |
|    total_timesteps      | 2091008      |
| train/                  |              |
|    approx_kl            | 0.0043300684 |
|    clip_fraction        | 0.0185       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0376      |
|    explained_variance   | 0.998        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0194       |
|    n_updates            | 10200        |
|    policy_gradient_loss | -0.000705    |
|    value_loss           | 0.102        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

--------------------------------------
| rollout/                |          |
|    ep_len_mean          | 96.9     |
|    ep_rew_mean          | -96.9    |
| time/                   |          |
|    fps                  | 1344     |
|    iterations           | 1031     |
|    time_elapsed         | 1569     |
|    total_timesteps      | 2111488  |
| train/                  |          |
|    approx_kl            | 0.033656 |
|    clip_fraction        | 0.0346   |
|    clip_range           | 0.2      |
|    entropy_loss         | -0.053   |
|    explained_variance   | 1        |
|    learning_rate        | 0.0003   |
|    loss                 | 0.0236   |
|    n_updates            | 10300    |
|    policy_gradient_loss | 0.0261   |
|    value_loss           | 0.0379   |
--------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 97.5        |
|    ep_rew_mean          | -97.5       |
| time/      

----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 105        |
|    ep_rew_mean          | -105       |
| time/                   |            |
|    fps                  | 1344       |
|    iterations           | 1041       |
|    time_elapsed         | 1585       |
|    total_timesteps      | 2131968    |
| train/                  |            |
|    approx_kl            | 0.07522903 |
|    clip_fraction        | 0.0591     |
|    clip_range           | 0.2        |
|    entropy_loss         | -0.058     |
|    explained_variance   | 1          |
|    learning_rate        | 0.0003     |
|    loss                 | -0.00923   |
|    n_updates            | 10400      |
|    policy_gradient_loss | -0.00234   |
|    value_loss           | 0.0231     |
----------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 110           |
|    ep

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 125          |
|    ep_rew_mean          | -125         |
| time/                   |              |
|    fps                  | 1343         |
|    iterations           | 1051         |
|    time_elapsed         | 1601         |
|    total_timesteps      | 2152448      |
| train/                  |              |
|    approx_kl            | 0.0036713153 |
|    clip_fraction        | 0.0182       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0616      |
|    explained_variance   | 0.934        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.622        |
|    n_updates            | 10500        |
|    policy_gradient_loss | -0.000584    |
|    value_loss           | 4.47         |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 159          |
|    ep_rew_mean          | -159         |
| time/                   |              |
|    fps                  | 1343         |
|    iterations           | 1061         |
|    time_elapsed         | 1616         |
|    total_timesteps      | 2172928      |
| train/                  |              |
|    approx_kl            | 0.0018136525 |
|    clip_fraction        | 0.017        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.064       |
|    explained_variance   | 0.998        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.167        |
|    n_updates            | 10600        |
|    policy_gradient_loss | 9.58e-05     |
|    value_loss           | 0.532        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 153          |
|    ep_rew_mean          | -153         |
| time/                   |              |
|    fps                  | 1343         |
|    iterations           | 1071         |
|    time_elapsed         | 1632         |
|    total_timesteps      | 2193408      |
| train/                  |              |
|    approx_kl            | 0.0031079631 |
|    clip_fraction        | 0.0251       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.074       |
|    explained_variance   | 0.997        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.449        |
|    n_updates            | 10700        |
|    policy_gradient_loss | -0.00201     |
|    value_loss           | 1.19         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 150          |
|    ep_rew_mean          | -150         |
| time/                   |              |
|    fps                  | 1343         |
|    iterations           | 1081         |
|    time_elapsed         | 1647         |
|    total_timesteps      | 2213888      |
| train/                  |              |
|    approx_kl            | 0.0016223271 |
|    clip_fraction        | 0.0155       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0666      |
|    explained_variance   | 0.998        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.244        |
|    n_updates            | 10800        |
|    policy_gradient_loss | 0.000739     |
|    value_loss           | 0.802        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 147          |
|    ep_rew_mean          | -147         |
| time/                   |              |
|    fps                  | 1344         |
|    iterations           | 1091         |
|    time_elapsed         | 1662         |
|    total_timesteps      | 2234368      |
| train/                  |              |
|    approx_kl            | 0.0015260392 |
|    clip_fraction        | 0.018        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0719      |
|    explained_variance   | 0.996        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.37         |
|    n_updates            | 10900        |
|    policy_gradient_loss | -0.000841    |
|    value_loss           | 0.674        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 141          |
|    ep_rew_mean          | -141         |
| time/                   |              |
|    fps                  | 1344         |
|    iterations           | 1101         |
|    time_elapsed         | 1676         |
|    total_timesteps      | 2254848      |
| train/                  |              |
|    approx_kl            | 0.0018311924 |
|    clip_fraction        | 0.014        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0596      |
|    explained_variance   | 0.979        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.432        |
|    n_updates            | 11000        |
|    policy_gradient_loss | -0.00186     |
|    value_loss           | 2.12         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 132          |
|    ep_rew_mean          | -132         |
| time/                   |              |
|    fps                  | 1344         |
|    iterations           | 1111         |
|    time_elapsed         | 1692         |
|    total_timesteps      | 2275328      |
| train/                  |              |
|    approx_kl            | 0.0071019977 |
|    clip_fraction        | 0.0245       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0632      |
|    explained_variance   | 0.997        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.404        |
|    n_updates            | 11100        |
|    policy_gradient_loss | -0.0017      |
|    value_loss           | 0.852        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 122          |
|    ep_rew_mean          | -122         |
| time/                   |              |
|    fps                  | 1344         |
|    iterations           | 1121         |
|    time_elapsed         | 1707         |
|    total_timesteps      | 2295808      |
| train/                  |              |
|    approx_kl            | 0.0073292674 |
|    clip_fraction        | 0.0228       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0678      |
|    explained_variance   | 0.995        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.697        |
|    n_updates            | 11200        |
|    policy_gradient_loss | 0.00197      |
|    value_loss           | 1.29         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 105         |
|    ep_rew_mean          | -105        |
| time/                   |             |
|    fps                  | 1345        |
|    iterations           | 1131        |
|    time_elapsed         | 1722        |
|    total_timesteps      | 2316288     |
| train/                  |             |
|    approx_kl            | 0.002548865 |
|    clip_fraction        | 0.0241      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0569     |
|    explained_variance   | 0.999       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.116       |
|    n_updates            | 11300       |
|    policy_gradient_loss | 0.000366    |
|    value_loss           | 0.232       |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 105 

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 121          |
|    ep_rew_mean          | -121         |
| time/                   |              |
|    fps                  | 1344         |
|    iterations           | 1141         |
|    time_elapsed         | 1737         |
|    total_timesteps      | 2336768      |
| train/                  |              |
|    approx_kl            | 0.0010214336 |
|    clip_fraction        | 0.0194       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0689      |
|    explained_variance   | 0.993        |
|    learning_rate        | 0.0003       |
|    loss                 | 1.02         |
|    n_updates            | 11400        |
|    policy_gradient_loss | -0.00114     |
|    value_loss           | 2.47         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 107          |
|    ep_rew_mean          | -107         |
| time/                   |              |
|    fps                  | 1344         |
|    iterations           | 1151         |
|    time_elapsed         | 1753         |
|    total_timesteps      | 2357248      |
| train/                  |              |
|    approx_kl            | 0.0018407436 |
|    clip_fraction        | 0.0252       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0701      |
|    explained_variance   | 0.961        |
|    learning_rate        | 0.0003       |
|    loss                 | 1.31         |
|    n_updates            | 11500        |
|    policy_gradient_loss | -0.004       |
|    value_loss           | 11.4         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 104         |
|    ep_rew_mean          | -104        |
| time/                   |             |
|    fps                  | 1343        |
|    iterations           | 1161        |
|    time_elapsed         | 1769        |
|    total_timesteps      | 2377728     |
| train/                  |             |
|    approx_kl            | 0.003034031 |
|    clip_fraction        | 0.0198      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0588     |
|    explained_variance   | 0.999       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0737      |
|    n_updates            | 11600       |
|    policy_gradient_loss | -0.000143   |
|    value_loss           | 0.123       |
-----------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 10

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 99          |
|    ep_rew_mean          | -99         |
| time/                   |             |
|    fps                  | 1344        |
|    iterations           | 1171        |
|    time_elapsed         | 1783        |
|    total_timesteps      | 2398208     |
| train/                  |             |
|    approx_kl            | 0.004778099 |
|    clip_fraction        | 0.0266      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0481     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.04        |
|    n_updates            | 11700       |
|    policy_gradient_loss | 0.00258     |
|    value_loss           | 0.106       |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.6

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 108          |
|    ep_rew_mean          | -108         |
| time/                   |              |
|    fps                  | 1345         |
|    iterations           | 1181         |
|    time_elapsed         | 1798         |
|    total_timesteps      | 2418688      |
| train/                  |              |
|    approx_kl            | 0.0012465157 |
|    clip_fraction        | 0.0109       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0461      |
|    explained_variance   | 0.962        |
|    learning_rate        | 0.0003       |
|    loss                 | 1.02         |
|    n_updates            | 11800        |
|    policy_gradient_loss | 0.00236      |
|    value_loss           | 3            |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 105        |
|    ep_rew_mean          | -105       |
| time/                   |            |
|    fps                  | 1346       |
|    iterations           | 1191       |
|    time_elapsed         | 1812       |
|    total_timesteps      | 2439168    |
| train/                  |            |
|    approx_kl            | 0.00099069 |
|    clip_fraction        | 0.00879    |
|    clip_range           | 0.2        |
|    entropy_loss         | -0.0548    |
|    explained_variance   | 0.982      |
|    learning_rate        | 0.0003     |
|    loss                 | 0.903      |
|    n_updates            | 11900      |
|    policy_gradient_loss | -0.00124   |
|    value_loss           | 3.37       |
----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 105          |
|    ep_re

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 101          |
|    ep_rew_mean          | -101         |
| time/                   |              |
|    fps                  | 1346         |
|    iterations           | 1201         |
|    time_elapsed         | 1826         |
|    total_timesteps      | 2459648      |
| train/                  |              |
|    approx_kl            | 0.0011656295 |
|    clip_fraction        | 0.00996      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0435      |
|    explained_variance   | 0.995        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.116        |
|    n_updates            | 12000        |
|    policy_gradient_loss | -0.00148     |
|    value_loss           | 0.576        |
------------------------------------------
----------------------------------------
| rollout/                |            |
|    ep_len_mea

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.6         |
|    ep_rew_mean          | -99.6        |
| time/                   |              |
|    fps                  | 1347         |
|    iterations           | 1211         |
|    time_elapsed         | 1840         |
|    total_timesteps      | 2480128      |
| train/                  |              |
|    approx_kl            | 0.0029413954 |
|    clip_fraction        | 0.0149       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0411      |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0629       |
|    n_updates            | 12100        |
|    policy_gradient_loss | 0.00105      |
|    value_loss           | 0.181        |
------------------------------------------
----------------------------------------
| rollout/                |            |
|    ep_len_mea

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 100          |
|    ep_rew_mean          | -100         |
| time/                   |              |
|    fps                  | 1348         |
|    iterations           | 1221         |
|    time_elapsed         | 1854         |
|    total_timesteps      | 2500608      |
| train/                  |              |
|    approx_kl            | 0.0030344245 |
|    clip_fraction        | 0.0138       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0461      |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0197       |
|    n_updates            | 12200        |
|    policy_gradient_loss | -0.000792    |
|    value_loss           | 0.201        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.9         |
|    ep_rew_mean          | -99.9        |
| time/                   |              |
|    fps                  | 1348         |
|    iterations           | 1231         |
|    time_elapsed         | 1869         |
|    total_timesteps      | 2521088      |
| train/                  |              |
|    approx_kl            | 0.0010763435 |
|    clip_fraction        | 0.011        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0313      |
|    explained_variance   | 0.987        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.237        |
|    n_updates            | 12300        |
|    policy_gradient_loss | -0.00144     |
|    value_loss           | 0.971        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.1         |
|    ep_rew_mean          | -99.1        |
| time/                   |              |
|    fps                  | 1349         |
|    iterations           | 1241         |
|    time_elapsed         | 1883         |
|    total_timesteps      | 2541568      |
| train/                  |              |
|    approx_kl            | 0.0025397947 |
|    clip_fraction        | 0.0218       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0505      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0138       |
|    n_updates            | 12400        |
|    policy_gradient_loss | 0.0108       |
|    value_loss           | 0.0575       |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.1         |
|    ep_rew_mean          | -99.1        |
| time/                   |              |
|    fps                  | 1349         |
|    iterations           | 1251         |
|    time_elapsed         | 1898         |
|    total_timesteps      | 2562048      |
| train/                  |              |
|    approx_kl            | 0.0013124151 |
|    clip_fraction        | 0.0108       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0415      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0232       |
|    n_updates            | 12500        |
|    policy_gradient_loss | -0.00189     |
|    value_loss           | 0.0454       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.3         |
|    ep_rew_mean          | -99.3        |
| time/                   |              |
|    fps                  | 1348         |
|    iterations           | 1261         |
|    time_elapsed         | 1915         |
|    total_timesteps      | 2582528      |
| train/                  |              |
|    approx_kl            | 0.0016448745 |
|    clip_fraction        | 0.0157       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0406      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0149       |
|    n_updates            | 12600        |
|    policy_gradient_loss | 0.000983     |
|    value_loss           | 0.0258       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.8         |
|    ep_rew_mean          | -97.8        |
| time/                   |              |
|    fps                  | 1349         |
|    iterations           | 1271         |
|    time_elapsed         | 1929         |
|    total_timesteps      | 2603008      |
| train/                  |              |
|    approx_kl            | 0.0011120344 |
|    clip_fraction        | 0.0129       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0274      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | -0.00562     |
|    n_updates            | 12700        |
|    policy_gradient_loss | 0.000683     |
|    value_loss           | 0.0236       |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.6         |
|    ep_rew_mean          | -98.6        |
| time/                   |              |
|    fps                  | 1349         |
|    iterations           | 1281         |
|    time_elapsed         | 1943         |
|    total_timesteps      | 2623488      |
| train/                  |              |
|    approx_kl            | 0.0010572432 |
|    clip_fraction        | 0.0107       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0252      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.00674      |
|    n_updates            | 12800        |
|    policy_gradient_loss | 0.00137      |
|    value_loss           | 0.0238       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.8         |
|    ep_rew_mean          | -97.8        |
| time/                   |              |
|    fps                  | 1350         |
|    iterations           | 1291         |
|    time_elapsed         | 1958         |
|    total_timesteps      | 2643968      |
| train/                  |              |
|    approx_kl            | 0.0016532815 |
|    clip_fraction        | 0.02         |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0386      |
|    explained_variance   | 0.998        |
|    learning_rate        | 0.0003       |
|    loss                 | 1.16         |
|    n_updates            | 12900        |
|    policy_gradient_loss | -0.0032      |
|    value_loss           | 0.513        |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98           |
|    ep_rew_mean          | -98          |
| time/                   |              |
|    fps                  | 1350         |
|    iterations           | 1301         |
|    time_elapsed         | 1972         |
|    total_timesteps      | 2664448      |
| train/                  |              |
|    approx_kl            | 0.0031065461 |
|    clip_fraction        | 0.023        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0286      |
|    explained_variance   | 0.998        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0397       |
|    n_updates            | 13000        |
|    policy_gradient_loss | 0.00118      |
|    value_loss           | 0.139        |
------------------------------------------
----------------------------------------
| rollout/                |            |
|    ep_len_mea

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.9         |
|    ep_rew_mean          | -99.9        |
| time/                   |              |
|    fps                  | 1351         |
|    iterations           | 1311         |
|    time_elapsed         | 1987         |
|    total_timesteps      | 2684928      |
| train/                  |              |
|    approx_kl            | 0.0017602679 |
|    clip_fraction        | 0.0141       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0455      |
|    explained_variance   | 0.996        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0642       |
|    n_updates            | 13100        |
|    policy_gradient_loss | 0.000115     |
|    value_loss           | 0.209        |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 99.1        |
|    ep_rew_mean          | -99.1       |
| time/                   |             |
|    fps                  | 1351        |
|    iterations           | 1321        |
|    time_elapsed         | 2001        |
|    total_timesteps      | 2705408     |
| train/                  |             |
|    approx_kl            | 0.024337072 |
|    clip_fraction        | 0.0279      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.035      |
|    explained_variance   | 0.992       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0877      |
|    n_updates            | 13200       |
|    policy_gradient_loss | 0.00315     |
|    value_loss           | 0.356       |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.8

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 101         |
|    ep_rew_mean          | -101        |
| time/                   |             |
|    fps                  | 1351        |
|    iterations           | 1331        |
|    time_elapsed         | 2017        |
|    total_timesteps      | 2725888     |
| train/                  |             |
|    approx_kl            | 0.002076606 |
|    clip_fraction        | 0.0191      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0374     |
|    explained_variance   | 0.986       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.188       |
|    n_updates            | 13300       |
|    policy_gradient_loss | -0.00148    |
|    value_loss           | 0.941       |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.3

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 102           |
|    ep_rew_mean          | -102          |
| time/                   |               |
|    fps                  | 1351          |
|    iterations           | 1341          |
|    time_elapsed         | 2032          |
|    total_timesteps      | 2746368       |
| train/                  |               |
|    approx_kl            | 0.00078534026 |
|    clip_fraction        | 0.0082        |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0547       |
|    explained_variance   | 0.979         |
|    learning_rate        | 0.0003        |
|    loss                 | 1.18          |
|    n_updates            | 13400         |
|    policy_gradient_loss | -0.000824     |
|    value_loss           | 5.71          |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 106          |
|    ep_rew_mean          | -106         |
| time/                   |              |
|    fps                  | 1351         |
|    iterations           | 1351         |
|    time_elapsed         | 2047         |
|    total_timesteps      | 2766848      |
| train/                  |              |
|    approx_kl            | 0.0011073875 |
|    clip_fraction        | 0.0122       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0538      |
|    explained_variance   | 0.988        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.163        |
|    n_updates            | 13500        |
|    policy_gradient_loss | 0.000447     |
|    value_loss           | 1.02         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 101          |
|    ep_rew_mean          | -101         |
| time/                   |              |
|    fps                  | 1351         |
|    iterations           | 1361         |
|    time_elapsed         | 2062         |
|    total_timesteps      | 2787328      |
| train/                  |              |
|    approx_kl            | 0.0014227782 |
|    clip_fraction        | 0.0202       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0412      |
|    explained_variance   | 0.994        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.104        |
|    n_updates            | 13600        |
|    policy_gradient_loss | 0.000577     |
|    value_loss           | 0.391        |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.8         |
|    ep_rew_mean          | -99.8        |
| time/                   |              |
|    fps                  | 1351         |
|    iterations           | 1371         |
|    time_elapsed         | 2077         |
|    total_timesteps      | 2807808      |
| train/                  |              |
|    approx_kl            | 0.0024891894 |
|    clip_fraction        | 0.0212       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0555      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0079       |
|    n_updates            | 13700        |
|    policy_gradient_loss | 0.00174      |
|    value_loss           | 0.0397       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 100          |
|    ep_rew_mean          | -100         |
| time/                   |              |
|    fps                  | 1352         |
|    iterations           | 1381         |
|    time_elapsed         | 2091         |
|    total_timesteps      | 2828288      |
| train/                  |              |
|    approx_kl            | 0.0042972798 |
|    clip_fraction        | 0.0253       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0595      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0155       |
|    n_updates            | 13800        |
|    policy_gradient_loss | -0.00137     |
|    value_loss           | 0.0353       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.5         |
|    ep_rew_mean          | -97.5        |
| time/                   |              |
|    fps                  | 1352         |
|    iterations           | 1391         |
|    time_elapsed         | 2106         |
|    total_timesteps      | 2848768      |
| train/                  |              |
|    approx_kl            | 0.0012229318 |
|    clip_fraction        | 0.0167       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0572      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0199       |
|    n_updates            | 13900        |
|    policy_gradient_loss | 0.000649     |
|    value_loss           | 0.041        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.3         |
|    ep_rew_mean          | -98.3        |
| time/                   |              |
|    fps                  | 1352         |
|    iterations           | 1401         |
|    time_elapsed         | 2120         |
|    total_timesteps      | 2869248      |
| train/                  |              |
|    approx_kl            | 0.0030584992 |
|    clip_fraction        | 0.0161       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0445      |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.013        |
|    n_updates            | 14000        |
|    policy_gradient_loss | 0.0016       |
|    value_loss           | 0.041        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.7         |
|    ep_rew_mean          | -98.7        |
| time/                   |              |
|    fps                  | 1353         |
|    iterations           | 1411         |
|    time_elapsed         | 2135         |
|    total_timesteps      | 2889728      |
| train/                  |              |
|    approx_kl            | 0.0013326628 |
|    clip_fraction        | 0.0133       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.049       |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0195       |
|    n_updates            | 14100        |
|    policy_gradient_loss | -0.000765    |
|    value_loss           | 0.0252       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.6         |
|    ep_rew_mean          | -99.6        |
| time/                   |              |
|    fps                  | 1352         |
|    iterations           | 1421         |
|    time_elapsed         | 2151         |
|    total_timesteps      | 2910208      |
| train/                  |              |
|    approx_kl            | 0.0016049193 |
|    clip_fraction        | 0.0187       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0459      |
|    explained_variance   | 0.985        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.761        |
|    n_updates            | 14200        |
|    policy_gradient_loss | -0.00277     |
|    value_loss           | 3.68         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 102          |
|    ep_rew_mean          | -102         |
| time/                   |              |
|    fps                  | 1351         |
|    iterations           | 1431         |
|    time_elapsed         | 2168         |
|    total_timesteps      | 2930688      |
| train/                  |              |
|    approx_kl            | 0.0010682878 |
|    clip_fraction        | 0.013        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0398      |
|    explained_variance   | 0.991        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.625        |
|    n_updates            | 14300        |
|    policy_gradient_loss | -0.00263     |
|    value_loss           | 1.61         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 113           |
|    ep_rew_mean          | -113          |
| time/                   |               |
|    fps                  | 1351          |
|    iterations           | 1441          |
|    time_elapsed         | 2183          |
|    total_timesteps      | 2951168       |
| train/                  |               |
|    approx_kl            | 0.00089867547 |
|    clip_fraction        | 0.0113        |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0633       |
|    explained_variance   | 0.936         |
|    learning_rate        | 0.0003        |
|    loss                 | 3.25          |
|    n_updates            | 14400         |
|    policy_gradient_loss | -0.00315      |
|    value_loss           | 12.6          |
-------------------------------------------
-----------------------------------------
| rollout/                |       

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 104         |
|    ep_rew_mean          | -104        |
| time/                   |             |
|    fps                  | 1351        |
|    iterations           | 1451        |
|    time_elapsed         | 2198        |
|    total_timesteps      | 2971648     |
| train/                  |             |
|    approx_kl            | 0.005688617 |
|    clip_fraction        | 0.0292      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0476     |
|    explained_variance   | 0.996       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.051       |
|    n_updates            | 14500       |
|    policy_gradient_loss | 0.00152     |
|    value_loss           | 0.252       |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 102 

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 108          |
|    ep_rew_mean          | -108         |
| time/                   |              |
|    fps                  | 1351         |
|    iterations           | 1461         |
|    time_elapsed         | 2213         |
|    total_timesteps      | 2992128      |
| train/                  |              |
|    approx_kl            | 0.0015136729 |
|    clip_fraction        | 0.0178       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0711      |
|    explained_variance   | 0.957        |
|    learning_rate        | 0.0003       |
|    loss                 | 4.98         |
|    n_updates            | 14600        |
|    policy_gradient_loss | -0.00126     |
|    value_loss           | 7.85         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 104         |
|    ep_rew_mean          | -104        |
| time/                   |             |
|    fps                  | 1352        |
|    iterations           | 1471        |
|    time_elapsed         | 2228        |
|    total_timesteps      | 3012608     |
| train/                  |             |
|    approx_kl            | 0.006188411 |
|    clip_fraction        | 0.0203      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0542     |
|    explained_variance   | 0.993       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.134       |
|    n_updates            | 14700       |
|    policy_gradient_loss | 0.00209     |
|    value_loss           | 0.283       |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 100   

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 105          |
|    ep_rew_mean          | -105         |
| time/                   |              |
|    fps                  | 1352         |
|    iterations           | 1481         |
|    time_elapsed         | 2243         |
|    total_timesteps      | 3033088      |
| train/                  |              |
|    approx_kl            | 0.0020475308 |
|    clip_fraction        | 0.00864      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0603      |
|    explained_variance   | 0.988        |
|    learning_rate        | 0.0003       |
|    loss                 | 1.27         |
|    n_updates            | 14800        |
|    policy_gradient_loss | 0.000243     |
|    value_loss           | 2.48         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 101          |
|    ep_rew_mean          | -101         |
| time/                   |              |
|    fps                  | 1352         |
|    iterations           | 1491         |
|    time_elapsed         | 2257         |
|    total_timesteps      | 3053568      |
| train/                  |              |
|    approx_kl            | 0.0018001862 |
|    clip_fraction        | 0.0126       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0498      |
|    explained_variance   | 0.993        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.817        |
|    n_updates            | 14900        |
|    policy_gradient_loss | 9.05e-05     |
|    value_loss           | 1.27         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99           |
|    ep_rew_mean          | -99          |
| time/                   |              |
|    fps                  | 1352         |
|    iterations           | 1501         |
|    time_elapsed         | 2272         |
|    total_timesteps      | 3074048      |
| train/                  |              |
|    approx_kl            | 0.0007327548 |
|    clip_fraction        | 0.0115       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.03        |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0207       |
|    n_updates            | 15000        |
|    policy_gradient_loss | 0.00236      |
|    value_loss           | 0.0368       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 108          |
|    ep_rew_mean          | -108         |
| time/                   |              |
|    fps                  | 1352         |
|    iterations           | 1511         |
|    time_elapsed         | 2288         |
|    total_timesteps      | 3094528      |
| train/                  |              |
|    approx_kl            | 0.0006389606 |
|    clip_fraction        | 0.0116       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0457      |
|    explained_variance   | 0.966        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.607        |
|    n_updates            | 15100        |
|    policy_gradient_loss | -0.000135    |
|    value_loss           | 6.45         |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 101         |
|    ep_rew_mean          | -101        |
| time/                   |             |
|    fps                  | 1352        |
|    iterations           | 1521        |
|    time_elapsed         | 2303        |
|    total_timesteps      | 3115008     |
| train/                  |             |
|    approx_kl            | 0.011533879 |
|    clip_fraction        | 0.0234      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0369     |
|    explained_variance   | 0.995       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.146       |
|    n_updates            | 15200       |
|    policy_gradient_loss | 0.00061     |
|    value_loss           | 0.251       |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 99.4  

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 101         |
|    ep_rew_mean          | -101        |
| time/                   |             |
|    fps                  | 1352        |
|    iterations           | 1531        |
|    time_elapsed         | 2318        |
|    total_timesteps      | 3135488     |
| train/                  |             |
|    approx_kl            | 0.009957068 |
|    clip_fraction        | 0.0349      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.067      |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | -0.00317    |
|    n_updates            | 15300       |
|    policy_gradient_loss | -0.00127    |
|    value_loss           | 0.0435      |
-----------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 10

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.6         |
|    ep_rew_mean          | -99.6        |
| time/                   |              |
|    fps                  | 1352         |
|    iterations           | 1541         |
|    time_elapsed         | 2332         |
|    total_timesteps      | 3155968      |
| train/                  |              |
|    approx_kl            | 0.0035486273 |
|    clip_fraction        | 0.0244       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0781      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.00976      |
|    n_updates            | 15400        |
|    policy_gradient_loss | -7.95e-05    |
|    value_loss           | 0.0748       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.4         |
|    ep_rew_mean          | -99.4        |
| time/                   |              |
|    fps                  | 1353         |
|    iterations           | 1551         |
|    time_elapsed         | 2347         |
|    total_timesteps      | 3176448      |
| train/                  |              |
|    approx_kl            | 0.0030027803 |
|    clip_fraction        | 0.0193       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.054       |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.01         |
|    n_updates            | 15500        |
|    policy_gradient_loss | -0.00138     |
|    value_loss           | 0.0341       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.7         |
|    ep_rew_mean          | -97.7        |
| time/                   |              |
|    fps                  | 1352         |
|    iterations           | 1561         |
|    time_elapsed         | 2362         |
|    total_timesteps      | 3196928      |
| train/                  |              |
|    approx_kl            | 0.0027195858 |
|    clip_fraction        | 0.0188       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0471      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.00838      |
|    n_updates            | 15600        |
|    policy_gradient_loss | 0.00106      |
|    value_loss           | 0.038        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.5         |
|    ep_rew_mean          | -98.5        |
| time/                   |              |
|    fps                  | 1352         |
|    iterations           | 1571         |
|    time_elapsed         | 2378         |
|    total_timesteps      | 3217408      |
| train/                  |              |
|    approx_kl            | 0.0018984069 |
|    clip_fraction        | 0.0214       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0546      |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0274       |
|    n_updates            | 15700        |
|    policy_gradient_loss | 0.000985     |
|    value_loss           | 0.067        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 99.6        |
|    ep_rew_mean          | -99.6       |
| time/                   |             |
|    fps                  | 1353        |
|    iterations           | 1581        |
|    time_elapsed         | 2392        |
|    total_timesteps      | 3237888     |
| train/                  |             |
|    approx_kl            | 0.000572535 |
|    clip_fraction        | 0.00669     |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0485     |
|    explained_variance   | 0.983       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.956       |
|    n_updates            | 15800       |
|    policy_gradient_loss | -0.00268    |
|    value_loss           | 3.67        |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 101 

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.5         |
|    ep_rew_mean          | -99.5        |
| time/                   |              |
|    fps                  | 1353         |
|    iterations           | 1591         |
|    time_elapsed         | 2406         |
|    total_timesteps      | 3258368      |
| train/                  |              |
|    approx_kl            | 0.0024036623 |
|    clip_fraction        | 0.0181       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0508      |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.00805      |
|    n_updates            | 15900        |
|    policy_gradient_loss | 0.00197      |
|    value_loss           | 0.0358       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 106          |
|    ep_rew_mean          | -106         |
| time/                   |              |
|    fps                  | 1353         |
|    iterations           | 1601         |
|    time_elapsed         | 2422         |
|    total_timesteps      | 3278848      |
| train/                  |              |
|    approx_kl            | 0.0018306791 |
|    clip_fraction        | 0.018        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0642      |
|    explained_variance   | 0.953        |
|    learning_rate        | 0.0003       |
|    loss                 | 14.2         |
|    n_updates            | 16000        |
|    policy_gradient_loss | -0.00376     |
|    value_loss           | 13.1         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 102          |
|    ep_rew_mean          | -102         |
| time/                   |              |
|    fps                  | 1353         |
|    iterations           | 1611         |
|    time_elapsed         | 2438         |
|    total_timesteps      | 3299328      |
| train/                  |              |
|    approx_kl            | 0.0008333378 |
|    clip_fraction        | 0.0277       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0612      |
|    explained_variance   | 0.927        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.326        |
|    n_updates            | 16100        |
|    policy_gradient_loss | 0.00116      |
|    value_loss           | 4.48         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.9         |
|    ep_rew_mean          | -99.9        |
| time/                   |              |
|    fps                  | 1353         |
|    iterations           | 1621         |
|    time_elapsed         | 2453         |
|    total_timesteps      | 3319808      |
| train/                  |              |
|    approx_kl            | 0.0027997117 |
|    clip_fraction        | 0.0234       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0564      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.000246     |
|    n_updates            | 16200        |
|    policy_gradient_loss | 0.000214     |
|    value_loss           | 0.0256       |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 164          |
|    ep_rew_mean          | -164         |
| time/                   |              |
|    fps                  | 1353         |
|    iterations           | 1631         |
|    time_elapsed         | 2468         |
|    total_timesteps      | 3340288      |
| train/                  |              |
|    approx_kl            | 0.0055031385 |
|    clip_fraction        | 0.0281       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0708      |
|    explained_variance   | 0.993        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.345        |
|    n_updates            | 16300        |
|    policy_gradient_loss | -0.000218    |
|    value_loss           | 1.63         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 155          |
|    ep_rew_mean          | -155         |
| time/                   |              |
|    fps                  | 1353         |
|    iterations           | 1641         |
|    time_elapsed         | 2482         |
|    total_timesteps      | 3360768      |
| train/                  |              |
|    approx_kl            | 0.0016547608 |
|    clip_fraction        | 0.0176       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0936      |
|    explained_variance   | 0.987        |
|    learning_rate        | 0.0003       |
|    loss                 | 5.89         |
|    n_updates            | 16400        |
|    policy_gradient_loss | -0.00157     |
|    value_loss           | 4.96         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 104          |
|    ep_rew_mean          | -104         |
| time/                   |              |
|    fps                  | 1353         |
|    iterations           | 1651         |
|    time_elapsed         | 2497         |
|    total_timesteps      | 3381248      |
| train/                  |              |
|    approx_kl            | 0.0032882392 |
|    clip_fraction        | 0.0202       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0459      |
|    explained_variance   | 0.991        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.16         |
|    n_updates            | 16500        |
|    policy_gradient_loss | 0.0019       |
|    value_loss           | 0.589        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 101           |
|    ep_rew_mean          | -101          |
| time/                   |               |
|    fps                  | 1354          |
|    iterations           | 1661          |
|    time_elapsed         | 2512          |
|    total_timesteps      | 3401728       |
| train/                  |               |
|    approx_kl            | 0.00058215676 |
|    clip_fraction        | 0.0111        |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0458       |
|    explained_variance   | 0.997         |
|    learning_rate        | 0.0003        |
|    loss                 | 0.0965        |
|    n_updates            | 16600         |
|    policy_gradient_loss | 0.000474      |
|    value_loss           | 0.342         |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.7         |
|    ep_rew_mean          | -99.7        |
| time/                   |              |
|    fps                  | 1354         |
|    iterations           | 1671         |
|    time_elapsed         | 2526         |
|    total_timesteps      | 3422208      |
| train/                  |              |
|    approx_kl            | 0.0011302631 |
|    clip_fraction        | 0.0121       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0434      |
|    explained_variance   | 0.985        |
|    learning_rate        | 0.0003       |
|    loss                 | 1.87         |
|    n_updates            | 16700        |
|    policy_gradient_loss | -0.00132     |
|    value_loss           | 2.92         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 100         |
|    ep_rew_mean          | -100        |
| time/                   |             |
|    fps                  | 1354        |
|    iterations           | 1681        |
|    time_elapsed         | 2542        |
|    total_timesteps      | 3442688     |
| train/                  |             |
|    approx_kl            | 0.004195101 |
|    clip_fraction        | 0.0201      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0399     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0393      |
|    n_updates            | 16800       |
|    policy_gradient_loss | 0.00131     |
|    value_loss           | 0.0498      |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.8

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 100          |
|    ep_rew_mean          | -100         |
| time/                   |              |
|    fps                  | 1354         |
|    iterations           | 1691         |
|    time_elapsed         | 2556         |
|    total_timesteps      | 3463168      |
| train/                  |              |
|    approx_kl            | 0.0024207076 |
|    clip_fraction        | 0.0197       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0515      |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0244       |
|    n_updates            | 16900        |
|    policy_gradient_loss | 0.00217      |
|    value_loss           | 0.0662       |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 104           |
|    ep_rew_mean          | -104          |
| time/                   |               |
|    fps                  | 1354          |
|    iterations           | 1701          |
|    time_elapsed         | 2571          |
|    total_timesteps      | 3483648       |
| train/                  |               |
|    approx_kl            | 0.00051011133 |
|    clip_fraction        | 0.00928       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0447       |
|    explained_variance   | 0.987         |
|    learning_rate        | 0.0003        |
|    loss                 | 0.441         |
|    n_updates            | 17000         |
|    policy_gradient_loss | -0.00161      |
|    value_loss           | 1.74          |
-------------------------------------------
-----------------------------------------
| rollout/                |       

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 100          |
|    ep_rew_mean          | -100         |
| time/                   |              |
|    fps                  | 1354         |
|    iterations           | 1711         |
|    time_elapsed         | 2587         |
|    total_timesteps      | 3504128      |
| train/                  |              |
|    approx_kl            | 0.0022445437 |
|    clip_fraction        | 0.0211       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0419      |
|    explained_variance   | 0.998        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0901       |
|    n_updates            | 17100        |
|    policy_gradient_loss | -0.000488    |
|    value_loss           | 0.324        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 101          |
|    ep_rew_mean          | -101         |
| time/                   |              |
|    fps                  | 1354         |
|    iterations           | 1721         |
|    time_elapsed         | 2601         |
|    total_timesteps      | 3524608      |
| train/                  |              |
|    approx_kl            | 0.0026510595 |
|    clip_fraction        | 0.0171       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0365      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0125       |
|    n_updates            | 17200        |
|    policy_gradient_loss | -0.00102     |
|    value_loss           | 0.0527       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.2         |
|    ep_rew_mean          | -99.2        |
| time/                   |              |
|    fps                  | 1354         |
|    iterations           | 1731         |
|    time_elapsed         | 2616         |
|    total_timesteps      | 3545088      |
| train/                  |              |
|    approx_kl            | 0.0010096777 |
|    clip_fraction        | 0.0138       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0512      |
|    explained_variance   | 0.976        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.835        |
|    n_updates            | 17300        |
|    policy_gradient_loss | -0.00111     |
|    value_loss           | 3.61         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.9         |
|    ep_rew_mean          | -98.9        |
| time/                   |              |
|    fps                  | 1355         |
|    iterations           | 1741         |
|    time_elapsed         | 2630         |
|    total_timesteps      | 3565568      |
| train/                  |              |
|    approx_kl            | 0.0034089135 |
|    clip_fraction        | 0.0171       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0367      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.00887      |
|    n_updates            | 17400        |
|    policy_gradient_loss | -0.00122     |
|    value_loss           | 0.0447       |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 114          |
|    ep_rew_mean          | -114         |
| time/                   |              |
|    fps                  | 1355         |
|    iterations           | 1751         |
|    time_elapsed         | 2645         |
|    total_timesteps      | 3586048      |
| train/                  |              |
|    approx_kl            | 0.0007427668 |
|    clip_fraction        | 0.00835      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0465      |
|    explained_variance   | 0.956        |
|    learning_rate        | 0.0003       |
|    loss                 | 13.9         |
|    n_updates            | 17500        |
|    policy_gradient_loss | -0.000811    |
|    value_loss           | 6.64         |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 103          |
|    ep_rew_mean          | -103         |
| time/                   |              |
|    fps                  | 1355         |
|    iterations           | 1761         |
|    time_elapsed         | 2660         |
|    total_timesteps      | 3606528      |
| train/                  |              |
|    approx_kl            | 0.0005710982 |
|    clip_fraction        | 0.013        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0469      |
|    explained_variance   | 0.968        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.27         |
|    n_updates            | 17600        |
|    policy_gradient_loss | -0.00177     |
|    value_loss           | 8.23         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 104           |
|    ep_rew_mean          | -104          |
| time/                   |               |
|    fps                  | 1355          |
|    iterations           | 1771          |
|    time_elapsed         | 2675          |
|    total_timesteps      | 3627008       |
| train/                  |               |
|    approx_kl            | 0.00047859873 |
|    clip_fraction        | 0.00977       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0582       |
|    explained_variance   | 0.906         |
|    learning_rate        | 0.0003        |
|    loss                 | 0.772         |
|    n_updates            | 17700         |
|    policy_gradient_loss | -1.91e-05     |
|    value_loss           | 12.3          |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 103          |
|    ep_rew_mean          | -103         |
| time/                   |              |
|    fps                  | 1355         |
|    iterations           | 1781         |
|    time_elapsed         | 2690         |
|    total_timesteps      | 3647488      |
| train/                  |              |
|    approx_kl            | 0.0019601085 |
|    clip_fraction        | 0.0191       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0607      |
|    explained_variance   | 0.986        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.433        |
|    n_updates            | 17800        |
|    policy_gradient_loss | -0.00115     |
|    value_loss           | 1.37         |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 111          |
|    ep_rew_mean          | -111         |
| time/                   |              |
|    fps                  | 1355         |
|    iterations           | 1791         |
|    time_elapsed         | 2706         |
|    total_timesteps      | 3667968      |
| train/                  |              |
|    approx_kl            | 0.0008821135 |
|    clip_fraction        | 0.0113       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0536      |
|    explained_variance   | 0.9          |
|    learning_rate        | 0.0003       |
|    loss                 | 7.71         |
|    n_updates            | 17900        |
|    policy_gradient_loss | -0.0019      |
|    value_loss           | 19.3         |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.9         |
|    ep_rew_mean          | -97.9        |
| time/                   |              |
|    fps                  | 1354         |
|    iterations           | 1801         |
|    time_elapsed         | 2722         |
|    total_timesteps      | 3688448      |
| train/                  |              |
|    approx_kl            | 0.0052800225 |
|    clip_fraction        | 0.0288       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0445      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.109        |
|    n_updates            | 18000        |
|    policy_gradient_loss | -0.000731    |
|    value_loss           | 0.0574       |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 101         |
|    ep_rew_mean          | -101        |
| time/                   |             |
|    fps                  | 1355        |
|    iterations           | 1811        |
|    time_elapsed         | 2736        |
|    total_timesteps      | 3708928     |
| train/                  |             |
|    approx_kl            | 0.000714342 |
|    clip_fraction        | 0.00698     |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0396     |
|    explained_variance   | 0.98        |
|    learning_rate        | 0.0003      |
|    loss                 | 0.265       |
|    n_updates            | 18100       |
|    policy_gradient_loss | -0.00223    |
|    value_loss           | 1.27        |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 101 

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 98          |
|    ep_rew_mean          | -98         |
| time/                   |             |
|    fps                  | 1355        |
|    iterations           | 1821        |
|    time_elapsed         | 2751        |
|    total_timesteps      | 3729408     |
| train/                  |             |
|    approx_kl            | 0.004943808 |
|    clip_fraction        | 0.0145      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0249     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0144      |
|    n_updates            | 18200       |
|    policy_gradient_loss | -0.000584   |
|    value_loss           | 0.0291      |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 98.1  

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 103          |
|    ep_rew_mean          | -103         |
| time/                   |              |
|    fps                  | 1355         |
|    iterations           | 1831         |
|    time_elapsed         | 2766         |
|    total_timesteps      | 3749888      |
| train/                  |              |
|    approx_kl            | 0.0029979348 |
|    clip_fraction        | 0.0408       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0784      |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0395       |
|    n_updates            | 18300        |
|    policy_gradient_loss | -0.00175     |
|    value_loss           | 0.0847       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 103          |
|    ep_rew_mean          | -103         |
| time/                   |              |
|    fps                  | 1356         |
|    iterations           | 1841         |
|    time_elapsed         | 2780         |
|    total_timesteps      | 3770368      |
| train/                  |              |
|    approx_kl            | 0.0017614823 |
|    clip_fraction        | 0.0155       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0698      |
|    explained_variance   | 0.975        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.814        |
|    n_updates            | 18400        |
|    policy_gradient_loss | -0.00281     |
|    value_loss           | 6.24         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 100          |
|    ep_rew_mean          | -100         |
| time/                   |              |
|    fps                  | 1356         |
|    iterations           | 1851         |
|    time_elapsed         | 2795         |
|    total_timesteps      | 3790848      |
| train/                  |              |
|    approx_kl            | 0.0020372262 |
|    clip_fraction        | 0.0189       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0599      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0171       |
|    n_updates            | 18500        |
|    policy_gradient_loss | 0.00119      |
|    value_loss           | 0.0414       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.5         |
|    ep_rew_mean          | -98.5        |
| time/                   |              |
|    fps                  | 1356         |
|    iterations           | 1861         |
|    time_elapsed         | 2809         |
|    total_timesteps      | 3811328      |
| train/                  |              |
|    approx_kl            | 0.0012431052 |
|    clip_fraction        | 0.0083       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.029       |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0208       |
|    n_updates            | 18600        |
|    policy_gradient_loss | -0.000466    |
|    value_loss           | 0.0492       |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 102         |
|    ep_rew_mean          | -102        |
| time/                   |             |
|    fps                  | 1356        |
|    iterations           | 1871        |
|    time_elapsed         | 2823        |
|    total_timesteps      | 3831808     |
| train/                  |             |
|    approx_kl            | 0.014183633 |
|    clip_fraction        | 0.0186      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.036      |
|    explained_variance   | 0.996       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.132       |
|    n_updates            | 18700       |
|    policy_gradient_loss | -0.00117    |
|    value_loss           | 0.243       |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.6

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 106         |
|    ep_rew_mean          | -106        |
| time/                   |             |
|    fps                  | 1356        |
|    iterations           | 1881        |
|    time_elapsed         | 2839        |
|    total_timesteps      | 3852288     |
| train/                  |             |
|    approx_kl            | 0.010986678 |
|    clip_fraction        | 0.0221      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0455     |
|    explained_variance   | 0.999       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0402      |
|    n_updates            | 18800       |
|    policy_gradient_loss | 0.00184     |
|    value_loss           | 0.123       |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 104 

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 102         |
|    ep_rew_mean          | -102        |
| time/                   |             |
|    fps                  | 1356        |
|    iterations           | 1891        |
|    time_elapsed         | 2854        |
|    total_timesteps      | 3872768     |
| train/                  |             |
|    approx_kl            | 0.029667713 |
|    clip_fraction        | 0.0543      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0777     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0106      |
|    n_updates            | 18900       |
|    policy_gradient_loss | -0.00816    |
|    value_loss           | 0.0722      |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 103 

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 101          |
|    ep_rew_mean          | -101         |
| time/                   |              |
|    fps                  | 1357         |
|    iterations           | 1901         |
|    time_elapsed         | 2868         |
|    total_timesteps      | 3893248      |
| train/                  |              |
|    approx_kl            | 0.0008955684 |
|    clip_fraction        | 0.0121       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0719      |
|    explained_variance   | 0.986        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.219        |
|    n_updates            | 19000        |
|    policy_gradient_loss | -0.000194    |
|    value_loss           | 0.825        |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 99.4        |
|    ep_rew_mean          | -99.4       |
| time/                   |             |
|    fps                  | 1357        |
|    iterations           | 1911        |
|    time_elapsed         | 2883        |
|    total_timesteps      | 3913728     |
| train/                  |             |
|    approx_kl            | 0.003407048 |
|    clip_fraction        | 0.025       |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0572     |
|    explained_variance   | 0.999       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.278       |
|    n_updates            | 19100       |
|    policy_gradient_loss | -0.00184    |
|    value_loss           | 0.184       |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 99.6  

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 98.6        |
|    ep_rew_mean          | -98.6       |
| time/                   |             |
|    fps                  | 1357        |
|    iterations           | 1921        |
|    time_elapsed         | 2898        |
|    total_timesteps      | 3934208     |
| train/                  |             |
|    approx_kl            | 0.004681878 |
|    clip_fraction        | 0.0206      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0374     |
|    explained_variance   | 0.997       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0427      |
|    n_updates            | 19200       |
|    policy_gradient_loss | -0.00303    |
|    value_loss           | 0.16        |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.6

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.6         |
|    ep_rew_mean          | -99.6        |
| time/                   |              |
|    fps                  | 1356         |
|    iterations           | 1931         |
|    time_elapsed         | 2914         |
|    total_timesteps      | 3954688      |
| train/                  |              |
|    approx_kl            | 0.0006576717 |
|    clip_fraction        | 0.0121       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0567      |
|    explained_variance   | 0.988        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.246        |
|    n_updates            | 19300        |
|    policy_gradient_loss | 0.00263      |
|    value_loss           | 0.643        |
------------------------------------------
----------------------------------------
| rollout/                |            |
|    ep_len_mea

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 100         |
|    ep_rew_mean          | -100        |
| time/                   |             |
|    fps                  | 1356        |
|    iterations           | 1941        |
|    time_elapsed         | 2930        |
|    total_timesteps      | 3975168     |
| train/                  |             |
|    approx_kl            | 0.001857871 |
|    clip_fraction        | 0.0133      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0472     |
|    explained_variance   | 0.968       |
|    learning_rate        | 0.0003      |
|    loss                 | 4.46        |
|    n_updates            | 19400       |
|    policy_gradient_loss | -0.00111    |
|    value_loss           | 9.16        |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 101   

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.5         |
|    ep_rew_mean          | -99.5        |
| time/                   |              |
|    fps                  | 1356         |
|    iterations           | 1951         |
|    time_elapsed         | 2945         |
|    total_timesteps      | 3995648      |
| train/                  |              |
|    approx_kl            | 0.0024256245 |
|    clip_fraction        | 0.0142       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0347      |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0155       |
|    n_updates            | 19500        |
|    policy_gradient_loss | -8.8e-05     |
|    value_loss           | 0.0405       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.6         |
|    ep_rew_mean          | -99.6        |
| time/                   |              |
|    fps                  | 1356         |
|    iterations           | 1961         |
|    time_elapsed         | 2960         |
|    total_timesteps      | 4016128      |
| train/                  |              |
|    approx_kl            | 0.0016960538 |
|    clip_fraction        | 0.0211       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0463      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0189       |
|    n_updates            | 19600        |
|    policy_gradient_loss | -0.00241     |
|    value_loss           | 0.0413       |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 105          |
|    ep_rew_mean          | -105         |
| time/                   |              |
|    fps                  | 1356         |
|    iterations           | 1971         |
|    time_elapsed         | 2975         |
|    total_timesteps      | 4036608      |
| train/                  |              |
|    approx_kl            | 0.0011291188 |
|    clip_fraction        | 0.017        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.042       |
|    explained_variance   | 0.972        |
|    learning_rate        | 0.0003       |
|    loss                 | 2.25         |
|    n_updates            | 19700        |
|    policy_gradient_loss | -0.0009      |
|    value_loss           | 6.01         |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 103           |
|    ep_rew_mean          | -103          |
| time/                   |               |
|    fps                  | 1357          |
|    iterations           | 1981          |
|    time_elapsed         | 2989          |
|    total_timesteps      | 4057088       |
| train/                  |               |
|    approx_kl            | 0.00047382092 |
|    clip_fraction        | 0.00591       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.05         |
|    explained_variance   | 0.984         |
|    learning_rate        | 0.0003        |
|    loss                 | 0.695         |
|    n_updates            | 19800         |
|    policy_gradient_loss | -0.00103      |
|    value_loss           | 4.38          |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 101          |
|    ep_rew_mean          | -101         |
| time/                   |              |
|    fps                  | 1357         |
|    iterations           | 1991         |
|    time_elapsed         | 3003         |
|    total_timesteps      | 4077568      |
| train/                  |              |
|    approx_kl            | 0.0010462921 |
|    clip_fraction        | 0.0139       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0636      |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0341       |
|    n_updates            | 19900        |
|    policy_gradient_loss | 0.000151     |
|    value_loss           | 0.0828       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 104          |
|    ep_rew_mean          | -104         |
| time/                   |              |
|    fps                  | 1357         |
|    iterations           | 2001         |
|    time_elapsed         | 3017         |
|    total_timesteps      | 4098048      |
| train/                  |              |
|    approx_kl            | 0.0010700698 |
|    clip_fraction        | 0.0136       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0483      |
|    explained_variance   | 0.99         |
|    learning_rate        | 0.0003       |
|    loss                 | 0.531        |
|    n_updates            | 20000        |
|    policy_gradient_loss | 0.000187     |
|    value_loss           | 1.25         |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 101          |
|    ep_rew_mean          | -101         |
| time/                   |              |
|    fps                  | 1357         |
|    iterations           | 2011         |
|    time_elapsed         | 3033         |
|    total_timesteps      | 4118528      |
| train/                  |              |
|    approx_kl            | 0.0023930098 |
|    clip_fraction        | 0.0201       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0333      |
|    explained_variance   | 0.998        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0559       |
|    n_updates            | 20100        |
|    policy_gradient_loss | 0.00341      |
|    value_loss           | 0.129        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 103          |
|    ep_rew_mean          | -103         |
| time/                   |              |
|    fps                  | 1357         |
|    iterations           | 2021         |
|    time_elapsed         | 3050         |
|    total_timesteps      | 4139008      |
| train/                  |              |
|    approx_kl            | 0.0015810133 |
|    clip_fraction        | 0.0133       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0351      |
|    explained_variance   | 0.99         |
|    learning_rate        | 0.0003       |
|    loss                 | 0.974        |
|    n_updates            | 20200        |
|    policy_gradient_loss | -0.000974    |
|    value_loss           | 2.79         |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 106          |
|    ep_rew_mean          | -106         |
| time/                   |              |
|    fps                  | 1357         |
|    iterations           | 2031         |
|    time_elapsed         | 3064         |
|    total_timesteps      | 4159488      |
| train/                  |              |
|    approx_kl            | 0.0045726323 |
|    clip_fraction        | 0.0312       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0824      |
|    explained_variance   | 0.991        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.289        |
|    n_updates            | 20300        |
|    policy_gradient_loss | -0.0033      |
|    value_loss           | 0.623        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 118          |
|    ep_rew_mean          | -118         |
| time/                   |              |
|    fps                  | 1357         |
|    iterations           | 2041         |
|    time_elapsed         | 3079         |
|    total_timesteps      | 4179968      |
| train/                  |              |
|    approx_kl            | 0.0021374691 |
|    clip_fraction        | 0.0186       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0607      |
|    explained_variance   | 0.957        |
|    learning_rate        | 0.0003       |
|    loss                 | 1.99         |
|    n_updates            | 20400        |
|    policy_gradient_loss | -0.00285     |
|    value_loss           | 6.12         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 102          |
|    ep_rew_mean          | -102         |
| time/                   |              |
|    fps                  | 1357         |
|    iterations           | 2051         |
|    time_elapsed         | 3093         |
|    total_timesteps      | 4200448      |
| train/                  |              |
|    approx_kl            | 0.0081104655 |
|    clip_fraction        | 0.0399       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0711      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0157       |
|    n_updates            | 20500        |
|    policy_gradient_loss | -0.00324     |
|    value_loss           | 0.0658       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 101         |
|    ep_rew_mean          | -101        |
| time/                   |             |
|    fps                  | 1358        |
|    iterations           | 2061        |
|    time_elapsed         | 3107        |
|    total_timesteps      | 4220928     |
| train/                  |             |
|    approx_kl            | 0.004794931 |
|    clip_fraction        | 0.0323      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0738     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.042       |
|    n_updates            | 20600       |
|    policy_gradient_loss | 0.00108     |
|    value_loss           | 0.0726      |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.2

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 101          |
|    ep_rew_mean          | -101         |
| time/                   |              |
|    fps                  | 1358         |
|    iterations           | 2071         |
|    time_elapsed         | 3122         |
|    total_timesteps      | 4241408      |
| train/                  |              |
|    approx_kl            | 0.0030127761 |
|    clip_fraction        | 0.019        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.052       |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0725       |
|    n_updates            | 20700        |
|    policy_gradient_loss | -0.000146    |
|    value_loss           | 0.0803       |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 97.9       |
|    ep_rew_mean          | -97.9      |
| time/                   |            |
|    fps                  | 1359       |
|    iterations           | 2081       |
|    time_elapsed         | 3135       |
|    total_timesteps      | 4261888    |
| train/                  |            |
|    approx_kl            | 0.00572055 |
|    clip_fraction        | 0.0252     |
|    clip_range           | 0.2        |
|    entropy_loss         | -0.0477    |
|    explained_variance   | 1          |
|    learning_rate        | 0.0003     |
|    loss                 | 0.0248     |
|    n_updates            | 20800      |
|    policy_gradient_loss | -0.000794  |
|    value_loss           | 0.0352     |
----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.2         |
|    ep_re

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 96.4        |
|    ep_rew_mean          | -96.4       |
| time/                   |             |
|    fps                  | 1359        |
|    iterations           | 2091        |
|    time_elapsed         | 3149        |
|    total_timesteps      | 4282368     |
| train/                  |             |
|    approx_kl            | 0.004537141 |
|    clip_fraction        | 0.024       |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0367     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.258       |
|    n_updates            | 20900       |
|    policy_gradient_loss | -0.00266    |
|    value_loss           | 0.104       |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.9

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.2         |
|    ep_rew_mean          | -99.2        |
| time/                   |              |
|    fps                  | 1359         |
|    iterations           | 2101         |
|    time_elapsed         | 3164         |
|    total_timesteps      | 4302848      |
| train/                  |              |
|    approx_kl            | 0.0036241102 |
|    clip_fraction        | 0.0167       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0286      |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0198       |
|    n_updates            | 21000        |
|    policy_gradient_loss | 0.00309      |
|    value_loss           | 0.0369       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.5         |
|    ep_rew_mean          | -98.5        |
| time/                   |              |
|    fps                  | 1359         |
|    iterations           | 2111         |
|    time_elapsed         | 3180         |
|    total_timesteps      | 4323328      |
| train/                  |              |
|    approx_kl            | 0.0017563398 |
|    clip_fraction        | 0.0125       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0379      |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0305       |
|    n_updates            | 21100        |
|    policy_gradient_loss | 0.00212      |
|    value_loss           | 0.0874       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.4         |
|    ep_rew_mean          | -99.4        |
| time/                   |              |
|    fps                  | 1359         |
|    iterations           | 2121         |
|    time_elapsed         | 3194         |
|    total_timesteps      | 4343808      |
| train/                  |              |
|    approx_kl            | 0.0064338357 |
|    clip_fraction        | 0.0234       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0457      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | -0.000758    |
|    n_updates            | 21200        |
|    policy_gradient_loss | -0.00182     |
|    value_loss           | 0.0218       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 99.6        |
|    ep_rew_mean          | -99.6       |
| time/                   |             |
|    fps                  | 1359        |
|    iterations           | 2131        |
|    time_elapsed         | 3210        |
|    total_timesteps      | 4364288     |
| train/                  |             |
|    approx_kl            | 0.012172111 |
|    clip_fraction        | 0.0334      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0529     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.00423     |
|    n_updates            | 21300       |
|    policy_gradient_loss | -0.00176    |
|    value_loss           | 0.0262      |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99  

----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 97.2       |
|    ep_rew_mean          | -97.2      |
| time/                   |            |
|    fps                  | 1359       |
|    iterations           | 2141       |
|    time_elapsed         | 3225       |
|    total_timesteps      | 4384768    |
| train/                  |            |
|    approx_kl            | 0.00114952 |
|    clip_fraction        | 0.0146     |
|    clip_range           | 0.2        |
|    entropy_loss         | -0.0333    |
|    explained_variance   | 1          |
|    learning_rate        | 0.0003     |
|    loss                 | 0.0119     |
|    n_updates            | 21400      |
|    policy_gradient_loss | 0.00116    |
|    value_loss           | 0.0302     |
----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 98.1        |
|    ep_rew_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.1         |
|    ep_rew_mean          | -99.1        |
| time/                   |              |
|    fps                  | 1358         |
|    iterations           | 2151         |
|    time_elapsed         | 3241         |
|    total_timesteps      | 4405248      |
| train/                  |              |
|    approx_kl            | 0.0027846124 |
|    clip_fraction        | 0.0149       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0344      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0155       |
|    n_updates            | 21500        |
|    policy_gradient_loss | -0.000543    |
|    value_loss           | 0.0386       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 107          |
|    ep_rew_mean          | -107         |
| time/                   |              |
|    fps                  | 1358         |
|    iterations           | 2161         |
|    time_elapsed         | 3258         |
|    total_timesteps      | 4425728      |
| train/                  |              |
|    approx_kl            | 0.0021587163 |
|    clip_fraction        | 0.0126       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0354      |
|    explained_variance   | 0.975        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.537        |
|    n_updates            | 21600        |
|    policy_gradient_loss | -0.00159     |
|    value_loss           | 3.22         |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 100         |
|    ep_rew_mean          | -100        |
| time/                   |             |
|    fps                  | 1357        |
|    iterations           | 2171        |
|    time_elapsed         | 3275        |
|    total_timesteps      | 4446208     |
| train/                  |             |
|    approx_kl            | 0.003527937 |
|    clip_fraction        | 0.0205      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0473     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0203      |
|    n_updates            | 21700       |
|    policy_gradient_loss | -0.00043    |
|    value_loss           | 0.0348      |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 104 

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 101          |
|    ep_rew_mean          | -101         |
| time/                   |              |
|    fps                  | 1357         |
|    iterations           | 2181         |
|    time_elapsed         | 3289         |
|    total_timesteps      | 4466688      |
| train/                  |              |
|    approx_kl            | 0.0010191915 |
|    clip_fraction        | 0.0146       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0432      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0237       |
|    n_updates            | 21800        |
|    policy_gradient_loss | 0.00202      |
|    value_loss           | 0.0331       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 106          |
|    ep_rew_mean          | -106         |
| time/                   |              |
|    fps                  | 1358         |
|    iterations           | 2191         |
|    time_elapsed         | 3303         |
|    total_timesteps      | 4487168      |
| train/                  |              |
|    approx_kl            | 0.0023673233 |
|    clip_fraction        | 0.0153       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0393      |
|    explained_variance   | 0.986        |
|    learning_rate        | 0.0003       |
|    loss                 | 9.83         |
|    n_updates            | 21900        |
|    policy_gradient_loss | -0.00109     |
|    value_loss           | 4.5          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 99.4       |
|    ep_rew_mean          | -99.4      |
| time/                   |            |
|    fps                  | 1357       |
|    iterations           | 2201       |
|    time_elapsed         | 3319       |
|    total_timesteps      | 4507648    |
| train/                  |            |
|    approx_kl            | 0.00168334 |
|    clip_fraction        | 0.019      |
|    clip_range           | 0.2        |
|    entropy_loss         | -0.0428    |
|    explained_variance   | 1          |
|    learning_rate        | 0.0003     |
|    loss                 | 0.0245     |
|    n_updates            | 22000      |
|    policy_gradient_loss | -0.00105   |
|    value_loss           | 0.0358     |
----------------------------------------
----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 104        |
|    ep_rew_mean

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 101          |
|    ep_rew_mean          | -101         |
| time/                   |              |
|    fps                  | 1357         |
|    iterations           | 2211         |
|    time_elapsed         | 3334         |
|    total_timesteps      | 4528128      |
| train/                  |              |
|    approx_kl            | 0.0031443369 |
|    clip_fraction        | 0.0163       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0514      |
|    explained_variance   | 0.998        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0273       |
|    n_updates            | 22100        |
|    policy_gradient_loss | 0.00322      |
|    value_loss           | 0.108        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.3         |
|    ep_rew_mean          | -99.3        |
| time/                   |              |
|    fps                  | 1357         |
|    iterations           | 2221         |
|    time_elapsed         | 3349         |
|    total_timesteps      | 4548608      |
| train/                  |              |
|    approx_kl            | 0.0005484184 |
|    clip_fraction        | 0.00942      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0478      |
|    explained_variance   | 0.962        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.07         |
|    n_updates            | 22200        |
|    policy_gradient_loss | 0.000513     |
|    value_loss           | 3.55         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 103          |
|    ep_rew_mean          | -103         |
| time/                   |              |
|    fps                  | 1357         |
|    iterations           | 2231         |
|    time_elapsed         | 3365         |
|    total_timesteps      | 4569088      |
| train/                  |              |
|    approx_kl            | 0.0006672746 |
|    clip_fraction        | 0.00869      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0357      |
|    explained_variance   | 0.984        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.547        |
|    n_updates            | 22300        |
|    policy_gradient_loss | -0.00133     |
|    value_loss           | 1.72         |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 102          |
|    ep_rew_mean          | -102         |
| time/                   |              |
|    fps                  | 1357         |
|    iterations           | 2241         |
|    time_elapsed         | 3380         |
|    total_timesteps      | 4589568      |
| train/                  |              |
|    approx_kl            | 0.0009013181 |
|    clip_fraction        | 0.00586      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0348      |
|    explained_variance   | 0.965        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.13         |
|    n_updates            | 22400        |
|    policy_gradient_loss | 0.000191     |
|    value_loss           | 1.2          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 103         |
|    ep_rew_mean          | -103        |
| time/                   |             |
|    fps                  | 1357        |
|    iterations           | 2251        |
|    time_elapsed         | 3396        |
|    total_timesteps      | 4610048     |
| train/                  |             |
|    approx_kl            | 0.029244874 |
|    clip_fraction        | 0.045       |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0468     |
|    explained_variance   | 0.999       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0199      |
|    n_updates            | 22500       |
|    policy_gradient_loss | -0.00308    |
|    value_loss           | 0.0622      |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 102 

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.9         |
|    ep_rew_mean          | -98.9        |
| time/                   |              |
|    fps                  | 1357         |
|    iterations           | 2261         |
|    time_elapsed         | 3412         |
|    total_timesteps      | 4630528      |
| train/                  |              |
|    approx_kl            | 0.0037175447 |
|    clip_fraction        | 0.0275       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.052       |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | -0.00115     |
|    n_updates            | 22600        |
|    policy_gradient_loss | 0.00129      |
|    value_loss           | 0.029        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 98.2       |
|    ep_rew_mean          | -98.2      |
| time/                   |            |
|    fps                  | 1356       |
|    iterations           | 2271       |
|    time_elapsed         | 3427       |
|    total_timesteps      | 4651008    |
| train/                  |            |
|    approx_kl            | 0.01365377 |
|    clip_fraction        | 0.0257     |
|    clip_range           | 0.2        |
|    entropy_loss         | -0.0424    |
|    explained_variance   | 1          |
|    learning_rate        | 0.0003     |
|    loss                 | 0.366      |
|    n_updates            | 22700      |
|    policy_gradient_loss | 0.00362    |
|    value_loss           | 0.0355     |
----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.6         |
|    ep_re

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 106          |
|    ep_rew_mean          | -106         |
| time/                   |              |
|    fps                  | 1356         |
|    iterations           | 2281         |
|    time_elapsed         | 3444         |
|    total_timesteps      | 4671488      |
| train/                  |              |
|    approx_kl            | 0.0017264124 |
|    clip_fraction        | 0.00801      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0373      |
|    explained_variance   | 0.973        |
|    learning_rate        | 0.0003       |
|    loss                 | 1.55         |
|    n_updates            | 22800        |
|    policy_gradient_loss | 0.00125      |
|    value_loss           | 5.49         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.8         |
|    ep_rew_mean          | -98.8        |
| time/                   |              |
|    fps                  | 1356         |
|    iterations           | 2291         |
|    time_elapsed         | 3459         |
|    total_timesteps      | 4691968      |
| train/                  |              |
|    approx_kl            | 0.0014312896 |
|    clip_fraction        | 0.0154       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0353      |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0156       |
|    n_updates            | 22900        |
|    policy_gradient_loss | 0.000267     |
|    value_loss           | 0.0407       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 109          |
|    ep_rew_mean          | -109         |
| time/                   |              |
|    fps                  | 1355         |
|    iterations           | 2301         |
|    time_elapsed         | 3475         |
|    total_timesteps      | 4712448      |
| train/                  |              |
|    approx_kl            | 0.0006394362 |
|    clip_fraction        | 0.0105       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0358      |
|    explained_variance   | 0.976        |
|    learning_rate        | 0.0003       |
|    loss                 | 1.37         |
|    n_updates            | 23000        |
|    policy_gradient_loss | -0.00059     |
|    value_loss           | 2.54         |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 106           |
|    ep_rew_mean          | -106          |
| time/                   |               |
|    fps                  | 1355          |
|    iterations           | 2311          |
|    time_elapsed         | 3491          |
|    total_timesteps      | 4732928       |
| train/                  |               |
|    approx_kl            | 0.00065638707 |
|    clip_fraction        | 0.00796       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0428       |
|    explained_variance   | 0.965         |
|    learning_rate        | 0.0003        |
|    loss                 | 3.59          |
|    n_updates            | 23100         |
|    policy_gradient_loss | -0.00053      |
|    value_loss           | 3.67          |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 112          |
|    ep_rew_mean          | -112         |
| time/                   |              |
|    fps                  | 1354         |
|    iterations           | 2321         |
|    time_elapsed         | 3508         |
|    total_timesteps      | 4753408      |
| train/                  |              |
|    approx_kl            | 0.0009423427 |
|    clip_fraction        | 0.0176       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0528      |
|    explained_variance   | 0.778        |
|    learning_rate        | 0.0003       |
|    loss                 | 5.47         |
|    n_updates            | 23200        |
|    policy_gradient_loss | 0.000543     |
|    value_loss           | 21.4         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 115          |
|    ep_rew_mean          | -115         |
| time/                   |              |
|    fps                  | 1354         |
|    iterations           | 2331         |
|    time_elapsed         | 3525         |
|    total_timesteps      | 4773888      |
| train/                  |              |
|    approx_kl            | 0.0015705763 |
|    clip_fraction        | 0.015        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0523      |
|    explained_variance   | 0.976        |
|    learning_rate        | 0.0003       |
|    loss                 | 5.24         |
|    n_updates            | 23300        |
|    policy_gradient_loss | -0.00129     |
|    value_loss           | 8.33         |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 105          |
|    ep_rew_mean          | -105         |
| time/                   |              |
|    fps                  | 1353         |
|    iterations           | 2341         |
|    time_elapsed         | 3540         |
|    total_timesteps      | 4794368      |
| train/                  |              |
|    approx_kl            | 0.0023348932 |
|    clip_fraction        | 0.021        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0471      |
|    explained_variance   | 0.984        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.316        |
|    n_updates            | 23400        |
|    policy_gradient_loss | -0.00058     |
|    value_loss           | 1.04         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 102          |
|    ep_rew_mean          | -102         |
| time/                   |              |
|    fps                  | 1354         |
|    iterations           | 2351         |
|    time_elapsed         | 3555         |
|    total_timesteps      | 4814848      |
| train/                  |              |
|    approx_kl            | 0.0018854459 |
|    clip_fraction        | 0.0237       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0567      |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0232       |
|    n_updates            | 23500        |
|    policy_gradient_loss | 2.51e-06     |
|    value_loss           | 0.0678       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 109         |
|    ep_rew_mean          | -109        |
| time/                   |             |
|    fps                  | 1353        |
|    iterations           | 2361        |
|    time_elapsed         | 3572        |
|    total_timesteps      | 4835328     |
| train/                  |             |
|    approx_kl            | 0.004085553 |
|    clip_fraction        | 0.0126      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0317     |
|    explained_variance   | 0.993       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.757       |
|    n_updates            | 23600       |
|    policy_gradient_loss | -0.00155    |
|    value_loss           | 1.53        |
-----------------------------------------
----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 106     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.2         |
|    ep_rew_mean          | -98.2        |
| time/                   |              |
|    fps                  | 1353         |
|    iterations           | 2371         |
|    time_elapsed         | 3588         |
|    total_timesteps      | 4855808      |
| train/                  |              |
|    approx_kl            | 0.0011287552 |
|    clip_fraction        | 0.00903      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0402      |
|    explained_variance   | 0.996        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0584       |
|    n_updates            | 23700        |
|    policy_gradient_loss | -0.00153     |
|    value_loss           | 0.215        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.1         |
|    ep_rew_mean          | -99.1        |
| time/                   |              |
|    fps                  | 1352         |
|    iterations           | 2381         |
|    time_elapsed         | 3604         |
|    total_timesteps      | 4876288      |
| train/                  |              |
|    approx_kl            | 0.0019606622 |
|    clip_fraction        | 0.0105       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0305      |
|    explained_variance   | 0.995        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0983       |
|    n_updates            | 23800        |
|    policy_gradient_loss | -0.000356    |
|    value_loss           | 0.373        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.8         |
|    ep_rew_mean          | -97.8        |
| time/                   |              |
|    fps                  | 1352         |
|    iterations           | 2391         |
|    time_elapsed         | 3619         |
|    total_timesteps      | 4896768      |
| train/                  |              |
|    approx_kl            | 0.0033330326 |
|    clip_fraction        | 0.0125       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0244      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0083       |
|    n_updates            | 23900        |
|    policy_gradient_loss | 0.000703     |
|    value_loss           | 0.0222       |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 99.9        |
|    ep_rew_mean          | -99.9       |
| time/                   |             |
|    fps                  | 1352        |
|    iterations           | 2401        |
|    time_elapsed         | 3634        |
|    total_timesteps      | 4917248     |
| train/                  |             |
|    approx_kl            | 0.008839597 |
|    clip_fraction        | 0.017       |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0401     |
|    explained_variance   | 0.995       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0843      |
|    n_updates            | 24000       |
|    policy_gradient_loss | -0.00144    |
|    value_loss           | 0.494       |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 101   

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98           |
|    ep_rew_mean          | -98          |
| time/                   |              |
|    fps                  | 1352         |
|    iterations           | 2411         |
|    time_elapsed         | 3650         |
|    total_timesteps      | 4937728      |
| train/                  |              |
|    approx_kl            | 0.0026805769 |
|    clip_fraction        | 0.00996      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0354      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0155       |
|    n_updates            | 24100        |
|    policy_gradient_loss | 0.00176      |
|    value_loss           | 0.0294       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.5         |
|    ep_rew_mean          | -99.5        |
| time/                   |              |
|    fps                  | 1352         |
|    iterations           | 2421         |
|    time_elapsed         | 3665         |
|    total_timesteps      | 4958208      |
| train/                  |              |
|    approx_kl            | 0.0038684288 |
|    clip_fraction        | 0.0126       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0298      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0103       |
|    n_updates            | 24200        |
|    policy_gradient_loss | -0.00204     |
|    value_loss           | 0.0652       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 100          |
|    ep_rew_mean          | -100         |
| time/                   |              |
|    fps                  | 1352         |
|    iterations           | 2431         |
|    time_elapsed         | 3680         |
|    total_timesteps      | 4978688      |
| train/                  |              |
|    approx_kl            | 0.0017532231 |
|    clip_fraction        | 0.0127       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0366      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.00821      |
|    n_updates            | 24300        |
|    policy_gradient_loss | 0.00189      |
|    value_loss           | 0.02         |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 101         |
|    ep_rew_mean          | -101        |
| time/                   |             |
|    fps                  | 1352        |
|    iterations           | 2441        |
|    time_elapsed         | 3695        |
|    total_timesteps      | 4999168     |
| train/                  |             |
|    approx_kl            | 0.007066385 |
|    clip_fraction        | 0.0107      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0493     |
|    explained_variance   | 0.968       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0763      |
|    n_updates            | 24400       |
|    policy_gradient_loss | 0.00271     |
|    value_loss           | 3.3         |
-----------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 10

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.6         |
|    ep_rew_mean          | -97.6        |
| time/                   |              |
|    fps                  | 1352         |
|    iterations           | 2451         |
|    time_elapsed         | 3711         |
|    total_timesteps      | 5019648      |
| train/                  |              |
|    approx_kl            | 0.0015140545 |
|    clip_fraction        | 0.0232       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0491      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0157       |
|    n_updates            | 24500        |
|    policy_gradient_loss | -0.00227     |
|    value_loss           | 0.0299       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 101          |
|    ep_rew_mean          | -101         |
| time/                   |              |
|    fps                  | 1352         |
|    iterations           | 2461         |
|    time_elapsed         | 3726         |
|    total_timesteps      | 5040128      |
| train/                  |              |
|    approx_kl            | 0.0019886969 |
|    clip_fraction        | 0.0119       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0343      |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0249       |
|    n_updates            | 24600        |
|    policy_gradient_loss | 0.000943     |
|    value_loss           | 0.0903       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 104          |
|    ep_rew_mean          | -104         |
| time/                   |              |
|    fps                  | 1352         |
|    iterations           | 2471         |
|    time_elapsed         | 3741         |
|    total_timesteps      | 5060608      |
| train/                  |              |
|    approx_kl            | 0.0031336492 |
|    clip_fraction        | 0.0106       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0318      |
|    explained_variance   | 0.991        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.388        |
|    n_updates            | 24700        |
|    policy_gradient_loss | -0.00226     |
|    value_loss           | 0.771        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.5         |
|    ep_rew_mean          | -99.5        |
| time/                   |              |
|    fps                  | 1352         |
|    iterations           | 2481         |
|    time_elapsed         | 3757         |
|    total_timesteps      | 5081088      |
| train/                  |              |
|    approx_kl            | 0.0011461554 |
|    clip_fraction        | 0.0122       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0443      |
|    explained_variance   | 0.994        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.135        |
|    n_updates            | 24800        |
|    policy_gradient_loss | 0.00113      |
|    value_loss           | 0.257        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.6         |
|    ep_rew_mean          | -97.6        |
| time/                   |              |
|    fps                  | 1352         |
|    iterations           | 2491         |
|    time_elapsed         | 3772         |
|    total_timesteps      | 5101568      |
| train/                  |              |
|    approx_kl            | 0.0009866816 |
|    clip_fraction        | 0.0138       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.034       |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.00884      |
|    n_updates            | 24900        |
|    policy_gradient_loss | 0.000241     |
|    value_loss           | 0.0395       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.6         |
|    ep_rew_mean          | -97.6        |
| time/                   |              |
|    fps                  | 1351         |
|    iterations           | 2501         |
|    time_elapsed         | 3789         |
|    total_timesteps      | 5122048      |
| train/                  |              |
|    approx_kl            | 0.0074198185 |
|    clip_fraction        | 0.015        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0294      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | -0.00786     |
|    n_updates            | 25000        |
|    policy_gradient_loss | -0.00238     |
|    value_loss           | 0.0199       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 102          |
|    ep_rew_mean          | -102         |
| time/                   |              |
|    fps                  | 1351         |
|    iterations           | 2511         |
|    time_elapsed         | 3805         |
|    total_timesteps      | 5142528      |
| train/                  |              |
|    approx_kl            | 0.0012562945 |
|    clip_fraction        | 0.00483      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0278      |
|    explained_variance   | 0.982        |
|    learning_rate        | 0.0003       |
|    loss                 | 1.98         |
|    n_updates            | 25100        |
|    policy_gradient_loss | 0.000258     |
|    value_loss           | 2.65         |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.8         |
|    ep_rew_mean          | -97.8        |
| time/                   |              |
|    fps                  | 1350         |
|    iterations           | 2521         |
|    time_elapsed         | 3822         |
|    total_timesteps      | 5163008      |
| train/                  |              |
|    approx_kl            | 0.0010787254 |
|    clip_fraction        | 0.0141       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0298      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0197       |
|    n_updates            | 25200        |
|    policy_gradient_loss | 0.00171      |
|    value_loss           | 0.0187       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.1         |
|    ep_rew_mean          | -99.1        |
| time/                   |              |
|    fps                  | 1350         |
|    iterations           | 2531         |
|    time_elapsed         | 3837         |
|    total_timesteps      | 5183488      |
| train/                  |              |
|    approx_kl            | 0.0017002188 |
|    clip_fraction        | 0.00659      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.028       |
|    explained_variance   | 0.984        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0802       |
|    n_updates            | 25300        |
|    policy_gradient_loss | 0.000403     |
|    value_loss           | 1.34         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.8         |
|    ep_rew_mean          | -97.8        |
| time/                   |              |
|    fps                  | 1350         |
|    iterations           | 2541         |
|    time_elapsed         | 3852         |
|    total_timesteps      | 5203968      |
| train/                  |              |
|    approx_kl            | 0.0022549825 |
|    clip_fraction        | 0.0121       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0217      |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.00708      |
|    n_updates            | 25400        |
|    policy_gradient_loss | 0.00109      |
|    value_loss           | 0.034        |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.1         |
|    ep_rew_mean          | -97.1        |
| time/                   |              |
|    fps                  | 1349         |
|    iterations           | 2551         |
|    time_elapsed         | 3870         |
|    total_timesteps      | 5224448      |
| train/                  |              |
|    approx_kl            | 0.0013512201 |
|    clip_fraction        | 0.0122       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.033       |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0123       |
|    n_updates            | 25500        |
|    policy_gradient_loss | -3.47e-05    |
|    value_loss           | 0.0222       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.9         |
|    ep_rew_mean          | -98.9        |
| time/                   |              |
|    fps                  | 1349         |
|    iterations           | 2561         |
|    time_elapsed         | 3886         |
|    total_timesteps      | 5244928      |
| train/                  |              |
|    approx_kl            | 0.0098562315 |
|    clip_fraction        | 0.0189       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0313      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | -0.000884    |
|    n_updates            | 25600        |
|    policy_gradient_loss | -0.000508    |
|    value_loss           | 0.0267       |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 97.5        |
|    ep_rew_mean          | -97.5       |
| time/                   |             |
|    fps                  | 1349        |
|    iterations           | 2571        |
|    time_elapsed         | 3901        |
|    total_timesteps      | 5265408     |
| train/                  |             |
|    approx_kl            | 0.001996403 |
|    clip_fraction        | 0.00923     |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0296     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0146      |
|    n_updates            | 25700       |
|    policy_gradient_loss | 0.000853    |
|    value_loss           | 0.0219      |
-----------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 97

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 97.8        |
|    ep_rew_mean          | -97.8       |
| time/                   |             |
|    fps                  | 1349        |
|    iterations           | 2581        |
|    time_elapsed         | 3916        |
|    total_timesteps      | 5285888     |
| train/                  |             |
|    approx_kl            | 0.002533838 |
|    clip_fraction        | 0.0127      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0211     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0107      |
|    n_updates            | 25800       |
|    policy_gradient_loss | 0.000458    |
|    value_loss           | 0.0196      |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98  

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 100         |
|    ep_rew_mean          | -100        |
| time/                   |             |
|    fps                  | 1349        |
|    iterations           | 2591        |
|    time_elapsed         | 3931        |
|    total_timesteps      | 5306368     |
| train/                  |             |
|    approx_kl            | 0.033184145 |
|    clip_fraction        | 0.0139      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0272     |
|    explained_variance   | 0.981       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.195       |
|    n_updates            | 25900       |
|    policy_gradient_loss | 0.0066      |
|    value_loss           | 0.958       |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 100 

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.3         |
|    ep_rew_mean          | -98.3        |
| time/                   |              |
|    fps                  | 1349         |
|    iterations           | 2601         |
|    time_elapsed         | 3948         |
|    total_timesteps      | 5326848      |
| train/                  |              |
|    approx_kl            | 0.0064319326 |
|    clip_fraction        | 0.0115       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0207      |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.016        |
|    n_updates            | 26000        |
|    policy_gradient_loss | -0.000434    |
|    value_loss           | 0.155        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 98.7        |
|    ep_rew_mean          | -98.7       |
| time/                   |             |
|    fps                  | 1348        |
|    iterations           | 2611        |
|    time_elapsed         | 3964        |
|    total_timesteps      | 5347328     |
| train/                  |             |
|    approx_kl            | 0.003536258 |
|    clip_fraction        | 0.0147      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.034      |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.00462     |
|    n_updates            | 26100       |
|    policy_gradient_loss | -0.000284   |
|    value_loss           | 0.0195      |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.5

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 108           |
|    ep_rew_mean          | -108          |
| time/                   |               |
|    fps                  | 1349          |
|    iterations           | 2621          |
|    time_elapsed         | 3978          |
|    total_timesteps      | 5367808       |
| train/                  |               |
|    approx_kl            | 0.00023539714 |
|    clip_fraction        | 0.00669       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0385       |
|    explained_variance   | 0.989         |
|    learning_rate        | 0.0003        |
|    loss                 | 3.01          |
|    n_updates            | 26200         |
|    policy_gradient_loss | -0.000823     |
|    value_loss           | 3.21          |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.9         |
|    ep_rew_mean          | -97.9        |
| time/                   |              |
|    fps                  | 1349         |
|    iterations           | 2631         |
|    time_elapsed         | 3993         |
|    total_timesteps      | 5388288      |
| train/                  |              |
|    approx_kl            | 0.0018368545 |
|    clip_fraction        | 0.0114       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0281      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0159       |
|    n_updates            | 26300        |
|    policy_gradient_loss | -0.0011      |
|    value_loss           | 0.0272       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 98.8        |
|    ep_rew_mean          | -98.8       |
| time/                   |             |
|    fps                  | 1349        |
|    iterations           | 2641        |
|    time_elapsed         | 4008        |
|    total_timesteps      | 5408768     |
| train/                  |             |
|    approx_kl            | 0.007213501 |
|    clip_fraction        | 0.0184      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0359     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.00992     |
|    n_updates            | 26400       |
|    policy_gradient_loss | 0.00198     |
|    value_loss           | 0.0239      |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 98.3  

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98           |
|    ep_rew_mean          | -98          |
| time/                   |              |
|    fps                  | 1349         |
|    iterations           | 2651         |
|    time_elapsed         | 4023         |
|    total_timesteps      | 5429248      |
| train/                  |              |
|    approx_kl            | 0.0039104386 |
|    clip_fraction        | 0.0195       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0358      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0117       |
|    n_updates            | 26500        |
|    policy_gradient_loss | 0.000382     |
|    value_loss           | 0.0204       |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 103         |
|    ep_rew_mean          | -103        |
| time/                   |             |
|    fps                  | 1349        |
|    iterations           | 2661        |
|    time_elapsed         | 4038        |
|    total_timesteps      | 5449728     |
| train/                  |             |
|    approx_kl            | 0.000476908 |
|    clip_fraction        | 0.00581     |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.03       |
|    explained_variance   | 0.95        |
|    learning_rate        | 0.0003      |
|    loss                 | 3.28        |
|    n_updates            | 26600       |
|    policy_gradient_loss | -0.00195    |
|    value_loss           | 10.2        |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 103 

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 98.2        |
|    ep_rew_mean          | -98.2       |
| time/                   |             |
|    fps                  | 1349        |
|    iterations           | 2671        |
|    time_elapsed         | 4052        |
|    total_timesteps      | 5470208     |
| train/                  |             |
|    approx_kl            | 0.002505983 |
|    clip_fraction        | 0.013       |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0392     |
|    explained_variance   | 0.977       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0879      |
|    n_updates            | 26700       |
|    policy_gradient_loss | -0.00112    |
|    value_loss           | 1.5         |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.8

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.8         |
|    ep_rew_mean          | -97.8        |
| time/                   |              |
|    fps                  | 1349         |
|    iterations           | 2681         |
|    time_elapsed         | 4068         |
|    total_timesteps      | 5490688      |
| train/                  |              |
|    approx_kl            | 0.0020053526 |
|    clip_fraction        | 0.0155       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0425      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.00557      |
|    n_updates            | 26800        |
|    policy_gradient_loss | 0.000307     |
|    value_loss           | 0.0184       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 106          |
|    ep_rew_mean          | -106         |
| time/                   |              |
|    fps                  | 1349         |
|    iterations           | 2691         |
|    time_elapsed         | 4084         |
|    total_timesteps      | 5511168      |
| train/                  |              |
|    approx_kl            | 0.0012678695 |
|    clip_fraction        | 0.0103       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0294      |
|    explained_variance   | 0.993        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.128        |
|    n_updates            | 26900        |
|    policy_gradient_loss | 0.000219     |
|    value_loss           | 0.337        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.9         |
|    ep_rew_mean          | -98.9        |
| time/                   |              |
|    fps                  | 1349         |
|    iterations           | 2701         |
|    time_elapsed         | 4099         |
|    total_timesteps      | 5531648      |
| train/                  |              |
|    approx_kl            | 0.0016651493 |
|    clip_fraction        | 0.0132       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0365      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.197        |
|    n_updates            | 27000        |
|    policy_gradient_loss | 0.00487      |
|    value_loss           | 0.0274       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 102         |
|    ep_rew_mean          | -102        |
| time/                   |             |
|    fps                  | 1349        |
|    iterations           | 2711        |
|    time_elapsed         | 4115        |
|    total_timesteps      | 5552128     |
| train/                  |             |
|    approx_kl            | 0.005698529 |
|    clip_fraction        | 0.0124      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0258     |
|    explained_variance   | 0.992       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.143       |
|    n_updates            | 27100       |
|    policy_gradient_loss | -0.000536   |
|    value_loss           | 1.42        |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.6

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.8         |
|    ep_rew_mean          | -99.8        |
| time/                   |              |
|    fps                  | 1349         |
|    iterations           | 2721         |
|    time_elapsed         | 4130         |
|    total_timesteps      | 5572608      |
| train/                  |              |
|    approx_kl            | 0.0020463574 |
|    clip_fraction        | 0.0118       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0313      |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0386       |
|    n_updates            | 27200        |
|    policy_gradient_loss | -0.000355    |
|    value_loss           | 0.0978       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 99.4        |
|    ep_rew_mean          | -99.4       |
| time/                   |             |
|    fps                  | 1348        |
|    iterations           | 2731        |
|    time_elapsed         | 4146        |
|    total_timesteps      | 5593088     |
| train/                  |             |
|    approx_kl            | 0.002400091 |
|    clip_fraction        | 0.0172      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0294     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.00767     |
|    n_updates            | 27300       |
|    policy_gradient_loss | 0.000372    |
|    value_loss           | 0.0178      |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 100 

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 97.2        |
|    ep_rew_mean          | -97.2       |
| time/                   |             |
|    fps                  | 1348        |
|    iterations           | 2741        |
|    time_elapsed         | 4162        |
|    total_timesteps      | 5613568     |
| train/                  |             |
|    approx_kl            | 0.044075698 |
|    clip_fraction        | 0.0236      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0497     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0132      |
|    n_updates            | 27400       |
|    policy_gradient_loss | -0.002      |
|    value_loss           | 0.0199      |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.7

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.4         |
|    ep_rew_mean          | -99.4        |
| time/                   |              |
|    fps                  | 1348         |
|    iterations           | 2751         |
|    time_elapsed         | 4176         |
|    total_timesteps      | 5634048      |
| train/                  |              |
|    approx_kl            | 0.0031641056 |
|    clip_fraction        | 0.0261       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0417      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | -0.00262     |
|    n_updates            | 27500        |
|    policy_gradient_loss | -0.0039      |
|    value_loss           | 0.0199       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.8         |
|    ep_rew_mean          | -98.8        |
| time/                   |              |
|    fps                  | 1348         |
|    iterations           | 2761         |
|    time_elapsed         | 4192         |
|    total_timesteps      | 5654528      |
| train/                  |              |
|    approx_kl            | 0.0057295687 |
|    clip_fraction        | 0.0232       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.036       |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.000326     |
|    n_updates            | 27600        |
|    policy_gradient_loss | 0.00251      |
|    value_loss           | 0.0432       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.2         |
|    ep_rew_mean          | -98.2        |
| time/                   |              |
|    fps                  | 1348         |
|    iterations           | 2771         |
|    time_elapsed         | 4207         |
|    total_timesteps      | 5675008      |
| train/                  |              |
|    approx_kl            | 0.0016016176 |
|    clip_fraction        | 0.013        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0321      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0154       |
|    n_updates            | 27700        |
|    policy_gradient_loss | 0.000751     |
|    value_loss           | 0.0188       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.6         |
|    ep_rew_mean          | -97.6        |
| time/                   |              |
|    fps                  | 1347         |
|    iterations           | 2781         |
|    time_elapsed         | 4225         |
|    total_timesteps      | 5695488      |
| train/                  |              |
|    approx_kl            | 0.0014827093 |
|    clip_fraction        | 0.0134       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.035       |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.00393      |
|    n_updates            | 27800        |
|    policy_gradient_loss | 0.00295      |
|    value_loss           | 0.0128       |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

---------------------------------------
| rollout/                |           |
|    ep_len_mean          | 98.6      |
|    ep_rew_mean          | -98.6     |
| time/                   |           |
|    fps                  | 1346      |
|    iterations           | 2791      |
|    time_elapsed         | 4245      |
|    total_timesteps      | 5715968   |
| train/                  |           |
|    approx_kl            | 0.0015819 |
|    clip_fraction        | 0.0104    |
|    clip_range           | 0.2       |
|    entropy_loss         | -0.0308   |
|    explained_variance   | 1         |
|    learning_rate        | 0.0003    |
|    loss                 | 0.0208    |
|    n_updates            | 27900     |
|    policy_gradient_loss | -0.000739 |
|    value_loss           | 0.0342    |
---------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.2         |
|    ep_rew_mean          | -98

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.2         |
|    ep_rew_mean          | -98.2        |
| time/                   |              |
|    fps                  | 1346         |
|    iterations           | 2801         |
|    time_elapsed         | 4260         |
|    total_timesteps      | 5736448      |
| train/                  |              |
|    approx_kl            | 0.0023297486 |
|    clip_fraction        | 0.0228       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0412      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0216       |
|    n_updates            | 28000        |
|    policy_gradient_loss | -0.00103     |
|    value_loss           | 0.0169       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 98.7        |
|    ep_rew_mean          | -98.7       |
| time/                   |             |
|    fps                  | 1346        |
|    iterations           | 2811        |
|    time_elapsed         | 4275        |
|    total_timesteps      | 5756928     |
| train/                  |             |
|    approx_kl            | 0.002039297 |
|    clip_fraction        | 0.013       |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0306     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0102      |
|    n_updates            | 28100       |
|    policy_gradient_loss | 0.000632    |
|    value_loss           | 0.0223      |
-----------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 97

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.7         |
|    ep_rew_mean          | -98.7        |
| time/                   |              |
|    fps                  | 1345         |
|    iterations           | 2821         |
|    time_elapsed         | 4293         |
|    total_timesteps      | 5777408      |
| train/                  |              |
|    approx_kl            | 0.0057810782 |
|    clip_fraction        | 0.0125       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0271      |
|    explained_variance   | 0.969        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.331        |
|    n_updates            | 28200        |
|    policy_gradient_loss | -0.00166     |
|    value_loss           | 4.36         |
------------------------------------------
----------------------------------------
| rollout/                |            |
|    ep_len_mea

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 102          |
|    ep_rew_mean          | -102         |
| time/                   |              |
|    fps                  | 1345         |
|    iterations           | 2831         |
|    time_elapsed         | 4308         |
|    total_timesteps      | 5797888      |
| train/                  |              |
|    approx_kl            | 0.0020256185 |
|    clip_fraction        | 0.00566      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0363      |
|    explained_variance   | 0.972        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.376        |
|    n_updates            | 28300        |
|    policy_gradient_loss | -0.00144     |
|    value_loss           | 2.26         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 98.6        |
|    ep_rew_mean          | -98.6       |
| time/                   |             |
|    fps                  | 1345        |
|    iterations           | 2841        |
|    time_elapsed         | 4323        |
|    total_timesteps      | 5818368     |
| train/                  |             |
|    approx_kl            | 0.001707307 |
|    clip_fraction        | 0.0173      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0399     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.00748     |
|    n_updates            | 28400       |
|    policy_gradient_loss | 0.00062     |
|    value_loss           | 0.0207      |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.5

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.8         |
|    ep_rew_mean          | -98.8        |
| time/                   |              |
|    fps                  | 1346         |
|    iterations           | 2851         |
|    time_elapsed         | 4337         |
|    total_timesteps      | 5838848      |
| train/                  |              |
|    approx_kl            | 0.0033134704 |
|    clip_fraction        | 0.0154       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0273      |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.06         |
|    n_updates            | 28500        |
|    policy_gradient_loss | 0.00093      |
|    value_loss           | 0.151        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 98.2        |
|    ep_rew_mean          | -98.2       |
| time/                   |             |
|    fps                  | 1346        |
|    iterations           | 2861        |
|    time_elapsed         | 4352        |
|    total_timesteps      | 5859328     |
| train/                  |             |
|    approx_kl            | 0.003833075 |
|    clip_fraction        | 0.0235      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0507     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | -0.00349    |
|    n_updates            | 28600       |
|    policy_gradient_loss | 0.00272     |
|    value_loss           | 0.0173      |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 98.4  

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.7         |
|    ep_rew_mean          | -97.7        |
| time/                   |              |
|    fps                  | 1346         |
|    iterations           | 2871         |
|    time_elapsed         | 4366         |
|    total_timesteps      | 5879808      |
| train/                  |              |
|    approx_kl            | 0.0059461077 |
|    clip_fraction        | 0.0165       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0297      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0103       |
|    n_updates            | 28700        |
|    policy_gradient_loss | -0.00158     |
|    value_loss           | 0.0204       |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.3         |
|    ep_rew_mean          | -97.3        |
| time/                   |              |
|    fps                  | 1346         |
|    iterations           | 2881         |
|    time_elapsed         | 4380         |
|    total_timesteps      | 5900288      |
| train/                  |              |
|    approx_kl            | 0.0016462153 |
|    clip_fraction        | 0.0158       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0462      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.00138      |
|    n_updates            | 28800        |
|    policy_gradient_loss | -0.000307    |
|    value_loss           | 0.0216       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 95.6         |
|    ep_rew_mean          | -95.6        |
| time/                   |              |
|    fps                  | 1346         |
|    iterations           | 2891         |
|    time_elapsed         | 4396         |
|    total_timesteps      | 5920768      |
| train/                  |              |
|    approx_kl            | 0.0006338702 |
|    clip_fraction        | 0.00933      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0275      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.00856      |
|    n_updates            | 28900        |
|    policy_gradient_loss | 0.00104      |
|    value_loss           | 0.012        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 98.9          |
|    ep_rew_mean          | -98.9         |
| time/                   |               |
|    fps                  | 1346          |
|    iterations           | 2901          |
|    time_elapsed         | 4410          |
|    total_timesteps      | 5941248       |
| train/                  |               |
|    approx_kl            | 0.00027414894 |
|    clip_fraction        | 0.00342       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0254       |
|    explained_variance   | 0.996         |
|    learning_rate        | 0.0003        |
|    loss                 | 0.208         |
|    n_updates            | 29000         |
|    policy_gradient_loss | 4.56e-05      |
|    value_loss           | 0.674         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 98.2        |
|    ep_rew_mean          | -98.2       |
| time/                   |             |
|    fps                  | 1346        |
|    iterations           | 2911        |
|    time_elapsed         | 4425        |
|    total_timesteps      | 5961728     |
| train/                  |             |
|    approx_kl            | 0.003521989 |
|    clip_fraction        | 0.0114      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0232     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0186      |
|    n_updates            | 29100       |
|    policy_gradient_loss | -0.000102   |
|    value_loss           | 0.0182      |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.9

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.5         |
|    ep_rew_mean          | -97.5        |
| time/                   |              |
|    fps                  | 1346         |
|    iterations           | 2921         |
|    time_elapsed         | 4442         |
|    total_timesteps      | 5982208      |
| train/                  |              |
|    approx_kl            | 0.0028039669 |
|    clip_fraction        | 0.0123       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0201      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.00617      |
|    n_updates            | 29200        |
|    policy_gradient_loss | 0.00083      |
|    value_loss           | 0.0327       |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 101           |
|    ep_rew_mean          | -101          |
| time/                   |               |
|    fps                  | 1346          |
|    iterations           | 2931          |
|    time_elapsed         | 4457          |
|    total_timesteps      | 6002688       |
| train/                  |               |
|    approx_kl            | 0.00030486216 |
|    clip_fraction        | 0.00181       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0178       |
|    explained_variance   | 0.993         |
|    learning_rate        | 0.0003        |
|    loss                 | 0.129         |
|    n_updates            | 29300         |
|    policy_gradient_loss | -0.000813     |
|    value_loss           | 1.67          |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.6         |
|    ep_rew_mean          | -97.6        |
| time/                   |              |
|    fps                  | 1346         |
|    iterations           | 2941         |
|    time_elapsed         | 4472         |
|    total_timesteps      | 6023168      |
| train/                  |              |
|    approx_kl            | 0.0018279968 |
|    clip_fraction        | 0.0124       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0253      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0189       |
|    n_updates            | 29400        |
|    policy_gradient_loss | 0.00355      |
|    value_loss           | 0.0311       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 100          |
|    ep_rew_mean          | -100         |
| time/                   |              |
|    fps                  | 1346         |
|    iterations           | 2951         |
|    time_elapsed         | 4487         |
|    total_timesteps      | 6043648      |
| train/                  |              |
|    approx_kl            | 0.0029971672 |
|    clip_fraction        | 0.0241       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0407      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0176       |
|    n_updates            | 29500        |
|    policy_gradient_loss | -0.000501    |
|    value_loss           | 0.0161       |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 97.2        |
|    ep_rew_mean          | -97.2       |
| time/                   |             |
|    fps                  | 1346        |
|    iterations           | 2961        |
|    time_elapsed         | 4502        |
|    total_timesteps      | 6064128     |
| train/                  |             |
|    approx_kl            | 0.011487915 |
|    clip_fraction        | 0.018       |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0265     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.00993     |
|    n_updates            | 29600       |
|    policy_gradient_loss | -0.000512   |
|    value_loss           | 0.0184      |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.8

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 97.4        |
|    ep_rew_mean          | -97.4       |
| time/                   |             |
|    fps                  | 1347        |
|    iterations           | 2971        |
|    time_elapsed         | 4516        |
|    total_timesteps      | 6084608     |
| train/                  |             |
|    approx_kl            | 0.003913716 |
|    clip_fraction        | 0.0204      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0309     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.00614     |
|    n_updates            | 29700       |
|    policy_gradient_loss | 0.0128      |
|    value_loss           | 0.0176      |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97  

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 101          |
|    ep_rew_mean          | -101         |
| time/                   |              |
|    fps                  | 1347         |
|    iterations           | 2981         |
|    time_elapsed         | 4530         |
|    total_timesteps      | 6105088      |
| train/                  |              |
|    approx_kl            | 0.0017005582 |
|    clip_fraction        | 0.0148       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0298      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0041       |
|    n_updates            | 29800        |
|    policy_gradient_loss | -0.00142     |
|    value_loss           | 0.0168       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 96.5         |
|    ep_rew_mean          | -96.5        |
| time/                   |              |
|    fps                  | 1347         |
|    iterations           | 2991         |
|    time_elapsed         | 4544         |
|    total_timesteps      | 6125568      |
| train/                  |              |
|    approx_kl            | 0.0016913463 |
|    clip_fraction        | 0.00996      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0329      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.00588      |
|    n_updates            | 29900        |
|    policy_gradient_loss | 0.00102      |
|    value_loss           | 0.0167       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.2         |
|    ep_rew_mean          | -97.2        |
| time/                   |              |
|    fps                  | 1348         |
|    iterations           | 3001         |
|    time_elapsed         | 4559         |
|    total_timesteps      | 6146048      |
| train/                  |              |
|    approx_kl            | 0.0020544408 |
|    clip_fraction        | 0.00806      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0159      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.00526      |
|    n_updates            | 30000        |
|    policy_gradient_loss | 0.00108      |
|    value_loss           | 0.0159       |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 97.9        |
|    ep_rew_mean          | -97.9       |
| time/                   |             |
|    fps                  | 1348        |
|    iterations           | 3011        |
|    time_elapsed         | 4573        |
|    total_timesteps      | 6166528     |
| train/                  |             |
|    approx_kl            | 0.006352653 |
|    clip_fraction        | 0.0154      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0211     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.00228     |
|    n_updates            | 30100       |
|    policy_gradient_loss | -0.000277   |
|    value_loss           | 0.0141      |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.1

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 101           |
|    ep_rew_mean          | -101          |
| time/                   |               |
|    fps                  | 1348          |
|    iterations           | 3021          |
|    time_elapsed         | 4587          |
|    total_timesteps      | 6187008       |
| train/                  |               |
|    approx_kl            | 0.00094929326 |
|    clip_fraction        | 0.0062        |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0201       |
|    explained_variance   | 0.985         |
|    learning_rate        | 0.0003        |
|    loss                 | 0.166         |
|    n_updates            | 30200         |
|    policy_gradient_loss | -0.000354     |
|    value_loss           | 1.59          |
-------------------------------------------
-----------------------------------------
| rollout/                |       

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 98.3        |
|    ep_rew_mean          | -98.3       |
| time/                   |             |
|    fps                  | 1349        |
|    iterations           | 3031        |
|    time_elapsed         | 4601        |
|    total_timesteps      | 6207488     |
| train/                  |             |
|    approx_kl            | 0.018497031 |
|    clip_fraction        | 0.0215      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0288     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | -0.006      |
|    n_updates            | 30300       |
|    policy_gradient_loss | -0.00409    |
|    value_loss           | 0.0195      |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 97.9  

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.6         |
|    ep_rew_mean          | -98.6        |
| time/                   |              |
|    fps                  | 1349         |
|    iterations           | 3041         |
|    time_elapsed         | 4615         |
|    total_timesteps      | 6227968      |
| train/                  |              |
|    approx_kl            | 0.0046300674 |
|    clip_fraction        | 0.0163       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0321      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.00775      |
|    n_updates            | 30400        |
|    policy_gradient_loss | -0.000745    |
|    value_loss           | 0.0193       |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 99.7        |
|    ep_rew_mean          | -99.7       |
| time/                   |             |
|    fps                  | 1349        |
|    iterations           | 3051        |
|    time_elapsed         | 4629        |
|    total_timesteps      | 6248448     |
| train/                  |             |
|    approx_kl            | 0.018008424 |
|    clip_fraction        | 0.0192      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0174     |
|    explained_variance   | 0.999       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0121      |
|    n_updates            | 30500       |
|    policy_gradient_loss | -0.00136    |
|    value_loss           | 0.0475      |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 101   

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.2         |
|    ep_rew_mean          | -97.2        |
| time/                   |              |
|    fps                  | 1349         |
|    iterations           | 3061         |
|    time_elapsed         | 4644         |
|    total_timesteps      | 6268928      |
| train/                  |              |
|    approx_kl            | 0.0030398124 |
|    clip_fraction        | 0.0139       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.032       |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0188       |
|    n_updates            | 30600        |
|    policy_gradient_loss | 5.02e-05     |
|    value_loss           | 0.0291       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 99            |
|    ep_rew_mean          | -99           |
| time/                   |               |
|    fps                  | 1350          |
|    iterations           | 3071          |
|    time_elapsed         | 4658          |
|    total_timesteps      | 6289408       |
| train/                  |               |
|    approx_kl            | 0.00058800477 |
|    clip_fraction        | 0.0111        |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0375       |
|    explained_variance   | 1             |
|    learning_rate        | 0.0003        |
|    loss                 | 0.00733       |
|    n_updates            | 30700         |
|    policy_gradient_loss | 0.000159      |
|    value_loss           | 0.0168        |
-------------------------------------------
-----------------------------------------
| rollout/                |       

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 98.1          |
|    ep_rew_mean          | -98.1         |
| time/                   |               |
|    fps                  | 1350          |
|    iterations           | 3081          |
|    time_elapsed         | 4672          |
|    total_timesteps      | 6309888       |
| train/                  |               |
|    approx_kl            | 0.00072857365 |
|    clip_fraction        | 0.0111        |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0401       |
|    explained_variance   | 1             |
|    learning_rate        | 0.0003        |
|    loss                 | 0.00659       |
|    n_updates            | 30800         |
|    policy_gradient_loss | 0.00115       |
|    value_loss           | 0.0171        |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.2         |
|    ep_rew_mean          | -99.2        |
| time/                   |              |
|    fps                  | 1350         |
|    iterations           | 3091         |
|    time_elapsed         | 4686         |
|    total_timesteps      | 6330368      |
| train/                  |              |
|    approx_kl            | 0.0031172414 |
|    clip_fraction        | 0.0106       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0217      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.00933      |
|    n_updates            | 30900        |
|    policy_gradient_loss | -0.000451    |
|    value_loss           | 0.0416       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 98.6          |
|    ep_rew_mean          | -98.6         |
| time/                   |               |
|    fps                  | 1351          |
|    iterations           | 3101          |
|    time_elapsed         | 4700          |
|    total_timesteps      | 6350848       |
| train/                  |               |
|    approx_kl            | 0.00068765064 |
|    clip_fraction        | 0.0064        |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0283       |
|    explained_variance   | 0.993         |
|    learning_rate        | 0.0003        |
|    loss                 | 0.0503        |
|    n_updates            | 31000         |
|    policy_gradient_loss | -0.000218     |
|    value_loss           | 0.27          |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.2         |
|    ep_rew_mean          | -99.2        |
| time/                   |              |
|    fps                  | 1351         |
|    iterations           | 3111         |
|    time_elapsed         | 4714         |
|    total_timesteps      | 6371328      |
| train/                  |              |
|    approx_kl            | 0.0062218076 |
|    clip_fraction        | 0.0134       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0274      |
|    explained_variance   | 0.979        |
|    learning_rate        | 0.0003       |
|    loss                 | 1.37         |
|    n_updates            | 31100        |
|    policy_gradient_loss | 0.00435      |
|    value_loss           | 1.95         |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 102           |
|    ep_rew_mean          | -102          |
| time/                   |               |
|    fps                  | 1351          |
|    iterations           | 3121          |
|    time_elapsed         | 4728          |
|    total_timesteps      | 6391808       |
| train/                  |               |
|    approx_kl            | 0.00013361935 |
|    clip_fraction        | 0.00264       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0276       |
|    explained_variance   | 0.988         |
|    learning_rate        | 0.0003        |
|    loss                 | 0.414         |
|    n_updates            | 31200         |
|    policy_gradient_loss | -0.000699     |
|    value_loss           | 1.52          |
-------------------------------------------
------------------------------------------
| rollout/                |      

----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 98.8       |
|    ep_rew_mean          | -98.8      |
| time/                   |            |
|    fps                  | 1351       |
|    iterations           | 3131       |
|    time_elapsed         | 4742       |
|    total_timesteps      | 6412288    |
| train/                  |            |
|    approx_kl            | 0.00298543 |
|    clip_fraction        | 0.0188     |
|    clip_range           | 0.2        |
|    entropy_loss         | -0.0282    |
|    explained_variance   | 1          |
|    learning_rate        | 0.0003     |
|    loss                 | 0.00506    |
|    n_updates            | 31300      |
|    policy_gradient_loss | -0.00128   |
|    value_loss           | 0.0214     |
----------------------------------------
---------------------------------------
| rollout/                |           |
|    ep_len_mean          | 99        |
|    ep_rew_mean   

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 99.5        |
|    ep_rew_mean          | -99.5       |
| time/                   |             |
|    fps                  | 1352        |
|    iterations           | 3141        |
|    time_elapsed         | 4756        |
|    total_timesteps      | 6432768     |
| train/                  |             |
|    approx_kl            | 0.003861913 |
|    clip_fraction        | 0.0112      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0205     |
|    explained_variance   | 0.996       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0616      |
|    n_updates            | 31400       |
|    policy_gradient_loss | -0.00128    |
|    value_loss           | 0.294       |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99  

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.3         |
|    ep_rew_mean          | -98.3        |
| time/                   |              |
|    fps                  | 1352         |
|    iterations           | 3151         |
|    time_elapsed         | 4772         |
|    total_timesteps      | 6453248      |
| train/                  |              |
|    approx_kl            | 0.0017560944 |
|    clip_fraction        | 0.00845      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0179      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0063       |
|    n_updates            | 31500        |
|    policy_gradient_loss | 0.00104      |
|    value_loss           | 0.0152       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.5         |
|    ep_rew_mean          | -99.5        |
| time/                   |              |
|    fps                  | 1352         |
|    iterations           | 3161         |
|    time_elapsed         | 4788         |
|    total_timesteps      | 6473728      |
| train/                  |              |
|    approx_kl            | 0.0017982003 |
|    clip_fraction        | 0.00723      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0196      |
|    explained_variance   | 0.991        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.121        |
|    n_updates            | 31600        |
|    policy_gradient_loss | -0.000134    |
|    value_loss           | 0.462        |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 105          |
|    ep_rew_mean          | -105         |
| time/                   |              |
|    fps                  | 1351         |
|    iterations           | 3171         |
|    time_elapsed         | 4803         |
|    total_timesteps      | 6494208      |
| train/                  |              |
|    approx_kl            | 0.0021341331 |
|    clip_fraction        | 0.00752      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0284      |
|    explained_variance   | 0.993        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.557        |
|    n_updates            | 31700        |
|    policy_gradient_loss | -0.00181     |
|    value_loss           | 0.713        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.8         |
|    ep_rew_mean          | -98.8        |
| time/                   |              |
|    fps                  | 1351         |
|    iterations           | 3181         |
|    time_elapsed         | 4818         |
|    total_timesteps      | 6514688      |
| train/                  |              |
|    approx_kl            | 0.0057481593 |
|    clip_fraction        | 0.013        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0225      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.00192      |
|    n_updates            | 31800        |
|    policy_gradient_loss | 1.77e-05     |
|    value_loss           | 0.0161       |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.2         |
|    ep_rew_mean          | -99.2        |
| time/                   |              |
|    fps                  | 1351         |
|    iterations           | 3191         |
|    time_elapsed         | 4834         |
|    total_timesteps      | 6535168      |
| train/                  |              |
|    approx_kl            | 0.0029207875 |
|    clip_fraction        | 0.0125       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0216      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0119       |
|    n_updates            | 31900        |
|    policy_gradient_loss | 0.000529     |
|    value_loss           | 0.0164       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.7         |
|    ep_rew_mean          | -98.7        |
| time/                   |              |
|    fps                  | 1351         |
|    iterations           | 3201         |
|    time_elapsed         | 4848         |
|    total_timesteps      | 6555648      |
| train/                  |              |
|    approx_kl            | 0.0017642431 |
|    clip_fraction        | 0.0167       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0254      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.00772      |
|    n_updates            | 32000        |
|    policy_gradient_loss | -0.00102     |
|    value_loss           | 0.0172       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.5         |
|    ep_rew_mean          | -98.5        |
| time/                   |              |
|    fps                  | 1351         |
|    iterations           | 3211         |
|    time_elapsed         | 4864         |
|    total_timesteps      | 6576128      |
| train/                  |              |
|    approx_kl            | 0.0029900617 |
|    clip_fraction        | 0.0105       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0198      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.00614      |
|    n_updates            | 32100        |
|    policy_gradient_loss | 0.00282      |
|    value_loss           | 0.0527       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 105          |
|    ep_rew_mean          | -105         |
| time/                   |              |
|    fps                  | 1352         |
|    iterations           | 3221         |
|    time_elapsed         | 4878         |
|    total_timesteps      | 6596608      |
| train/                  |              |
|    approx_kl            | 0.0010142275 |
|    clip_fraction        | 0.00874      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0263      |
|    explained_variance   | 0.982        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.481        |
|    n_updates            | 32200        |
|    policy_gradient_loss | -0.00132     |
|    value_loss           | 1.78         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.1         |
|    ep_rew_mean          | -99.1        |
| time/                   |              |
|    fps                  | 1352         |
|    iterations           | 3231         |
|    time_elapsed         | 4893         |
|    total_timesteps      | 6617088      |
| train/                  |              |
|    approx_kl            | 0.0046940856 |
|    clip_fraction        | 0.0128       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0209      |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0191       |
|    n_updates            | 32300        |
|    policy_gradient_loss | 0.00024      |
|    value_loss           | 0.061        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.4         |
|    ep_rew_mean          | -98.4        |
| time/                   |              |
|    fps                  | 1352         |
|    iterations           | 3241         |
|    time_elapsed         | 4907         |
|    total_timesteps      | 6637568      |
| train/                  |              |
|    approx_kl            | 0.0011673414 |
|    clip_fraction        | 0.00879      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.031       |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0199       |
|    n_updates            | 32400        |
|    policy_gradient_loss | -0.000566    |
|    value_loss           | 0.0248       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 100           |
|    ep_rew_mean          | -100          |
| time/                   |               |
|    fps                  | 1352          |
|    iterations           | 3251          |
|    time_elapsed         | 4922          |
|    total_timesteps      | 6658048       |
| train/                  |               |
|    approx_kl            | 0.00053713424 |
|    clip_fraction        | 0.0064        |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0175       |
|    explained_variance   | 1             |
|    learning_rate        | 0.0003        |
|    loss                 | 0.0117        |
|    n_updates            | 32500         |
|    policy_gradient_loss | 0.000572      |
|    value_loss           | 0.0321        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.5         |
|    ep_rew_mean          | -99.5        |
| time/                   |              |
|    fps                  | 1352         |
|    iterations           | 3261         |
|    time_elapsed         | 4938         |
|    total_timesteps      | 6678528      |
| train/                  |              |
|    approx_kl            | 0.0015232823 |
|    clip_fraction        | 0.00913      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0256      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0151       |
|    n_updates            | 32600        |
|    policy_gradient_loss | -0.000103    |
|    value_loss           | 0.0219       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.9         |
|    ep_rew_mean          | -97.9        |
| time/                   |              |
|    fps                  | 1351         |
|    iterations           | 3271         |
|    time_elapsed         | 4956         |
|    total_timesteps      | 6699008      |
| train/                  |              |
|    approx_kl            | 0.0004429055 |
|    clip_fraction        | 0.00493      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0198      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0105       |
|    n_updates            | 32700        |
|    policy_gradient_loss | -8.72e-05    |
|    value_loss           | 0.0165       |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 98.7          |
|    ep_rew_mean          | -98.7         |
| time/                   |               |
|    fps                  | 1351          |
|    iterations           | 3281          |
|    time_elapsed         | 4973          |
|    total_timesteps      | 6719488       |
| train/                  |               |
|    approx_kl            | 0.00073606963 |
|    clip_fraction        | 0.0116        |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0192       |
|    explained_variance   | 1             |
|    learning_rate        | 0.0003        |
|    loss                 | 0.000193      |
|    n_updates            | 32800         |
|    policy_gradient_loss | -0.000517     |
|    value_loss           | 0.0189        |
-------------------------------------------
------------------------------------------
| rollout/                |      

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 99.3        |
|    ep_rew_mean          | -99.3       |
| time/                   |             |
|    fps                  | 1351        |
|    iterations           | 3291        |
|    time_elapsed         | 4988        |
|    total_timesteps      | 6739968     |
| train/                  |             |
|    approx_kl            | 0.004934682 |
|    clip_fraction        | 0.0101      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0194     |
|    explained_variance   | 0.994       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0931      |
|    n_updates            | 32900       |
|    policy_gradient_loss | -0.000803   |
|    value_loss           | 0.252       |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 100 

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 100          |
|    ep_rew_mean          | -100         |
| time/                   |              |
|    fps                  | 1350         |
|    iterations           | 3301         |
|    time_elapsed         | 5004         |
|    total_timesteps      | 6760448      |
| train/                  |              |
|    approx_kl            | 0.0007831594 |
|    clip_fraction        | 0.0118       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0199      |
|    explained_variance   | 0.995        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.244        |
|    n_updates            | 33000        |
|    policy_gradient_loss | 0.00114      |
|    value_loss           | 1.27         |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 97.4        |
|    ep_rew_mean          | -97.4       |
| time/                   |             |
|    fps                  | 1350        |
|    iterations           | 3311        |
|    time_elapsed         | 5019        |
|    total_timesteps      | 6780928     |
| train/                  |             |
|    approx_kl            | 0.004953128 |
|    clip_fraction        | 0.0131      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0196     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.00438     |
|    n_updates            | 33100       |
|    policy_gradient_loss | -0.00109    |
|    value_loss           | 0.022       |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 99.5  

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 99.5        |
|    ep_rew_mean          | -99.5       |
| time/                   |             |
|    fps                  | 1350        |
|    iterations           | 3321        |
|    time_elapsed         | 5034        |
|    total_timesteps      | 6801408     |
| train/                  |             |
|    approx_kl            | 0.002054697 |
|    clip_fraction        | 0.0126      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0244     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.00885     |
|    n_updates            | 33200       |
|    policy_gradient_loss | 0.00209     |
|    value_loss           | 0.0465      |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.3

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 116           |
|    ep_rew_mean          | -116          |
| time/                   |               |
|    fps                  | 1350          |
|    iterations           | 3331          |
|    time_elapsed         | 5049          |
|    total_timesteps      | 6821888       |
| train/                  |               |
|    approx_kl            | 0.00069220737 |
|    clip_fraction        | 0.00605       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0434       |
|    explained_variance   | 0.96          |
|    learning_rate        | 0.0003        |
|    loss                 | 3.95          |
|    n_updates            | 33300         |
|    policy_gradient_loss | -0.00198      |
|    value_loss           | 9.86          |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 105          |
|    ep_rew_mean          | -105         |
| time/                   |              |
|    fps                  | 1350         |
|    iterations           | 3341         |
|    time_elapsed         | 5065         |
|    total_timesteps      | 6842368      |
| train/                  |              |
|    approx_kl            | 0.0027657833 |
|    clip_fraction        | 0.00781      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0224      |
|    explained_variance   | 0.988        |
|    learning_rate        | 0.0003       |
|    loss                 | 3.4          |
|    n_updates            | 33400        |
|    policy_gradient_loss | -0.000476    |
|    value_loss           | 1.9          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 100          |
|    ep_rew_mean          | -100         |
| time/                   |              |
|    fps                  | 1350         |
|    iterations           | 3351         |
|    time_elapsed         | 5080         |
|    total_timesteps      | 6862848      |
| train/                  |              |
|    approx_kl            | 0.0010190124 |
|    clip_fraction        | 0.00874      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0211      |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0426       |
|    n_updates            | 33500        |
|    policy_gradient_loss | 0.00157      |
|    value_loss           | 0.0511       |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 99          |
|    ep_rew_mean          | -99         |
| time/                   |             |
|    fps                  | 1350        |
|    iterations           | 3361        |
|    time_elapsed         | 5095        |
|    total_timesteps      | 6883328     |
| train/                  |             |
|    approx_kl            | 0.004914986 |
|    clip_fraction        | 0.0164      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0362     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0146      |
|    n_updates            | 33600       |
|    policy_gradient_loss | 4.14e-05    |
|    value_loss           | 0.0216      |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.6

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 99          |
|    ep_rew_mean          | -99         |
| time/                   |             |
|    fps                  | 1350        |
|    iterations           | 3371        |
|    time_elapsed         | 5110        |
|    total_timesteps      | 6903808     |
| train/                  |             |
|    approx_kl            | 0.006807981 |
|    clip_fraction        | 0.0209      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0434     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.00793     |
|    n_updates            | 33700       |
|    policy_gradient_loss | 0.00123     |
|    value_loss           | 0.024       |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.1

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 108           |
|    ep_rew_mean          | -108          |
| time/                   |               |
|    fps                  | 1350          |
|    iterations           | 3381          |
|    time_elapsed         | 5127          |
|    total_timesteps      | 6924288       |
| train/                  |               |
|    approx_kl            | 0.00053936464 |
|    clip_fraction        | 0.00391       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0335       |
|    explained_variance   | 0.986         |
|    learning_rate        | 0.0003        |
|    loss                 | 0.622         |
|    n_updates            | 33800         |
|    policy_gradient_loss | -0.000961     |
|    value_loss           | 2.55          |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 101          |
|    ep_rew_mean          | -101         |
| time/                   |              |
|    fps                  | 1350         |
|    iterations           | 3391         |
|    time_elapsed         | 5144         |
|    total_timesteps      | 6944768      |
| train/                  |              |
|    approx_kl            | 0.0030470039 |
|    clip_fraction        | 0.017        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0327      |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0466       |
|    n_updates            | 33900        |
|    policy_gradient_loss | 0.00114      |
|    value_loss           | 0.0705       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.3         |
|    ep_rew_mean          | -98.3        |
| time/                   |              |
|    fps                  | 1350         |
|    iterations           | 3401         |
|    time_elapsed         | 5159         |
|    total_timesteps      | 6965248      |
| train/                  |              |
|    approx_kl            | 0.0020210585 |
|    clip_fraction        | 0.0124       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0327      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.012        |
|    n_updates            | 34000        |
|    policy_gradient_loss | 0.00076      |
|    value_loss           | 0.0299       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99           |
|    ep_rew_mean          | -99          |
| time/                   |              |
|    fps                  | 1350         |
|    iterations           | 3411         |
|    time_elapsed         | 5173         |
|    total_timesteps      | 6985728      |
| train/                  |              |
|    approx_kl            | 0.0031200894 |
|    clip_fraction        | 0.0176       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0304      |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.013        |
|    n_updates            | 34100        |
|    policy_gradient_loss | 0.000778     |
|    value_loss           | 0.0455       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 105           |
|    ep_rew_mean          | -105          |
| time/                   |               |
|    fps                  | 1350          |
|    iterations           | 3421          |
|    time_elapsed         | 5187          |
|    total_timesteps      | 7006208       |
| train/                  |               |
|    approx_kl            | 0.00037264862 |
|    clip_fraction        | 0.00552       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0473       |
|    explained_variance   | 0.961         |
|    learning_rate        | 0.0003        |
|    loss                 | 0.455         |
|    n_updates            | 34200         |
|    policy_gradient_loss | 0.000488      |
|    value_loss           | 5.21          |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 104          |
|    ep_rew_mean          | -104         |
| time/                   |              |
|    fps                  | 1350         |
|    iterations           | 3431         |
|    time_elapsed         | 5202         |
|    total_timesteps      | 7026688      |
| train/                  |              |
|    approx_kl            | 0.0015450497 |
|    clip_fraction        | 0.0161       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0402      |
|    explained_variance   | 0.991        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.302        |
|    n_updates            | 34300        |
|    policy_gradient_loss | 0.00367      |
|    value_loss           | 1.38         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.1         |
|    ep_rew_mean          | -99.1        |
| time/                   |              |
|    fps                  | 1350         |
|    iterations           | 3441         |
|    time_elapsed         | 5217         |
|    total_timesteps      | 7047168      |
| train/                  |              |
|    approx_kl            | 0.0019028976 |
|    clip_fraction        | 0.0268       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0436      |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0116       |
|    n_updates            | 34400        |
|    policy_gradient_loss | -0.000957    |
|    value_loss           | 0.0461       |
------------------------------------------
----------------------------------------
| rollout/                |            |
|    ep_len_mea

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 118          |
|    ep_rew_mean          | -118         |
| time/                   |              |
|    fps                  | 1350         |
|    iterations           | 3451         |
|    time_elapsed         | 5231         |
|    total_timesteps      | 7067648      |
| train/                  |              |
|    approx_kl            | 0.0012681498 |
|    clip_fraction        | 0.0118       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0411      |
|    explained_variance   | 0.977        |
|    learning_rate        | 0.0003       |
|    loss                 | 1.79         |
|    n_updates            | 34500        |
|    policy_gradient_loss | -0.00181     |
|    value_loss           | 3.54         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 100          |
|    ep_rew_mean          | -100         |
| time/                   |              |
|    fps                  | 1351         |
|    iterations           | 3461         |
|    time_elapsed         | 5245         |
|    total_timesteps      | 7088128      |
| train/                  |              |
|    approx_kl            | 0.0005388857 |
|    clip_fraction        | 0.00713      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0368      |
|    explained_variance   | 0.965        |
|    learning_rate        | 0.0003       |
|    loss                 | 2.52         |
|    n_updates            | 34600        |
|    policy_gradient_loss | 0.00115      |
|    value_loss           | 4.82         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 102        |
|    ep_rew_mean          | -102       |
| time/                   |            |
|    fps                  | 1351       |
|    iterations           | 3471       |
|    time_elapsed         | 5260       |
|    total_timesteps      | 7108608    |
| train/                  |            |
|    approx_kl            | 0.00099437 |
|    clip_fraction        | 0.0107     |
|    clip_range           | 0.2        |
|    entropy_loss         | -0.0311    |
|    explained_variance   | 0.991      |
|    learning_rate        | 0.0003     |
|    loss                 | 0.114      |
|    n_updates            | 34700      |
|    policy_gradient_loss | -0.000738  |
|    value_loss           | 0.511      |
----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 101          |
|    ep_re

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 98.8        |
|    ep_rew_mean          | -98.8       |
| time/                   |             |
|    fps                  | 1351        |
|    iterations           | 3481        |
|    time_elapsed         | 5274        |
|    total_timesteps      | 7129088     |
| train/                  |             |
|    approx_kl            | 0.002064458 |
|    clip_fraction        | 0.0146      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0393     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.011       |
|    n_updates            | 34800       |
|    policy_gradient_loss | 0.000394    |
|    value_loss           | 0.0274      |
-----------------------------------------
----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 98.6    

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 101          |
|    ep_rew_mean          | -101         |
| time/                   |              |
|    fps                  | 1351         |
|    iterations           | 3491         |
|    time_elapsed         | 5288         |
|    total_timesteps      | 7149568      |
| train/                  |              |
|    approx_kl            | 0.0029811626 |
|    clip_fraction        | 0.00728      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0377      |
|    explained_variance   | 0.994        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.236        |
|    n_updates            | 34900        |
|    policy_gradient_loss | -0.000704    |
|    value_loss           | 0.376        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 101          |
|    ep_rew_mean          | -101         |
| time/                   |              |
|    fps                  | 1351         |
|    iterations           | 3501         |
|    time_elapsed         | 5304         |
|    total_timesteps      | 7170048      |
| train/                  |              |
|    approx_kl            | 0.0035184012 |
|    clip_fraction        | 0.00923      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0287      |
|    explained_variance   | 0.995        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0464       |
|    n_updates            | 35000        |
|    policy_gradient_loss | -0.000657    |
|    value_loss           | 0.224        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 98.4        |
|    ep_rew_mean          | -98.4       |
| time/                   |             |
|    fps                  | 1352        |
|    iterations           | 3511        |
|    time_elapsed         | 5318        |
|    total_timesteps      | 7190528     |
| train/                  |             |
|    approx_kl            | 0.008198865 |
|    clip_fraction        | 0.0229      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.039      |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.00461     |
|    n_updates            | 35100       |
|    policy_gradient_loss | 0.0112      |
|    value_loss           | 0.0297      |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 101   

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 118          |
|    ep_rew_mean          | -118         |
| time/                   |              |
|    fps                  | 1352         |
|    iterations           | 3521         |
|    time_elapsed         | 5332         |
|    total_timesteps      | 7211008      |
| train/                  |              |
|    approx_kl            | 0.0025393358 |
|    clip_fraction        | 0.0226       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0449      |
|    explained_variance   | 0.993        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.519        |
|    n_updates            | 35200        |
|    policy_gradient_loss | -0.000679    |
|    value_loss           | 1.29         |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 100          |
|    ep_rew_mean          | -100         |
| time/                   |              |
|    fps                  | 1352         |
|    iterations           | 3531         |
|    time_elapsed         | 5346         |
|    total_timesteps      | 7231488      |
| train/                  |              |
|    approx_kl            | 0.0032418997 |
|    clip_fraction        | 0.0128       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0351      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0135       |
|    n_updates            | 35300        |
|    policy_gradient_loss | -0.00123     |
|    value_loss           | 0.0517       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 102          |
|    ep_rew_mean          | -102         |
| time/                   |              |
|    fps                  | 1352         |
|    iterations           | 3541         |
|    time_elapsed         | 5360         |
|    total_timesteps      | 7251968      |
| train/                  |              |
|    approx_kl            | 0.0012042345 |
|    clip_fraction        | 0.004        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0294      |
|    explained_variance   | 0.992        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.15         |
|    n_updates            | 35400        |
|    policy_gradient_loss | 0.00103      |
|    value_loss           | 0.73         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 101          |
|    ep_rew_mean          | -101         |
| time/                   |              |
|    fps                  | 1353         |
|    iterations           | 3551         |
|    time_elapsed         | 5374         |
|    total_timesteps      | 7272448      |
| train/                  |              |
|    approx_kl            | 0.0042707482 |
|    clip_fraction        | 0.0102       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0334      |
|    explained_variance   | 0.997        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.033        |
|    n_updates            | 35500        |
|    policy_gradient_loss | 0.00051      |
|    value_loss           | 0.151        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.7         |
|    ep_rew_mean          | -97.7        |
| time/                   |              |
|    fps                  | 1353         |
|    iterations           | 3561         |
|    time_elapsed         | 5389         |
|    total_timesteps      | 7292928      |
| train/                  |              |
|    approx_kl            | 0.0011674846 |
|    clip_fraction        | 0.0128       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0342      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0206       |
|    n_updates            | 35600        |
|    policy_gradient_loss | -0.000264    |
|    value_loss           | 0.0379       |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 105          |
|    ep_rew_mean          | -105         |
| time/                   |              |
|    fps                  | 1353         |
|    iterations           | 3571         |
|    time_elapsed         | 5403         |
|    total_timesteps      | 7313408      |
| train/                  |              |
|    approx_kl            | 0.0057325386 |
|    clip_fraction        | 0.0146       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0317      |
|    explained_variance   | 0.996        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.26         |
|    n_updates            | 35700        |
|    policy_gradient_loss | -0.000478    |
|    value_loss           | 1.13         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.4         |
|    ep_rew_mean          | -99.4        |
| time/                   |              |
|    fps                  | 1353         |
|    iterations           | 3581         |
|    time_elapsed         | 5417         |
|    total_timesteps      | 7333888      |
| train/                  |              |
|    approx_kl            | 0.0004635207 |
|    clip_fraction        | 0.00767      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0443      |
|    explained_variance   | 0.996        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0539       |
|    n_updates            | 35800        |
|    policy_gradient_loss | -0.000145    |
|    value_loss           | 0.129        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 101          |
|    ep_rew_mean          | -101         |
| time/                   |              |
|    fps                  | 1353         |
|    iterations           | 3591         |
|    time_elapsed         | 5431         |
|    total_timesteps      | 7354368      |
| train/                  |              |
|    approx_kl            | 0.0007795443 |
|    clip_fraction        | 0.00332      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0412      |
|    explained_variance   | 0.973        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.134        |
|    n_updates            | 35900        |
|    policy_gradient_loss | 0.000565     |
|    value_loss           | 2.58         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 98.8        |
|    ep_rew_mean          | -98.8       |
| time/                   |             |
|    fps                  | 1354        |
|    iterations           | 3601        |
|    time_elapsed         | 5445        |
|    total_timesteps      | 7374848     |
| train/                  |             |
|    approx_kl            | 0.000762834 |
|    clip_fraction        | 0.0138      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.04       |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0199      |
|    n_updates            | 36000       |
|    policy_gradient_loss | -0.00145    |
|    value_loss           | 0.037       |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.3

----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 99.7       |
|    ep_rew_mean          | -99.7      |
| time/                   |            |
|    fps                  | 1354       |
|    iterations           | 3611       |
|    time_elapsed         | 5459       |
|    total_timesteps      | 7395328    |
| train/                  |            |
|    approx_kl            | 0.01590341 |
|    clip_fraction        | 0.00684    |
|    clip_range           | 0.2        |
|    entropy_loss         | -0.0302    |
|    explained_variance   | 0.993      |
|    learning_rate        | 0.0003     |
|    loss                 | 0.0474     |
|    n_updates            | 36100      |
|    policy_gradient_loss | -0.000928  |
|    value_loss           | 0.358      |
----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 102          |
|    ep_re

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 97.7        |
|    ep_rew_mean          | -97.7       |
| time/                   |             |
|    fps                  | 1354        |
|    iterations           | 3621        |
|    time_elapsed         | 5473        |
|    total_timesteps      | 7415808     |
| train/                  |             |
|    approx_kl            | 0.004397112 |
|    clip_fraction        | 0.0138      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.029      |
|    explained_variance   | 0.999       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0132      |
|    n_updates            | 36200       |
|    policy_gradient_loss | 0.00258     |
|    value_loss           | 0.0482      |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.5

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.9         |
|    ep_rew_mean          | -98.9        |
| time/                   |              |
|    fps                  | 1355         |
|    iterations           | 3631         |
|    time_elapsed         | 5488         |
|    total_timesteps      | 7436288      |
| train/                  |              |
|    approx_kl            | 0.0017467686 |
|    clip_fraction        | 0.0135       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0368      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0138       |
|    n_updates            | 36300        |
|    policy_gradient_loss | 0.000679     |
|    value_loss           | 0.0343       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 101          |
|    ep_rew_mean          | -101         |
| time/                   |              |
|    fps                  | 1355         |
|    iterations           | 3641         |
|    time_elapsed         | 5502         |
|    total_timesteps      | 7456768      |
| train/                  |              |
|    approx_kl            | 0.0012512107 |
|    clip_fraction        | 0.00889      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0384      |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0139       |
|    n_updates            | 36400        |
|    policy_gradient_loss | 0.000106     |
|    value_loss           | 0.0512       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 100          |
|    ep_rew_mean          | -100         |
| time/                   |              |
|    fps                  | 1355         |
|    iterations           | 3651         |
|    time_elapsed         | 5516         |
|    total_timesteps      | 7477248      |
| train/                  |              |
|    approx_kl            | 0.0061648088 |
|    clip_fraction        | 0.0221       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0384      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0104       |
|    n_updates            | 36500        |
|    policy_gradient_loss | -0.000689    |
|    value_loss           | 0.0236       |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.3         |
|    ep_rew_mean          | -99.3        |
| time/                   |              |
|    fps                  | 1355         |
|    iterations           | 3661         |
|    time_elapsed         | 5530         |
|    total_timesteps      | 7497728      |
| train/                  |              |
|    approx_kl            | 0.0004259007 |
|    clip_fraction        | 0.00405      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0412      |
|    explained_variance   | 0.995        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.143        |
|    n_updates            | 36600        |
|    policy_gradient_loss | 0.000646     |
|    value_loss           | 0.691        |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.5         |
|    ep_rew_mean          | -99.5        |
| time/                   |              |
|    fps                  | 1356         |
|    iterations           | 3671         |
|    time_elapsed         | 5544         |
|    total_timesteps      | 7518208      |
| train/                  |              |
|    approx_kl            | 0.0019781296 |
|    clip_fraction        | 0.00488      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0241      |
|    explained_variance   | 0.995        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.445        |
|    n_updates            | 36700        |
|    policy_gradient_loss | -0.000424    |
|    value_loss           | 1.28         |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 97.3       |
|    ep_rew_mean          | -97.3      |
| time/                   |            |
|    fps                  | 1356       |
|    iterations           | 3681       |
|    time_elapsed         | 5558       |
|    total_timesteps      | 7538688    |
| train/                  |            |
|    approx_kl            | 0.04067584 |
|    clip_fraction        | 0.039      |
|    clip_range           | 0.2        |
|    entropy_loss         | -0.0388    |
|    explained_variance   | 1          |
|    learning_rate        | 0.0003     |
|    loss                 | -0.028     |
|    n_updates            | 36800      |
|    policy_gradient_loss | -0.00321   |
|    value_loss           | 0.0211     |
----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.9         |
|    ep_re

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 97.8        |
|    ep_rew_mean          | -97.8       |
| time/                   |             |
|    fps                  | 1356        |
|    iterations           | 3691        |
|    time_elapsed         | 5572        |
|    total_timesteps      | 7559168     |
| train/                  |             |
|    approx_kl            | 0.025502147 |
|    clip_fraction        | 0.0208      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0265     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | -0.00211    |
|    n_updates            | 36900       |
|    policy_gradient_loss | -0.000884   |
|    value_loss           | 0.021       |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.1

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 102          |
|    ep_rew_mean          | -102         |
| time/                   |              |
|    fps                  | 1356         |
|    iterations           | 3701         |
|    time_elapsed         | 5586         |
|    total_timesteps      | 7579648      |
| train/                  |              |
|    approx_kl            | 0.0006760922 |
|    clip_fraction        | 0.00508      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.031       |
|    explained_variance   | 0.993        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.19         |
|    n_updates            | 37000        |
|    policy_gradient_loss | -0.000919    |
|    value_loss           | 1.51         |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 104          |
|    ep_rew_mean          | -104         |
| time/                   |              |
|    fps                  | 1357         |
|    iterations           | 3711         |
|    time_elapsed         | 5600         |
|    total_timesteps      | 7600128      |
| train/                  |              |
|    approx_kl            | 0.0008973062 |
|    clip_fraction        | 0.00693      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0222      |
|    explained_variance   | 0.968        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.131        |
|    n_updates            | 37100        |
|    policy_gradient_loss | -0.000474    |
|    value_loss           | 1.52         |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 98.5        |
|    ep_rew_mean          | -98.5       |
| time/                   |             |
|    fps                  | 1357        |
|    iterations           | 3721        |
|    time_elapsed         | 5614        |
|    total_timesteps      | 7620608     |
| train/                  |             |
|    approx_kl            | 0.000685244 |
|    clip_fraction        | 0.0135      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0376     |
|    explained_variance   | 0.999       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0165      |
|    n_updates            | 37200       |
|    policy_gradient_loss | -0.000503   |
|    value_loss           | 0.0463      |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.5

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 108          |
|    ep_rew_mean          | -108         |
| time/                   |              |
|    fps                  | 1357         |
|    iterations           | 3731         |
|    time_elapsed         | 5628         |
|    total_timesteps      | 7641088      |
| train/                  |              |
|    approx_kl            | 0.0046598027 |
|    clip_fraction        | 0.0157       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0391      |
|    explained_variance   | 0.977        |
|    learning_rate        | 0.0003       |
|    loss                 | 5.23         |
|    n_updates            | 37300        |
|    policy_gradient_loss | -0.00324     |
|    value_loss           | 7.64         |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.6         |
|    ep_rew_mean          | -99.6        |
| time/                   |              |
|    fps                  | 1357         |
|    iterations           | 3741         |
|    time_elapsed         | 5642         |
|    total_timesteps      | 7661568      |
| train/                  |              |
|    approx_kl            | 0.0014382779 |
|    clip_fraction        | 0.0121       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0285      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.042        |
|    n_updates            | 37400        |
|    policy_gradient_loss | -0.000964    |
|    value_loss           | 0.0282       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 96.5         |
|    ep_rew_mean          | -96.5        |
| time/                   |              |
|    fps                  | 1358         |
|    iterations           | 3751         |
|    time_elapsed         | 5656         |
|    total_timesteps      | 7682048      |
| train/                  |              |
|    approx_kl            | 0.0020480813 |
|    clip_fraction        | 0.0154       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0274      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.00149      |
|    n_updates            | 37500        |
|    policy_gradient_loss | -0.00128     |
|    value_loss           | 0.022        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 98.5          |
|    ep_rew_mean          | -98.5         |
| time/                   |               |
|    fps                  | 1358          |
|    iterations           | 3761          |
|    time_elapsed         | 5670          |
|    total_timesteps      | 7702528       |
| train/                  |               |
|    approx_kl            | 0.00094826956 |
|    clip_fraction        | 0.0114        |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0329       |
|    explained_variance   | 0.993         |
|    learning_rate        | 0.0003        |
|    loss                 | 0.065         |
|    n_updates            | 37600         |
|    policy_gradient_loss | -0.00122      |
|    value_loss           | 0.343         |
-------------------------------------------
-----------------------------------------
| rollout/                |       

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 100          |
|    ep_rew_mean          | -100         |
| time/                   |              |
|    fps                  | 1358         |
|    iterations           | 3771         |
|    time_elapsed         | 5684         |
|    total_timesteps      | 7723008      |
| train/                  |              |
|    approx_kl            | 0.0016202256 |
|    clip_fraction        | 0.0109       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0294      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0154       |
|    n_updates            | 37700        |
|    policy_gradient_loss | -0.000641    |
|    value_loss           | 0.0347       |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 98.2          |
|    ep_rew_mean          | -98.2         |
| time/                   |               |
|    fps                  | 1358          |
|    iterations           | 3781          |
|    time_elapsed         | 5698          |
|    total_timesteps      | 7743488       |
| train/                  |               |
|    approx_kl            | 0.00040464272 |
|    clip_fraction        | 0.00386       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0283       |
|    explained_variance   | 0.972         |
|    learning_rate        | 0.0003        |
|    loss                 | 0.166         |
|    n_updates            | 37800         |
|    policy_gradient_loss | -0.00124      |
|    value_loss           | 2.84          |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 103          |
|    ep_rew_mean          | -103         |
| time/                   |              |
|    fps                  | 1358         |
|    iterations           | 3791         |
|    time_elapsed         | 5713         |
|    total_timesteps      | 7763968      |
| train/                  |              |
|    approx_kl            | 0.0007700812 |
|    clip_fraction        | 0.00659      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0414      |
|    explained_variance   | 0.979        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.396        |
|    n_updates            | 37900        |
|    policy_gradient_loss | -0.0018      |
|    value_loss           | 1.22         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 119          |
|    ep_rew_mean          | -119         |
| time/                   |              |
|    fps                  | 1359         |
|    iterations           | 3801         |
|    time_elapsed         | 5727         |
|    total_timesteps      | 7784448      |
| train/                  |              |
|    approx_kl            | 0.0009800997 |
|    clip_fraction        | 0.0152       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0596      |
|    explained_variance   | 0.955        |
|    learning_rate        | 0.0003       |
|    loss                 | 2.65         |
|    n_updates            | 38000        |
|    policy_gradient_loss | -0.00374     |
|    value_loss           | 10.8         |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 101          |
|    ep_rew_mean          | -101         |
| time/                   |              |
|    fps                  | 1359         |
|    iterations           | 3811         |
|    time_elapsed         | 5741         |
|    total_timesteps      | 7804928      |
| train/                  |              |
|    approx_kl            | 0.0038160014 |
|    clip_fraction        | 0.016        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0606      |
|    explained_variance   | 0.997        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.043        |
|    n_updates            | 38100        |
|    policy_gradient_loss | 0.00147      |
|    value_loss           | 0.174        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 100          |
|    ep_rew_mean          | -100         |
| time/                   |              |
|    fps                  | 1359         |
|    iterations           | 3821         |
|    time_elapsed         | 5755         |
|    total_timesteps      | 7825408      |
| train/                  |              |
|    approx_kl            | 0.0049580256 |
|    clip_fraction        | 0.0194       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0387      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0135       |
|    n_updates            | 38200        |
|    policy_gradient_loss | -0.000725    |
|    value_loss           | 0.0237       |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.7         |
|    ep_rew_mean          | -98.7        |
| time/                   |              |
|    fps                  | 1359         |
|    iterations           | 3831         |
|    time_elapsed         | 5769         |
|    total_timesteps      | 7845888      |
| train/                  |              |
|    approx_kl            | 0.0017039914 |
|    clip_fraction        | 0.00845      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0233      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.014        |
|    n_updates            | 38300        |
|    policy_gradient_loss | 4.64e-05     |
|    value_loss           | 0.0261       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 102         |
|    ep_rew_mean          | -102        |
| time/                   |             |
|    fps                  | 1360        |
|    iterations           | 3841        |
|    time_elapsed         | 5783        |
|    total_timesteps      | 7866368     |
| train/                  |             |
|    approx_kl            | 0.010879904 |
|    clip_fraction        | 0.0275      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.031      |
|    explained_variance   | 0.999       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0277      |
|    n_updates            | 38400       |
|    policy_gradient_loss | 0.00115     |
|    value_loss           | 0.0531      |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 101   

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 104           |
|    ep_rew_mean          | -104          |
| time/                   |               |
|    fps                  | 1360          |
|    iterations           | 3851          |
|    time_elapsed         | 5797          |
|    total_timesteps      | 7886848       |
| train/                  |               |
|    approx_kl            | 0.00089324324 |
|    clip_fraction        | 0.00723       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0305       |
|    explained_variance   | 0.984         |
|    learning_rate        | 0.0003        |
|    loss                 | 0.692         |
|    n_updates            | 38500         |
|    policy_gradient_loss | -1.46e-05     |
|    value_loss           | 3.94          |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 99.5          |
|    ep_rew_mean          | -99.5         |
| time/                   |               |
|    fps                  | 1360          |
|    iterations           | 3861          |
|    time_elapsed         | 5813          |
|    total_timesteps      | 7907328       |
| train/                  |               |
|    approx_kl            | 0.00036322034 |
|    clip_fraction        | 0.0064        |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0231       |
|    explained_variance   | 0.986         |
|    learning_rate        | 0.0003        |
|    loss                 | 0.634         |
|    n_updates            | 38600         |
|    policy_gradient_loss | 0.00035       |
|    value_loss           | 1.83          |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 104           |
|    ep_rew_mean          | -104          |
| time/                   |               |
|    fps                  | 1360          |
|    iterations           | 3871          |
|    time_elapsed         | 5827          |
|    total_timesteps      | 7927808       |
| train/                  |               |
|    approx_kl            | 0.00014072863 |
|    clip_fraction        | 0.00469       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0191       |
|    explained_variance   | 0.988         |
|    learning_rate        | 0.0003        |
|    loss                 | 0.626         |
|    n_updates            | 38700         |
|    policy_gradient_loss | 0.000483      |
|    value_loss           | 1.66          |
-------------------------------------------
-----------------------------------------
| rollout/                |       

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.1         |
|    ep_rew_mean          | -98.1        |
| time/                   |              |
|    fps                  | 1360         |
|    iterations           | 3881         |
|    time_elapsed         | 5842         |
|    total_timesteps      | 7948288      |
| train/                  |              |
|    approx_kl            | 0.0016590416 |
|    clip_fraction        | 0.0116       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0298      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0123       |
|    n_updates            | 38800        |
|    policy_gradient_loss | 0.000393     |
|    value_loss           | 0.0231       |
------------------------------------------
----------------------------------------
| rollout/                |            |
|    ep_len_mea

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99           |
|    ep_rew_mean          | -99          |
| time/                   |              |
|    fps                  | 1360         |
|    iterations           | 3891         |
|    time_elapsed         | 5856         |
|    total_timesteps      | 7968768      |
| train/                  |              |
|    approx_kl            | 0.0034649184 |
|    clip_fraction        | 0.0083       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0229      |
|    explained_variance   | 0.993        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0399       |
|    n_updates            | 38900        |
|    policy_gradient_loss | -0.00168     |
|    value_loss           | 0.435        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 100          |
|    ep_rew_mean          | -100         |
| time/                   |              |
|    fps                  | 1360         |
|    iterations           | 3901         |
|    time_elapsed         | 5871         |
|    total_timesteps      | 7989248      |
| train/                  |              |
|    approx_kl            | 0.0005076316 |
|    clip_fraction        | 0.00513      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0262      |
|    explained_variance   | 0.995        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0428       |
|    n_updates            | 39000        |
|    policy_gradient_loss | 0.000493     |
|    value_loss           | 0.185        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.3         |
|    ep_rew_mean          | -97.3        |
| time/                   |              |
|    fps                  | 1360         |
|    iterations           | 3911         |
|    time_elapsed         | 5885         |
|    total_timesteps      | 8009728      |
| train/                  |              |
|    approx_kl            | 0.0009901942 |
|    clip_fraction        | 0.00937      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0207      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0065       |
|    n_updates            | 39100        |
|    policy_gradient_loss | -0.000266    |
|    value_loss           | 0.0182       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.3         |
|    ep_rew_mean          | -98.3        |
| time/                   |              |
|    fps                  | 1361         |
|    iterations           | 3921         |
|    time_elapsed         | 5899         |
|    total_timesteps      | 8030208      |
| train/                  |              |
|    approx_kl            | 0.0013565349 |
|    clip_fraction        | 0.0118       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.021       |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0272       |
|    n_updates            | 39200        |
|    policy_gradient_loss | 5.75e-05     |
|    value_loss           | 0.0244       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 97.1        |
|    ep_rew_mean          | -97.1       |
| time/                   |             |
|    fps                  | 1361        |
|    iterations           | 3931        |
|    time_elapsed         | 5913        |
|    total_timesteps      | 8050688     |
| train/                  |             |
|    approx_kl            | 0.004918342 |
|    clip_fraction        | 0.0115      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0161     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.00254     |
|    n_updates            | 39300       |
|    policy_gradient_loss | -0.00137    |
|    value_loss           | 0.0218      |
-----------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 96

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 97.8        |
|    ep_rew_mean          | -97.8       |
| time/                   |             |
|    fps                  | 1361        |
|    iterations           | 3941        |
|    time_elapsed         | 5927        |
|    total_timesteps      | 8071168     |
| train/                  |             |
|    approx_kl            | 0.010636164 |
|    clip_fraction        | 0.0104      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0151     |
|    explained_variance   | 0.999       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0187      |
|    n_updates            | 39400       |
|    policy_gradient_loss | -0.00154    |
|    value_loss           | 0.0596      |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 97.4  

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 101         |
|    ep_rew_mean          | -101        |
| time/                   |             |
|    fps                  | 1361        |
|    iterations           | 3951        |
|    time_elapsed         | 5941        |
|    total_timesteps      | 8091648     |
| train/                  |             |
|    approx_kl            | 0.028954221 |
|    clip_fraction        | 0.0217      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0257     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.00642     |
|    n_updates            | 39500       |
|    policy_gradient_loss | 0.00117     |
|    value_loss           | 0.025       |
-----------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 10

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 99.5        |
|    ep_rew_mean          | -99.5       |
| time/                   |             |
|    fps                  | 1362        |
|    iterations           | 3961        |
|    time_elapsed         | 5955        |
|    total_timesteps      | 8112128     |
| train/                  |             |
|    approx_kl            | 0.005774988 |
|    clip_fraction        | 0.0147      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.024      |
|    explained_variance   | 0.999       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0698      |
|    n_updates            | 39600       |
|    policy_gradient_loss | 0.00143     |
|    value_loss           | 0.142       |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.1

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 98.6        |
|    ep_rew_mean          | -98.6       |
| time/                   |             |
|    fps                  | 1362        |
|    iterations           | 3971        |
|    time_elapsed         | 5969        |
|    total_timesteps      | 8132608     |
| train/                  |             |
|    approx_kl            | 0.003443761 |
|    clip_fraction        | 0.0145      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0229     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | -0.000511   |
|    n_updates            | 39700       |
|    policy_gradient_loss | -0.000927   |
|    value_loss           | 0.0213      |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.4

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 105          |
|    ep_rew_mean          | -105         |
| time/                   |              |
|    fps                  | 1362         |
|    iterations           | 3981         |
|    time_elapsed         | 5983         |
|    total_timesteps      | 8153088      |
| train/                  |              |
|    approx_kl            | 0.0005460838 |
|    clip_fraction        | 0.00313      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0241      |
|    explained_variance   | 0.984        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0939       |
|    n_updates            | 39800        |
|    policy_gradient_loss | -0.00114     |
|    value_loss           | 1.18         |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.8         |
|    ep_rew_mean          | -98.8        |
| time/                   |              |
|    fps                  | 1362         |
|    iterations           | 3991         |
|    time_elapsed         | 5997         |
|    total_timesteps      | 8173568      |
| train/                  |              |
|    approx_kl            | 0.0012256135 |
|    clip_fraction        | 0.0121       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0288      |
|    explained_variance   | 0.993        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.289        |
|    n_updates            | 39900        |
|    policy_gradient_loss | 0.00174      |
|    value_loss           | 0.894        |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 104          |
|    ep_rew_mean          | -104         |
| time/                   |              |
|    fps                  | 1362         |
|    iterations           | 4001         |
|    time_elapsed         | 6012         |
|    total_timesteps      | 8194048      |
| train/                  |              |
|    approx_kl            | 0.0019198877 |
|    clip_fraction        | 0.00767      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0233      |
|    explained_variance   | 0.987        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.062        |
|    n_updates            | 40000        |
|    policy_gradient_loss | -0.000891    |
|    value_loss           | 0.439        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 100          |
|    ep_rew_mean          | -100         |
| time/                   |              |
|    fps                  | 1362         |
|    iterations           | 4011         |
|    time_elapsed         | 6027         |
|    total_timesteps      | 8214528      |
| train/                  |              |
|    approx_kl            | 0.0013203439 |
|    clip_fraction        | 0.00757      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0275      |
|    explained_variance   | 0.991        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0589       |
|    n_updates            | 40100        |
|    policy_gradient_loss | -0.000197    |
|    value_loss           | 0.324        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 100          |
|    ep_rew_mean          | -100         |
| time/                   |              |
|    fps                  | 1363         |
|    iterations           | 4021         |
|    time_elapsed         | 6041         |
|    total_timesteps      | 8235008      |
| train/                  |              |
|    approx_kl            | 0.0015408457 |
|    clip_fraction        | 0.0101       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.042       |
|    explained_variance   | 0.996        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0657       |
|    n_updates            | 40200        |
|    policy_gradient_loss | -0.000936    |
|    value_loss           | 0.157        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.6         |
|    ep_rew_mean          | -98.6        |
| time/                   |              |
|    fps                  | 1363         |
|    iterations           | 4031         |
|    time_elapsed         | 6055         |
|    total_timesteps      | 8255488      |
| train/                  |              |
|    approx_kl            | 0.0027251113 |
|    clip_fraction        | 0.0203       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0334      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0213       |
|    n_updates            | 40300        |
|    policy_gradient_loss | 0.00626      |
|    value_loss           | 0.0396       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 100          |
|    ep_rew_mean          | -100         |
| time/                   |              |
|    fps                  | 1363         |
|    iterations           | 4041         |
|    time_elapsed         | 6069         |
|    total_timesteps      | 8275968      |
| train/                  |              |
|    approx_kl            | 0.0012319068 |
|    clip_fraction        | 0.00786      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.024       |
|    explained_variance   | 0.995        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.336        |
|    n_updates            | 40400        |
|    policy_gradient_loss | -0.000198    |
|    value_loss           | 0.55         |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 99.2        |
|    ep_rew_mean          | -99.2       |
| time/                   |             |
|    fps                  | 1363        |
|    iterations           | 4051        |
|    time_elapsed         | 6083        |
|    total_timesteps      | 8296448     |
| train/                  |             |
|    approx_kl            | 0.004970678 |
|    clip_fraction        | 0.0149      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0209     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0113      |
|    n_updates            | 40500       |
|    policy_gradient_loss | 0.000122    |
|    value_loss           | 0.0199      |
-----------------------------------------
---------------------------------------
| rollout/                |           |
|    ep_len_mean          | 98.5      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.1         |
|    ep_rew_mean          | -99.1        |
| time/                   |              |
|    fps                  | 1363         |
|    iterations           | 4061         |
|    time_elapsed         | 6097         |
|    total_timesteps      | 8316928      |
| train/                  |              |
|    approx_kl            | 0.0034154598 |
|    clip_fraction        | 0.0159       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.022       |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.063        |
|    n_updates            | 40600        |
|    policy_gradient_loss | 0.00189      |
|    value_loss           | 0.193        |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 104          |
|    ep_rew_mean          | -104         |
| time/                   |              |
|    fps                  | 1364         |
|    iterations           | 4071         |
|    time_elapsed         | 6111         |
|    total_timesteps      | 8337408      |
| train/                  |              |
|    approx_kl            | 0.0029461011 |
|    clip_fraction        | 0.0116       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0218      |
|    explained_variance   | 0.998        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0491       |
|    n_updates            | 40700        |
|    policy_gradient_loss | 0.000445     |
|    value_loss           | 0.106        |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 102           |
|    ep_rew_mean          | -102          |
| time/                   |               |
|    fps                  | 1364          |
|    iterations           | 4081          |
|    time_elapsed         | 6126          |
|    total_timesteps      | 8357888       |
| train/                  |               |
|    approx_kl            | 0.00079271704 |
|    clip_fraction        | 0.00566       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0224       |
|    explained_variance   | 0.989         |
|    learning_rate        | 0.0003        |
|    loss                 | 0.166         |
|    n_updates            | 40800         |
|    policy_gradient_loss | -0.00157      |
|    value_loss           | 0.575         |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.6         |
|    ep_rew_mean          | -99.6        |
| time/                   |              |
|    fps                  | 1363         |
|    iterations           | 4091         |
|    time_elapsed         | 6142         |
|    total_timesteps      | 8378368      |
| train/                  |              |
|    approx_kl            | 0.0013224947 |
|    clip_fraction        | 0.00972      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0282      |
|    explained_variance   | 0.997        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0186       |
|    n_updates            | 40900        |
|    policy_gradient_loss | -0.000204    |
|    value_loss           | 0.124        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 101          |
|    ep_rew_mean          | -101         |
| time/                   |              |
|    fps                  | 1364         |
|    iterations           | 4101         |
|    time_elapsed         | 6156         |
|    total_timesteps      | 8398848      |
| train/                  |              |
|    approx_kl            | 0.0020812145 |
|    clip_fraction        | 0.015        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0291      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.012        |
|    n_updates            | 41000        |
|    policy_gradient_loss | -0.00137     |
|    value_loss           | 0.0332       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 98.6        |
|    ep_rew_mean          | -98.6       |
| time/                   |             |
|    fps                  | 1364        |
|    iterations           | 4111        |
|    time_elapsed         | 6171        |
|    total_timesteps      | 8419328     |
| train/                  |             |
|    approx_kl            | 0.005756148 |
|    clip_fraction        | 0.0158      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0345     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.00866     |
|    n_updates            | 41100       |
|    policy_gradient_loss | 0.00238     |
|    value_loss           | 0.0236      |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98  

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 99.4          |
|    ep_rew_mean          | -99.4         |
| time/                   |               |
|    fps                  | 1364          |
|    iterations           | 4121          |
|    time_elapsed         | 6186          |
|    total_timesteps      | 8439808       |
| train/                  |               |
|    approx_kl            | 0.00091648154 |
|    clip_fraction        | 0.00894       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0238       |
|    explained_variance   | 0.999         |
|    learning_rate        | 0.0003        |
|    loss                 | 0.0249        |
|    n_updates            | 41200         |
|    policy_gradient_loss | 0.000817      |
|    value_loss           | 0.0949        |
-------------------------------------------
-----------------------------------------
| rollout/                |       

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.7         |
|    ep_rew_mean          | -97.7        |
| time/                   |              |
|    fps                  | 1363         |
|    iterations           | 4131         |
|    time_elapsed         | 6202         |
|    total_timesteps      | 8460288      |
| train/                  |              |
|    approx_kl            | 0.0010861616 |
|    clip_fraction        | 0.00688      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0236      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0116       |
|    n_updates            | 41300        |
|    policy_gradient_loss | 0.000483     |
|    value_loss           | 0.0188       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.7         |
|    ep_rew_mean          | -99.7        |
| time/                   |              |
|    fps                  | 1363         |
|    iterations           | 4141         |
|    time_elapsed         | 6217         |
|    total_timesteps      | 8480768      |
| train/                  |              |
|    approx_kl            | 0.0017708848 |
|    clip_fraction        | 0.00913      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.024       |
|    explained_variance   | 0.984        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.708        |
|    n_updates            | 41400        |
|    policy_gradient_loss | -0.00102     |
|    value_loss           | 1.56         |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.1         |
|    ep_rew_mean          | -97.1        |
| time/                   |              |
|    fps                  | 1364         |
|    iterations           | 4151         |
|    time_elapsed         | 6231         |
|    total_timesteps      | 8501248      |
| train/                  |              |
|    approx_kl            | 0.0018412826 |
|    clip_fraction        | 0.013        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0232      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.00925      |
|    n_updates            | 41500        |
|    policy_gradient_loss | -0.000303    |
|    value_loss           | 0.022        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 103          |
|    ep_rew_mean          | -103         |
| time/                   |              |
|    fps                  | 1364         |
|    iterations           | 4161         |
|    time_elapsed         | 6247         |
|    total_timesteps      | 8521728      |
| train/                  |              |
|    approx_kl            | 0.0037849934 |
|    clip_fraction        | 0.0116       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0219      |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0012       |
|    n_updates            | 41600        |
|    policy_gradient_loss | 0.000838     |
|    value_loss           | 0.0349       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 98.3        |
|    ep_rew_mean          | -98.3       |
| time/                   |             |
|    fps                  | 1363        |
|    iterations           | 4171        |
|    time_elapsed         | 6262        |
|    total_timesteps      | 8542208     |
| train/                  |             |
|    approx_kl            | 0.000626264 |
|    clip_fraction        | 0.00542     |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0243     |
|    explained_variance   | 0.977       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.289       |
|    n_updates            | 41700       |
|    policy_gradient_loss | -0.000868   |
|    value_loss           | 2.32        |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.4

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 99.6          |
|    ep_rew_mean          | -99.6         |
| time/                   |               |
|    fps                  | 1363          |
|    iterations           | 4181          |
|    time_elapsed         | 6278          |
|    total_timesteps      | 8562688       |
| train/                  |               |
|    approx_kl            | 0.00052486174 |
|    clip_fraction        | 0.00415       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0224       |
|    explained_variance   | 0.963         |
|    learning_rate        | 0.0003        |
|    loss                 | 11.3          |
|    n_updates            | 41800         |
|    policy_gradient_loss | -0.00133      |
|    value_loss           | 5.29          |
-------------------------------------------
------------------------------------------
| rollout/                |      

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 98.2        |
|    ep_rew_mean          | -98.2       |
| time/                   |             |
|    fps                  | 1363        |
|    iterations           | 4191        |
|    time_elapsed         | 6293        |
|    total_timesteps      | 8583168     |
| train/                  |             |
|    approx_kl            | 0.004993214 |
|    clip_fraction        | 0.0111      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0216     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.00834     |
|    n_updates            | 41900       |
|    policy_gradient_loss | 0.00746     |
|    value_loss           | 0.0224      |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.8

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 107          |
|    ep_rew_mean          | -107         |
| time/                   |              |
|    fps                  | 1363         |
|    iterations           | 4201         |
|    time_elapsed         | 6308         |
|    total_timesteps      | 8603648      |
| train/                  |              |
|    approx_kl            | 0.0006599311 |
|    clip_fraction        | 0.00537      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0204      |
|    explained_variance   | 0.977        |
|    learning_rate        | 0.0003       |
|    loss                 | 2.5          |
|    n_updates            | 42000        |
|    policy_gradient_loss | -0.000553    |
|    value_loss           | 6.27         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 99.5          |
|    ep_rew_mean          | -99.5         |
| time/                   |               |
|    fps                  | 1363          |
|    iterations           | 4211          |
|    time_elapsed         | 6323          |
|    total_timesteps      | 8624128       |
| train/                  |               |
|    approx_kl            | 0.00037740773 |
|    clip_fraction        | 0.0153        |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0258       |
|    explained_variance   | 0.988         |
|    learning_rate        | 0.0003        |
|    loss                 | 0.522         |
|    n_updates            | 42100         |
|    policy_gradient_loss | 0.000134      |
|    value_loss           | 1.14          |
-------------------------------------------
-----------------------------------------
| rollout/                |       

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 110           |
|    ep_rew_mean          | -110          |
| time/                   |               |
|    fps                  | 1364          |
|    iterations           | 4221          |
|    time_elapsed         | 6337          |
|    total_timesteps      | 8644608       |
| train/                  |               |
|    approx_kl            | 0.00024267288 |
|    clip_fraction        | 0.00166       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0333       |
|    explained_variance   | 0.962         |
|    learning_rate        | 0.0003        |
|    loss                 | 5.66          |
|    n_updates            | 42200         |
|    policy_gradient_loss | -0.000345     |
|    value_loss           | 6.79          |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 102          |
|    ep_rew_mean          | -102         |
| time/                   |              |
|    fps                  | 1364         |
|    iterations           | 4231         |
|    time_elapsed         | 6351         |
|    total_timesteps      | 8665088      |
| train/                  |              |
|    approx_kl            | 0.0030127035 |
|    clip_fraction        | 0.0237       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0341      |
|    explained_variance   | 0.998        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0465       |
|    n_updates            | 42300        |
|    policy_gradient_loss | -0.000996    |
|    value_loss           | 0.152        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 99.7          |
|    ep_rew_mean          | -99.7         |
| time/                   |               |
|    fps                  | 1364          |
|    iterations           | 4241          |
|    time_elapsed         | 6365          |
|    total_timesteps      | 8685568       |
| train/                  |               |
|    approx_kl            | 0.00053595495 |
|    clip_fraction        | 0.00762       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0208       |
|    explained_variance   | 0.999         |
|    learning_rate        | 0.0003        |
|    loss                 | 0.0159        |
|    n_updates            | 42400         |
|    policy_gradient_loss | 9.95e-06      |
|    value_loss           | 0.0484        |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.8         |
|    ep_rew_mean          | -97.8        |
| time/                   |              |
|    fps                  | 1364         |
|    iterations           | 4251         |
|    time_elapsed         | 6379         |
|    total_timesteps      | 8706048      |
| train/                  |              |
|    approx_kl            | 0.0020940048 |
|    clip_fraction        | 0.0112       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0265      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.000362     |
|    n_updates            | 42500        |
|    policy_gradient_loss | 0.000395     |
|    value_loss           | 0.0139       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 96.3         |
|    ep_rew_mean          | -96.3        |
| time/                   |              |
|    fps                  | 1364         |
|    iterations           | 4261         |
|    time_elapsed         | 6393         |
|    total_timesteps      | 8726528      |
| train/                  |              |
|    approx_kl            | 0.0048086885 |
|    clip_fraction        | 0.0109       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0182      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.014        |
|    n_updates            | 42600        |
|    policy_gradient_loss | 0.000765     |
|    value_loss           | 0.0191       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 102          |
|    ep_rew_mean          | -102         |
| time/                   |              |
|    fps                  | 1365         |
|    iterations           | 4271         |
|    time_elapsed         | 6407         |
|    total_timesteps      | 8747008      |
| train/                  |              |
|    approx_kl            | 0.0006952271 |
|    clip_fraction        | 0.00439      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0244      |
|    explained_variance   | 0.99         |
|    learning_rate        | 0.0003       |
|    loss                 | 0.249        |
|    n_updates            | 42700        |
|    policy_gradient_loss | -0.00114     |
|    value_loss           | 1.99         |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.4         |
|    ep_rew_mean          | -98.4        |
| time/                   |              |
|    fps                  | 1365         |
|    iterations           | 4281         |
|    time_elapsed         | 6421         |
|    total_timesteps      | 8767488      |
| train/                  |              |
|    approx_kl            | 0.0050437977 |
|    clip_fraction        | 0.0128       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.019       |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | -0.00193     |
|    n_updates            | 42800        |
|    policy_gradient_loss | -0.000774    |
|    value_loss           | 0.0194       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98           |
|    ep_rew_mean          | -98          |
| time/                   |              |
|    fps                  | 1365         |
|    iterations           | 4291         |
|    time_elapsed         | 6435         |
|    total_timesteps      | 8787968      |
| train/                  |              |
|    approx_kl            | 0.0008763424 |
|    clip_fraction        | 0.00977      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.019       |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.011        |
|    n_updates            | 42900        |
|    policy_gradient_loss | 0.000663     |
|    value_loss           | 0.0516       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.3         |
|    ep_rew_mean          | -98.3        |
| time/                   |              |
|    fps                  | 1365         |
|    iterations           | 4301         |
|    time_elapsed         | 6449         |
|    total_timesteps      | 8808448      |
| train/                  |              |
|    approx_kl            | 0.0041006804 |
|    clip_fraction        | 0.011        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0189      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0105       |
|    n_updates            | 43000        |
|    policy_gradient_loss | 0.00722      |
|    value_loss           | 0.0226       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 97.9        |
|    ep_rew_mean          | -97.9       |
| time/                   |             |
|    fps                  | 1365        |
|    iterations           | 4311        |
|    time_elapsed         | 6463        |
|    total_timesteps      | 8828928     |
| train/                  |             |
|    approx_kl            | 0.031175956 |
|    clip_fraction        | 0.0143      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0176     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0161      |
|    n_updates            | 43100       |
|    policy_gradient_loss | -3.3e-06    |
|    value_loss           | 0.0216      |
-----------------------------------------
----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 98.6    

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.1         |
|    ep_rew_mean          | -99.1        |
| time/                   |              |
|    fps                  | 1366         |
|    iterations           | 4321         |
|    time_elapsed         | 6477         |
|    total_timesteps      | 8849408      |
| train/                  |              |
|    approx_kl            | 0.0029224511 |
|    clip_fraction        | 0.0192       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.026       |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | -0.00313     |
|    n_updates            | 43200        |
|    policy_gradient_loss | 0.00916      |
|    value_loss           | 0.0294       |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.4         |
|    ep_rew_mean          | -97.4        |
| time/                   |              |
|    fps                  | 1366         |
|    iterations           | 4331         |
|    time_elapsed         | 6492         |
|    total_timesteps      | 8869888      |
| train/                  |              |
|    approx_kl            | 0.0020230706 |
|    clip_fraction        | 0.00615      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0159      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.00522      |
|    n_updates            | 43300        |
|    policy_gradient_loss | 0.000611     |
|    value_loss           | 0.0199       |
------------------------------------------
----------------------------------------
| rollout/                |            |
|    ep_len_mea

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.7         |
|    ep_rew_mean          | -97.7        |
| time/                   |              |
|    fps                  | 1366         |
|    iterations           | 4341         |
|    time_elapsed         | 6506         |
|    total_timesteps      | 8890368      |
| train/                  |              |
|    approx_kl            | 0.0005929248 |
|    clip_fraction        | 0.00884      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0151      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | -0.000349    |
|    n_updates            | 43400        |
|    policy_gradient_loss | -0.000138    |
|    value_loss           | 0.0171       |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 98.4          |
|    ep_rew_mean          | -98.4         |
| time/                   |               |
|    fps                  | 1366          |
|    iterations           | 4351          |
|    time_elapsed         | 6520          |
|    total_timesteps      | 8910848       |
| train/                  |               |
|    approx_kl            | 0.00057655945 |
|    clip_fraction        | 0.00708       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.018        |
|    explained_variance   | 0.971         |
|    learning_rate        | 0.0003        |
|    loss                 | 0.0642        |
|    n_updates            | 43500         |
|    policy_gradient_loss | 3.36e-06      |
|    value_loss           | 3.7           |
-------------------------------------------
-----------------------------------------
| rollout/                |       

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 104         |
|    ep_rew_mean          | -104        |
| time/                   |             |
|    fps                  | 1366        |
|    iterations           | 4361        |
|    time_elapsed         | 6534        |
|    total_timesteps      | 8931328     |
| train/                  |             |
|    approx_kl            | 0.005401253 |
|    clip_fraction        | 0.00874     |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0216     |
|    explained_variance   | 0.992       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.155       |
|    n_updates            | 43600       |
|    policy_gradient_loss | -0.0026     |
|    value_loss           | 0.784       |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 102   

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 100          |
|    ep_rew_mean          | -100         |
| time/                   |              |
|    fps                  | 1367         |
|    iterations           | 4371         |
|    time_elapsed         | 6547         |
|    total_timesteps      | 8951808      |
| train/                  |              |
|    approx_kl            | 0.0017655455 |
|    clip_fraction        | 0.0137       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0296      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0108       |
|    n_updates            | 43700        |
|    policy_gradient_loss | -0.000347    |
|    value_loss           | 0.029        |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.1         |
|    ep_rew_mean          | -98.1        |
| time/                   |              |
|    fps                  | 1367         |
|    iterations           | 4381         |
|    time_elapsed         | 6561         |
|    total_timesteps      | 8972288      |
| train/                  |              |
|    approx_kl            | 0.0056836857 |
|    clip_fraction        | 0.0129       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0276      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0103       |
|    n_updates            | 43800        |
|    policy_gradient_loss | -0.00113     |
|    value_loss           | 0.0204       |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 98.6        |
|    ep_rew_mean          | -98.6       |
| time/                   |             |
|    fps                  | 1367        |
|    iterations           | 4391        |
|    time_elapsed         | 6576        |
|    total_timesteps      | 8992768     |
| train/                  |             |
|    approx_kl            | 0.002233081 |
|    clip_fraction        | 0.0122      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0207     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0132      |
|    n_updates            | 43900       |
|    policy_gradient_loss | -0.000698   |
|    value_loss           | 0.0213      |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98  

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99           |
|    ep_rew_mean          | -99          |
| time/                   |              |
|    fps                  | 1367         |
|    iterations           | 4401         |
|    time_elapsed         | 6590         |
|    total_timesteps      | 9013248      |
| train/                  |              |
|    approx_kl            | 0.0014032271 |
|    clip_fraction        | 0.0108       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0196      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.00403      |
|    n_updates            | 44000        |
|    policy_gradient_loss | 0.00205      |
|    value_loss           | 0.0166       |
------------------------------------------
----------------------------------------
| rollout/                |            |
|    ep_len_mea

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.7         |
|    ep_rew_mean          | -97.7        |
| time/                   |              |
|    fps                  | 1367         |
|    iterations           | 4411         |
|    time_elapsed         | 6605         |
|    total_timesteps      | 9033728      |
| train/                  |              |
|    approx_kl            | 0.0031047382 |
|    clip_fraction        | 0.0145       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0287      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.014        |
|    n_updates            | 44100        |
|    policy_gradient_loss | 0.00525      |
|    value_loss           | 0.0193       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.5         |
|    ep_rew_mean          | -98.5        |
| time/                   |              |
|    fps                  | 1367         |
|    iterations           | 4421         |
|    time_elapsed         | 6620         |
|    total_timesteps      | 9054208      |
| train/                  |              |
|    approx_kl            | 0.0037857958 |
|    clip_fraction        | 0.0157       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0219      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.000814     |
|    n_updates            | 44200        |
|    policy_gradient_loss | -9.16e-05    |
|    value_loss           | 0.0178       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 96.6         |
|    ep_rew_mean          | -96.6        |
| time/                   |              |
|    fps                  | 1367         |
|    iterations           | 4431         |
|    time_elapsed         | 6634         |
|    total_timesteps      | 9074688      |
| train/                  |              |
|    approx_kl            | 0.0010894911 |
|    clip_fraction        | 0.00908      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.027       |
|    explained_variance   | 0.996        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.232        |
|    n_updates            | 44300        |
|    policy_gradient_loss | -0.00186     |
|    value_loss           | 0.258        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.9         |
|    ep_rew_mean          | -99.9        |
| time/                   |              |
|    fps                  | 1367         |
|    iterations           | 4441         |
|    time_elapsed         | 6648         |
|    total_timesteps      | 9095168      |
| train/                  |              |
|    approx_kl            | 6.353837e-05 |
|    clip_fraction        | 0.00156      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0279      |
|    explained_variance   | 0.955        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.322        |
|    n_updates            | 44400        |
|    policy_gradient_loss | 0.00104      |
|    value_loss           | 5.89         |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 97.7       |
|    ep_rew_mean          | -97.7      |
| time/                   |            |
|    fps                  | 1368       |
|    iterations           | 4451       |
|    time_elapsed         | 6662       |
|    total_timesteps      | 9115648    |
| train/                  |            |
|    approx_kl            | 0.00062515 |
|    clip_fraction        | 0.00664    |
|    clip_range           | 0.2        |
|    entropy_loss         | -0.0229    |
|    explained_variance   | 0.998      |
|    learning_rate        | 0.0003     |
|    loss                 | 0.0315     |
|    n_updates            | 44500      |
|    policy_gradient_loss | 0.000224   |
|    value_loss           | 0.131      |
----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 96.9         |
|    ep_re

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 101          |
|    ep_rew_mean          | -101         |
| time/                   |              |
|    fps                  | 1368         |
|    iterations           | 4461         |
|    time_elapsed         | 6676         |
|    total_timesteps      | 9136128      |
| train/                  |              |
|    approx_kl            | 0.0006909418 |
|    clip_fraction        | 0.00425      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0231      |
|    explained_variance   | 0.975        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.2          |
|    n_updates            | 44600        |
|    policy_gradient_loss | -0.000329    |
|    value_loss           | 2.33         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.8         |
|    ep_rew_mean          | -97.8        |
| time/                   |              |
|    fps                  | 1368         |
|    iterations           | 4471         |
|    time_elapsed         | 6693         |
|    total_timesteps      | 9156608      |
| train/                  |              |
|    approx_kl            | 0.0027968397 |
|    clip_fraction        | 0.00894      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0258      |
|    explained_variance   | 0.997        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.164        |
|    n_updates            | 44700        |
|    policy_gradient_loss | -0.000893    |
|    value_loss           | 0.216        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.4         |
|    ep_rew_mean          | -98.4        |
| time/                   |              |
|    fps                  | 1368         |
|    iterations           | 4481         |
|    time_elapsed         | 6707         |
|    total_timesteps      | 9177088      |
| train/                  |              |
|    approx_kl            | 0.0019132362 |
|    clip_fraction        | 0.021        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0248      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.00939      |
|    n_updates            | 44800        |
|    policy_gradient_loss | -0.0013      |
|    value_loss           | 0.0156       |
------------------------------------------
---------------------------------------
| rollout/                |           |
|    ep_len_mean 

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 102          |
|    ep_rew_mean          | -102         |
| time/                   |              |
|    fps                  | 1368         |
|    iterations           | 4491         |
|    time_elapsed         | 6722         |
|    total_timesteps      | 9197568      |
| train/                  |              |
|    approx_kl            | 0.0009596186 |
|    clip_fraction        | 0.00737      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0236      |
|    explained_variance   | 0.995        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.52         |
|    n_updates            | 44900        |
|    policy_gradient_loss | 0.0012       |
|    value_loss           | 1.23         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 99.1          |
|    ep_rew_mean          | -99.1         |
| time/                   |               |
|    fps                  | 1368          |
|    iterations           | 4501          |
|    time_elapsed         | 6736          |
|    total_timesteps      | 9218048       |
| train/                  |               |
|    approx_kl            | 0.00046737932 |
|    clip_fraction        | 0.00552       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0223       |
|    explained_variance   | 0.989         |
|    learning_rate        | 0.0003        |
|    loss                 | 0.053         |
|    n_updates            | 45000         |
|    policy_gradient_loss | -0.000504     |
|    value_loss           | 0.476         |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99           |
|    ep_rew_mean          | -99          |
| time/                   |              |
|    fps                  | 1368         |
|    iterations           | 4511         |
|    time_elapsed         | 6750         |
|    total_timesteps      | 9238528      |
| train/                  |              |
|    approx_kl            | 0.0062258868 |
|    clip_fraction        | 0.00605      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0253      |
|    explained_variance   | 0.984        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0286       |
|    n_updates            | 45100        |
|    policy_gradient_loss | 0.00322      |
|    value_loss           | 1.62         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.2         |
|    ep_rew_mean          | -99.2        |
| time/                   |              |
|    fps                  | 1368         |
|    iterations           | 4521         |
|    time_elapsed         | 6765         |
|    total_timesteps      | 9259008      |
| train/                  |              |
|    approx_kl            | 0.0014956183 |
|    clip_fraction        | 0.0103       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0273      |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0201       |
|    n_updates            | 45200        |
|    policy_gradient_loss | 0.000621     |
|    value_loss           | 0.0491       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 103        |
|    ep_rew_mean          | -103       |
| time/                   |            |
|    fps                  | 1368       |
|    iterations           | 4531       |
|    time_elapsed         | 6779       |
|    total_timesteps      | 9279488    |
| train/                  |            |
|    approx_kl            | 0.02734239 |
|    clip_fraction        | 0.00918    |
|    clip_range           | 0.2        |
|    entropy_loss         | -0.0353    |
|    explained_variance   | 0.982      |
|    learning_rate        | 0.0003     |
|    loss                 | 0.000578   |
|    n_updates            | 45300      |
|    policy_gradient_loss | -0.00479   |
|    value_loss           | 0.798      |
----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 106          |
|    ep_re

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 103          |
|    ep_rew_mean          | -103         |
| time/                   |              |
|    fps                  | 1368         |
|    iterations           | 4541         |
|    time_elapsed         | 6793         |
|    total_timesteps      | 9299968      |
| train/                  |              |
|    approx_kl            | 0.0018525941 |
|    clip_fraction        | 0.0179       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0264      |
|    explained_variance   | 0.997        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0452       |
|    n_updates            | 45400        |
|    policy_gradient_loss | 0.00181      |
|    value_loss           | 0.151        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97           |
|    ep_rew_mean          | -97          |
| time/                   |              |
|    fps                  | 1369         |
|    iterations           | 4551         |
|    time_elapsed         | 6807         |
|    total_timesteps      | 9320448      |
| train/                  |              |
|    approx_kl            | 0.0015666699 |
|    clip_fraction        | 0.0121       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0294      |
|    explained_variance   | 0.991        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0332       |
|    n_updates            | 45500        |
|    policy_gradient_loss | 0.00028      |
|    value_loss           | 0.209        |
------------------------------------------
----------------------------------------
| rollout/                |            |
|    ep_len_mea

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 99.7          |
|    ep_rew_mean          | -99.7         |
| time/                   |               |
|    fps                  | 1369          |
|    iterations           | 4561          |
|    time_elapsed         | 6822          |
|    total_timesteps      | 9340928       |
| train/                  |               |
|    approx_kl            | 0.00084513763 |
|    clip_fraction        | 0.00737       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0246       |
|    explained_variance   | 0.999         |
|    learning_rate        | 0.0003        |
|    loss                 | 0.0252        |
|    n_updates            | 45600         |
|    policy_gradient_loss | -0.00117      |
|    value_loss           | 0.118         |
-------------------------------------------
-----------------------------------------
| rollout/                |       

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 105           |
|    ep_rew_mean          | -105          |
| time/                   |               |
|    fps                  | 1369          |
|    iterations           | 4571          |
|    time_elapsed         | 6837          |
|    total_timesteps      | 9361408       |
| train/                  |               |
|    approx_kl            | 0.00097381667 |
|    clip_fraction        | 0.00469       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0222       |
|    explained_variance   | 0.984         |
|    learning_rate        | 0.0003        |
|    loss                 | 0.105         |
|    n_updates            | 45700         |
|    policy_gradient_loss | -0.00158      |
|    value_loss           | 0.61          |
-------------------------------------------
-----------------------------------------
| rollout/                |       

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 99          |
|    ep_rew_mean          | -99         |
| time/                   |             |
|    fps                  | 1368        |
|    iterations           | 4581        |
|    time_elapsed         | 6853        |
|    total_timesteps      | 9381888     |
| train/                  |             |
|    approx_kl            | 0.004099588 |
|    clip_fraction        | 0.0154      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0246     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.011       |
|    n_updates            | 45800       |
|    policy_gradient_loss | 0.00397     |
|    value_loss           | 0.0343      |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 98.2  

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 113          |
|    ep_rew_mean          | -113         |
| time/                   |              |
|    fps                  | 1368         |
|    iterations           | 4591         |
|    time_elapsed         | 6869         |
|    total_timesteps      | 9402368      |
| train/                  |              |
|    approx_kl            | 0.0031457292 |
|    clip_fraction        | 0.0111       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0398      |
|    explained_variance   | 0.968        |
|    learning_rate        | 0.0003       |
|    loss                 | 5.97         |
|    n_updates            | 45900        |
|    policy_gradient_loss | -0.00105     |
|    value_loss           | 7.63         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.8         |
|    ep_rew_mean          | -98.8        |
| time/                   |              |
|    fps                  | 1368         |
|    iterations           | 4601         |
|    time_elapsed         | 6884         |
|    total_timesteps      | 9422848      |
| train/                  |              |
|    approx_kl            | 0.0011839402 |
|    clip_fraction        | 0.0171       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0329      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0146       |
|    n_updates            | 46000        |
|    policy_gradient_loss | -0.0008      |
|    value_loss           | 0.0368       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.3         |
|    ep_rew_mean          | -98.3        |
| time/                   |              |
|    fps                  | 1368         |
|    iterations           | 4611         |
|    time_elapsed         | 6899         |
|    total_timesteps      | 9443328      |
| train/                  |              |
|    approx_kl            | 0.0070420923 |
|    clip_fraction        | 0.0207       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0264      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.00778      |
|    n_updates            | 46100        |
|    policy_gradient_loss | -0.00038     |
|    value_loss           | 0.0289       |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 99.5       |
|    ep_rew_mean          | -99.5      |
| time/                   |            |
|    fps                  | 1368       |
|    iterations           | 4621       |
|    time_elapsed         | 6915       |
|    total_timesteps      | 9463808    |
| train/                  |            |
|    approx_kl            | 0.00813271 |
|    clip_fraction        | 0.0114     |
|    clip_range           | 0.2        |
|    entropy_loss         | -0.0233    |
|    explained_variance   | 0.995      |
|    learning_rate        | 0.0003     |
|    loss                 | 0.0346     |
|    n_updates            | 46200      |
|    policy_gradient_loss | -0.00133   |
|    value_loss           | 0.239      |
----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 100          |
|    ep_re

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 96.8         |
|    ep_rew_mean          | -96.8        |
| time/                   |              |
|    fps                  | 1368         |
|    iterations           | 4631         |
|    time_elapsed         | 6931         |
|    total_timesteps      | 9484288      |
| train/                  |              |
|    approx_kl            | 0.0043430864 |
|    clip_fraction        | 0.0141       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0207      |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0138       |
|    n_updates            | 46300        |
|    policy_gradient_loss | -0.000151    |
|    value_loss           | 0.0602       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 99.3        |
|    ep_rew_mean          | -99.3       |
| time/                   |             |
|    fps                  | 1368        |
|    iterations           | 4641        |
|    time_elapsed         | 6947        |
|    total_timesteps      | 9504768     |
| train/                  |             |
|    approx_kl            | 0.003252834 |
|    clip_fraction        | 0.0156      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0256     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0145      |
|    n_updates            | 46400       |
|    policy_gradient_loss | -0.0021     |
|    value_loss           | 0.0216      |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 100 

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.2         |
|    ep_rew_mean          | -99.2        |
| time/                   |              |
|    fps                  | 1367         |
|    iterations           | 4651         |
|    time_elapsed         | 6963         |
|    total_timesteps      | 9525248      |
| train/                  |              |
|    approx_kl            | 0.0030915546 |
|    clip_fraction        | 0.0118       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0205      |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0107       |
|    n_updates            | 46500        |
|    policy_gradient_loss | -0.00133     |
|    value_loss           | 0.043        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.5         |
|    ep_rew_mean          | -98.5        |
| time/                   |              |
|    fps                  | 1367         |
|    iterations           | 4661         |
|    time_elapsed         | 6979         |
|    total_timesteps      | 9545728      |
| train/                  |              |
|    approx_kl            | 0.0012517233 |
|    clip_fraction        | 0.0123       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0217      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.013        |
|    n_updates            | 46600        |
|    policy_gradient_loss | 0.00249      |
|    value_loss           | 0.0283       |
------------------------------------------
---------------------------------------
| rollout/                |           |
|    ep_len_mean 

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 102         |
|    ep_rew_mean          | -102        |
| time/                   |             |
|    fps                  | 1367        |
|    iterations           | 4671        |
|    time_elapsed         | 6994        |
|    total_timesteps      | 9566208     |
| train/                  |             |
|    approx_kl            | 0.001151594 |
|    clip_fraction        | 0.0107      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0265     |
|    explained_variance   | 0.981       |
|    learning_rate        | 0.0003      |
|    loss                 | 1.64        |
|    n_updates            | 46700       |
|    policy_gradient_loss | -0.00165    |
|    value_loss           | 4.68        |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 101   

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.7         |
|    ep_rew_mean          | -98.7        |
| time/                   |              |
|    fps                  | 1367         |
|    iterations           | 4681         |
|    time_elapsed         | 7010         |
|    total_timesteps      | 9586688      |
| train/                  |              |
|    approx_kl            | 0.0010258993 |
|    clip_fraction        | 0.00913      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0253      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0159       |
|    n_updates            | 46800        |
|    policy_gradient_loss | 0.000482     |
|    value_loss           | 0.0241       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 100          |
|    ep_rew_mean          | -100         |
| time/                   |              |
|    fps                  | 1367         |
|    iterations           | 4691         |
|    time_elapsed         | 7025         |
|    total_timesteps      | 9607168      |
| train/                  |              |
|    approx_kl            | 0.0017215565 |
|    clip_fraction        | 0.0148       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0192      |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.016        |
|    n_updates            | 46900        |
|    policy_gradient_loss | -0.000852    |
|    value_loss           | 0.0407       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 99.5        |
|    ep_rew_mean          | -99.5       |
| time/                   |             |
|    fps                  | 1367        |
|    iterations           | 4701        |
|    time_elapsed         | 7039        |
|    total_timesteps      | 9627648     |
| train/                  |             |
|    approx_kl            | 0.022410704 |
|    clip_fraction        | 0.01        |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0228     |
|    explained_variance   | 0.988       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.064       |
|    n_updates            | 47000       |
|    policy_gradient_loss | 0.000841    |
|    value_loss           | 0.732       |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 101 

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 97.4        |
|    ep_rew_mean          | -97.4       |
| time/                   |             |
|    fps                  | 1367        |
|    iterations           | 4711        |
|    time_elapsed         | 7054        |
|    total_timesteps      | 9648128     |
| train/                  |             |
|    approx_kl            | 0.004017213 |
|    clip_fraction        | 0.0153      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0212     |
|    explained_variance   | 0.999       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0179      |
|    n_updates            | 47100       |
|    policy_gradient_loss | 0.0016      |
|    value_loss           | 0.0582      |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 96.5

----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 102        |
|    ep_rew_mean          | -102       |
| time/                   |            |
|    fps                  | 1367       |
|    iterations           | 4721       |
|    time_elapsed         | 7070       |
|    total_timesteps      | 9668608    |
| train/                  |            |
|    approx_kl            | 0.11828356 |
|    clip_fraction        | 0.0235     |
|    clip_range           | 0.2        |
|    entropy_loss         | -0.0415    |
|    explained_variance   | 1          |
|    learning_rate        | 0.0003     |
|    loss                 | 0.00387    |
|    n_updates            | 47200      |
|    policy_gradient_loss | -0.00365   |
|    value_loss           | 0.0208     |
----------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 106           |
|    ep

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 110           |
|    ep_rew_mean          | -110          |
| time/                   |               |
|    fps                  | 1367          |
|    iterations           | 4731          |
|    time_elapsed         | 7084          |
|    total_timesteps      | 9689088       |
| train/                  |               |
|    approx_kl            | 0.00088496855 |
|    clip_fraction        | 0.00835       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0415       |
|    explained_variance   | 0.97          |
|    learning_rate        | 0.0003        |
|    loss                 | 2.36          |
|    n_updates            | 47300         |
|    policy_gradient_loss | -0.000263     |
|    value_loss           | 6.62          |
-------------------------------------------
------------------------------------------
| rollout/                |      

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 100         |
|    ep_rew_mean          | -100        |
| time/                   |             |
|    fps                  | 1367        |
|    iterations           | 4741        |
|    time_elapsed         | 7098        |
|    total_timesteps      | 9709568     |
| train/                  |             |
|    approx_kl            | 0.005422976 |
|    clip_fraction        | 0.0173      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0532     |
|    explained_variance   | 0.999       |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0365      |
|    n_updates            | 47400       |
|    policy_gradient_loss | 0.000416    |
|    value_loss           | 0.08        |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.6

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.1         |
|    ep_rew_mean          | -98.1        |
| time/                   |              |
|    fps                  | 1367         |
|    iterations           | 4751         |
|    time_elapsed         | 7112         |
|    total_timesteps      | 9730048      |
| train/                  |              |
|    approx_kl            | 0.0014891075 |
|    clip_fraction        | 0.00615      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0228      |
|    explained_variance   | 0.986        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0479       |
|    n_updates            | 47500        |
|    policy_gradient_loss | -0.00107     |
|    value_loss           | 0.497        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.1         |
|    ep_rew_mean          | -97.1        |
| time/                   |              |
|    fps                  | 1368         |
|    iterations           | 4761         |
|    time_elapsed         | 7126         |
|    total_timesteps      | 9750528      |
| train/                  |              |
|    approx_kl            | 0.0013213172 |
|    clip_fraction        | 0.0101       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0195      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.00823      |
|    n_updates            | 47600        |
|    policy_gradient_loss | -0.000124    |
|    value_loss           | 0.0229       |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 96.7         |
|    ep_rew_mean          | -96.7        |
| time/                   |              |
|    fps                  | 1368         |
|    iterations           | 4771         |
|    time_elapsed         | 7141         |
|    total_timesteps      | 9771008      |
| train/                  |              |
|    approx_kl            | 0.0017494243 |
|    clip_fraction        | 0.0132       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.02        |
|    explained_variance   | 0.999        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0281       |
|    n_updates            | 47700        |
|    policy_gradient_loss | -0.00132     |
|    value_loss           | 0.0973       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 99.1         |
|    ep_rew_mean          | -99.1        |
| time/                   |              |
|    fps                  | 1368         |
|    iterations           | 4781         |
|    time_elapsed         | 7157         |
|    total_timesteps      | 9791488      |
| train/                  |              |
|    approx_kl            | 0.0008301893 |
|    clip_fraction        | 0.00889      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0243      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.00289      |
|    n_updates            | 47800        |
|    policy_gradient_loss | 0.0017       |
|    value_loss           | 0.025        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.7         |
|    ep_rew_mean          | -97.7        |
| time/                   |              |
|    fps                  | 1367         |
|    iterations           | 4791         |
|    time_elapsed         | 7173         |
|    total_timesteps      | 9811968      |
| train/                  |              |
|    approx_kl            | 0.0013524925 |
|    clip_fraction        | 0.00879      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0188      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.009        |
|    n_updates            | 47900        |
|    policy_gradient_loss | -8.04e-05    |
|    value_loss           | 0.0207       |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.5         |
|    ep_rew_mean          | -98.5        |
| time/                   |              |
|    fps                  | 1368         |
|    iterations           | 4801         |
|    time_elapsed         | 7187         |
|    total_timesteps      | 9832448      |
| train/                  |              |
|    approx_kl            | 0.0013273365 |
|    clip_fraction        | 0.00903      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0214      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0139       |
|    n_updates            | 48000        |
|    policy_gradient_loss | -0.000517    |
|    value_loss           | 0.0199       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 97.8         |
|    ep_rew_mean          | -97.8        |
| time/                   |              |
|    fps                  | 1368         |
|    iterations           | 4811         |
|    time_elapsed         | 7201         |
|    total_timesteps      | 9852928      |
| train/                  |              |
|    approx_kl            | 0.0029541508 |
|    clip_fraction        | 0.0172       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0311      |
|    explained_variance   | 1            |
|    learning_rate        | 0.0003       |
|    loss                 | 0.0198       |
|    n_updates            | 48100        |
|    policy_gradient_loss | 0.012        |
|    value_loss           | 0.0242       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 98          |
|    ep_rew_mean          | -98         |
| time/                   |             |
|    fps                  | 1368        |
|    iterations           | 4821        |
|    time_elapsed         | 7215        |
|    total_timesteps      | 9873408     |
| train/                  |             |
|    approx_kl            | 0.006431275 |
|    clip_fraction        | 0.0121      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0201     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.00204     |
|    n_updates            | 48200       |
|    policy_gradient_loss | -0.00173    |
|    value_loss           | 0.0148      |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.2

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 98.8        |
|    ep_rew_mean          | -98.8       |
| time/                   |             |
|    fps                  | 1368        |
|    iterations           | 4831        |
|    time_elapsed         | 7229        |
|    total_timesteps      | 9893888     |
| train/                  |             |
|    approx_kl            | 0.035536855 |
|    clip_fraction        | 0.0219      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0226     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0027      |
|    n_updates            | 48300       |
|    policy_gradient_loss | 0.057       |
|    value_loss           | 0.0226      |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 98.3

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 98.4        |
|    ep_rew_mean          | -98.4       |
| time/                   |             |
|    fps                  | 1368        |
|    iterations           | 4841        |
|    time_elapsed         | 7243        |
|    total_timesteps      | 9914368     |
| train/                  |             |
|    approx_kl            | 0.007531444 |
|    clip_fraction        | 0.0246      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0332     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0119      |
|    n_updates            | 48400       |
|    policy_gradient_loss | -0.00201    |
|    value_loss           | 0.0205      |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 98.7  

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 97.5        |
|    ep_rew_mean          | -97.5       |
| time/                   |             |
|    fps                  | 1368        |
|    iterations           | 4851        |
|    time_elapsed         | 7257        |
|    total_timesteps      | 9934848     |
| train/                  |             |
|    approx_kl            | 0.006360907 |
|    clip_fraction        | 0.0165      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0188     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.00391     |
|    n_updates            | 48500       |
|    policy_gradient_loss | -0.00308    |
|    value_loss           | 0.0227      |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 96.5

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 100          |
|    ep_rew_mean          | -100         |
| time/                   |              |
|    fps                  | 1369         |
|    iterations           | 4861         |
|    time_elapsed         | 7271         |
|    total_timesteps      | 9955328      |
| train/                  |              |
|    approx_kl            | 0.0044783805 |
|    clip_fraction        | 0.0101       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0212      |
|    explained_variance   | 0.996        |
|    learning_rate        | 0.0003       |
|    loss                 | 0.235        |
|    n_updates            | 48600        |
|    policy_gradient_loss | 0.000827     |
|    value_loss           | 0.426        |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 97.8        |
|    ep_rew_mean          | -97.8       |
| time/                   |             |
|    fps                  | 1368        |
|    iterations           | 4871        |
|    time_elapsed         | 7288        |
|    total_timesteps      | 9975808     |
| train/                  |             |
|    approx_kl            | 0.002155738 |
|    clip_fraction        | 0.0117      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0215     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.0106      |
|    n_updates            | 48700       |
|    policy_gradient_loss | 0.00392     |
|    value_loss           | 0.0287      |
-----------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 97

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 98.6        |
|    ep_rew_mean          | -98.6       |
| time/                   |             |
|    fps                  | 1368        |
|    iterations           | 4881        |
|    time_elapsed         | 7303        |
|    total_timesteps      | 9996288     |
| train/                  |             |
|    approx_kl            | 0.122409254 |
|    clip_fraction        | 0.0429      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.0274     |
|    explained_variance   | 1           |
|    learning_rate        | 0.0003      |
|    loss                 | 0.00211     |
|    n_updates            | 48800       |
|    policy_gradient_loss | -0.0105     |
|    value_loss           | 0.0316      |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 100   

In [6]:
model_name = f"{algorithm_name}_{environment_name}_{number_of_episodes}"
Algorithm_Path = os.path.join('Training', 'Saved Models', model_name)
#Algorithm_Path = os.path.join('Training', 'Saved Models', 'PPO_CartPole-v1_10000')
model.save(Algorithm_Path)

In [14]:
episodes = 50
scores = []
for episode in range(1, episodes+1):
    obs = env.reset()
    done = False
    score = 0
    
    while not done:
        
        #env.render()
        action, _ = model.predict(obs) # WE ARE NOW USING OUR MODEL
        obs, reward, done, info = env.step(action)
        score += reward
    
    print('Episode:{} Score:{}'.format(episode, score))
    scores.append(score)
    
env.close()


mean_score = sum(scores) / len(scores)
std_dev = (sum((score - mean_score)**2 for score in scores) / len(scores))**0.5

print(f"Mean Score: {mean_score}")
print(f"Standard Deviation: {std_dev}")



#del model

Episode:1 Score:[-83.]
Episode:2 Score:[-103.]
Episode:3 Score:[-83.]
Episode:4 Score:[-94.]
Episode:5 Score:[-87.]
Episode:6 Score:[-104.]
Episode:7 Score:[-104.]
Episode:8 Score:[-101.]
Episode:9 Score:[-105.]
Episode:10 Score:[-85.]
Episode:11 Score:[-85.]
Episode:12 Score:[-103.]
Episode:13 Score:[-83.]
Episode:14 Score:[-84.]
Episode:15 Score:[-103.]
Episode:16 Score:[-111.]
Episode:17 Score:[-165.]
Episode:18 Score:[-103.]
Episode:19 Score:[-162.]
Episode:20 Score:[-103.]
Episode:21 Score:[-103.]
Episode:22 Score:[-104.]
Episode:23 Score:[-86.]
Episode:24 Score:[-110.]
Episode:25 Score:[-103.]
Episode:26 Score:[-89.]
Episode:27 Score:[-104.]
Episode:28 Score:[-87.]
Episode:29 Score:[-94.]
Episode:30 Score:[-86.]
Episode:31 Score:[-103.]
Episode:32 Score:[-94.]
Episode:33 Score:[-103.]
Episode:34 Score:[-103.]
Episode:35 Score:[-103.]
Episode:36 Score:[-103.]
Episode:37 Score:[-103.]
Episode:38 Score:[-103.]
Episode:39 Score:[-85.]
Episode:40 Score:[-102.]
Episode:41 Score:[-103.]

In [11]:
#del model