## Train Model

In [13]:
import os
import logging
from datetime import datetime
from stable_baselines3 import PPO
from stable_baselines3.common.callbacks import BaseCallback
# Import the sb3 monitor for logging 
from stable_baselines3.common.monitor import Monitor
# Configure the root logger so INFO-level records are emitted.
logger = logging.getLogger()
logger.setLevel(logging.INFO)

# Project-local CARLA walker environment and the helper that reads the
# simulator host address from a file.
from carla_env import CarlaWalkerEnv, read_IP_from_file

# Build the environment; the host is read from '../ip-host.txt', a path that is
# resolved relative to the notebook's working directory.
env = CarlaWalkerEnv(verbose=False, host=read_IP_from_file(file_name='../ip-host.txt'))
# Set the tick limit on the raw environment object, before it is wrapped below.
# 20*60 = 1200, which matches the ep_len_mean of 1.2e+03 in the training log.
# NOTE(review): presumably 20 ticks per second for 60 seconds -- confirm.
env.max_tick_count = 20*60
# Wrap with the SB3 Monitor for logging; from here on `env` is the wrapper,
# not the CarlaWalkerEnv instance itself.
env = Monitor(env)

INFO:root:Map Carla/Maps/Town01 loaded


IP: 137.250.121.29


In [14]:
# Record when this run was started, using the same stamp format as the run directories.
timestamp = datetime.now().strftime('%Y-%m-%d_%H%M')
print('Date and time:', timestamp)

Date and time: 2022-03-03_1145


### Train Callback

In [15]:
class TrainAndLoggingCallback(BaseCallback):
    """Save a snapshot of the model every ``check_freq`` callback calls.

    Snapshots are written to ``save_path`` as ``best_model_<n_calls>``.
    Despite the file name, no reward comparison is performed: every snapshot
    is saved unconditionally.

    Args:
        check_freq: Number of callback calls between two snapshots.
        save_path: Directory that receives the snapshots. ``None`` disables
            saving entirely.
        verbose: Verbosity level forwarded to ``BaseCallback``.
    """

    def __init__(self, check_freq, save_path, verbose=1):
        super().__init__(verbose)
        self.check_freq = check_freq
        self.save_path = save_path

    def _init_callback(self):
        """Create the snapshot directory if a save path was given."""
        if self.save_path is not None:
            os.makedirs(self.save_path, exist_ok=True)

    def _on_step(self):
        """Save a snapshot when due; always return True to keep training.

        Returns:
            True, so that training is never aborted by this callback.
        """
        # Mirror the None guard in _init_callback: without it,
        # os.path.join(None, ...) raises TypeError at the first checkpoint.
        if self.save_path is not None and self.n_calls % self.check_freq == 0:
            model_path = os.path.join(self.save_path, 'best_model_{}'.format(self.n_calls))
            self.model.save(model_path)

        return True

In [16]:
# Timestamp the run so each training session gets its own output directories.
now = datetime.now().strftime('%Y-%m-%d_%H%M')

LOG_DIR = './tmp/train/logs/' + now + '/'
OPT_DIR = './tmp/train/opt/' + now + '/'

# NOTE(review): SAVE_PATH is defined but not used in this cell; the callback
# below writes its checkpoints into LOG_DIR. Confirm which location is intended.
SAVE_PATH = os.path.join(OPT_DIR, 'trial_{}_best_model'.format(1))

# Training budget and checkpoint interval, named so they are easy to tune.
TOTAL_TIMESTEPS = 600_000
CHECKPOINT_FREQ = 10_000

model = PPO(
    'MlpPolicy',
    env,
    tensorboard_log=LOG_DIR,
    verbose=1,
    # **model_params
)

# Close the environment even if training raises or is interrupted from the
# notebook; otherwise env.close() would be skipped.
try:
    model.learn(
        total_timesteps=TOTAL_TIMESTEPS,
        callback=TrainAndLoggingCallback(
            check_freq=CHECKPOINT_FREQ,
            save_path=LOG_DIR,
        ),
    )
finally:
    env.close()


Using cuda device
Wrapping the env in a DummyVecEnv.
Logging to ./tmp/train/logs/2022-03-03_1145/PPO_1


INFO:root:done


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 1.2e+03  |
|    ep_rew_mean     | 1.16e+04 |
| time/              |          |
|    fps             | 161      |
|    iterations      | 1        |
|    time_elapsed    | 12       |
|    total_timesteps | 2048     |
---------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.17e+04    |
| time/                   |             |
|    fps                  | 152         |
|    iterations           | 2           |
|    time_elapsed         | 26          |
|    total_timesteps      | 4096        |
| train/                  |             |
|    approx_kl            | 0.004391538 |
|    clip_fraction        | 0.0325      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.85       |
|    explained_variance   | -0.0039     |
|    learning_rate        | 0.0003      |
|    loss                 | 1.11e+04    |
|    n_updates            | 10          |
|    policy_gradient_loss | -0.0065     |
|    std                  | 1.01        |
|    value_loss           | 2.29e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 1.2e+04      |
| time/                   |              |
|    fps                  | 148          |
|    iterations           | 3            |
|    time_elapsed         | 41           |
|    total_timesteps      | 6144         |
| train/                  |              |
|    approx_kl            | 0.0032937697 |
|    clip_fraction        | 0.0124       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.84        |
|    explained_variance   | 1.19e-07     |
|    learning_rate        | 0.0003       |
|    loss                 | 1.18e+04     |
|    n_updates            | 20           |
|    policy_gradient_loss | -0.00566     |
|    std                  | 0.999        |
|    value_loss           | 2.46e+04     |
------------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.21e+04    |
| time/                   |             |
|    fps                  | 148         |
|    iterations           | 4           |
|    time_elapsed         | 55          |
|    total_timesteps      | 8192        |
| train/                  |             |
|    approx_kl            | 0.005230262 |
|    clip_fraction        | 0.0339      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.83       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.32e+04    |
|    n_updates            | 30          |
|    policy_gradient_loss | -0.00683    |
|    std                  | 0.995       |
|    value_loss           | 2.72e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 1.23e+04     |
| time/                   |              |
|    fps                  | 148          |
|    iterations           | 5            |
|    time_elapsed         | 69           |
|    total_timesteps      | 10240        |
| train/                  |              |
|    approx_kl            | 0.0058952486 |
|    clip_fraction        | 0.0416       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.82        |
|    explained_variance   | 5.6e-06      |
|    learning_rate        | 0.0003       |
|    loss                 | 1.33e+04     |
|    n_updates            | 40           |
|    policy_gradient_loss | -0.0103      |
|    std                  | 0.992        |
|    value_loss           | 2.78e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 1.23e+04     |
| time/                   |              |
|    fps                  | 147          |
|    iterations           | 6            |
|    time_elapsed         | 83           |
|    total_timesteps      | 12288        |
| train/                  |              |
|    approx_kl            | 0.0054528527 |
|    clip_fraction        | 0.0701       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.83        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.32e+04     |
|    n_updates            | 50           |
|    policy_gradient_loss | -0.00763     |
|    std                  | 0.997        |
|    value_loss           | 2.84e+04     |
------------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 1.24e+04     |
| time/                   |              |
|    fps                  | 147          |
|    iterations           | 7            |
|    time_elapsed         | 97           |
|    total_timesteps      | 14336        |
| train/                  |              |
|    approx_kl            | 0.0056882296 |
|    clip_fraction        | 0.0507       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.82        |
|    explained_variance   | -8.34e-07    |
|    learning_rate        | 0.0003       |
|    loss                 | 1.34e+04     |
|    n_updates            | 60           |
|    policy_gradient_loss | -0.0167      |
|    std                  | 0.992        |
|    value_loss           | 2.68e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.26e+04    |
| time/                   |             |
|    fps                  | 147         |
|    iterations           | 8           |
|    time_elapsed         | 110         |
|    total_timesteps      | 16384       |
| train/                  |             |
|    approx_kl            | 0.005596227 |
|    clip_fraction        | 0.0539      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.82       |
|    explained_variance   | 1.07e-06    |
|    learning_rate        | 0.0003      |
|    loss                 | 1.56e+04    |
|    n_updates            | 70          |
|    policy_gradient_loss | -0.00549    |
|    std                  | 0.994       |
|    value_loss           | 3.32e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.28e+04    |
| time/                   |             |
|    fps                  | 147         |
|    iterations           | 9           |
|    time_elapsed         | 124         |
|    total_timesteps      | 18432       |
| train/                  |             |
|    approx_kl            | 0.008129839 |
|    clip_fraction        | 0.0799      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.83       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.31e+04    |
|    n_updates            | 80          |
|    policy_gradient_loss | -0.00546    |
|    std                  | 1           |
|    value_loss           | 2.93e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 1.28e+04     |
| time/                   |              |
|    fps                  | 147          |
|    iterations           | 10           |
|    time_elapsed         | 138          |
|    total_timesteps      | 20480        |
| train/                  |              |
|    approx_kl            | 0.0076107667 |
|    clip_fraction        | 0.069        |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.83        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.51e+04     |
|    n_updates            | 90           |
|    policy_gradient_loss | -0.023       |
|    std                  | 0.99         |
|    value_loss           | 3.23e+04     |
------------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.29e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 11          |
|    time_elapsed         | 153         |
|    total_timesteps      | 22528       |
| train/                  |             |
|    approx_kl            | 0.011042925 |
|    clip_fraction        | 0.136       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.8        |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.48e+04    |
|    n_updates            | 100         |
|    policy_gradient_loss | -0.0137     |
|    std                  | 0.979       |
|    value_loss           | 3.05e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.2e+03    |
|    ep_rew_mean          | 1.31e+04   |
| time/                   |            |
|    fps                  | 146        |
|    iterations           | 12         |
|    time_elapsed         | 167        |
|    total_timesteps      | 24576      |
| train/                  |            |
|    approx_kl            | 0.01359958 |
|    clip_fraction        | 0.144      |
|    clip_range           | 0.2        |
|    entropy_loss         | -2.78      |
|    explained_variance   | 0          |
|    learning_rate        | 0.0003     |
|    loss                 | 1.54e+04   |
|    n_updates            | 110        |
|    policy_gradient_loss | -0.00544   |
|    std                  | 0.969      |
|    value_loss           | 3.27e+04   |
----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.32e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 13          |
|    time_elapsed         | 182         |
|    total_timesteps      | 26624       |
| train/                  |             |
|    approx_kl            | 0.004331241 |
|    clip_fraction        | 0.0518      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.77       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 1.67e+04    |
|    n_updates            | 120         |
|    policy_gradient_loss | -0.00361    |
|    std                  | 0.962       |
|    value_loss           | 3.36e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.32e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 14          |
|    time_elapsed         | 195         |
|    total_timesteps      | 28672       |
| train/                  |             |
|    approx_kl            | 0.008661566 |
|    clip_fraction        | 0.136       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.77       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.64e+04    |
|    n_updates            | 130         |
|    policy_gradient_loss | -0.0107     |
|    std                  | 0.967       |
|    value_loss           | 3.51e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.33e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 15          |
|    time_elapsed         | 209         |
|    total_timesteps      | 30720       |
| train/                  |             |
|    approx_kl            | 0.008165269 |
|    clip_fraction        | 0.0993      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.77       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.62e+04    |
|    n_updates            | 140         |
|    policy_gradient_loss | -0.00909    |
|    std                  | 0.967       |
|    value_loss           | 3.1e+04     |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.34e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 16          |
|    time_elapsed         | 223         |
|    total_timesteps      | 32768       |
| train/                  |             |
|    approx_kl            | 0.010763007 |
|    clip_fraction        | 0.116       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.77       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.46e+04    |
|    n_updates            | 150         |
|    policy_gradient_loss | -0.00913    |
|    std                  | 0.965       |
|    value_loss           | 3.02e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.35e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 17          |
|    time_elapsed         | 236         |
|    total_timesteps      | 34816       |
| train/                  |             |
|    approx_kl            | 0.010309635 |
|    clip_fraction        | 0.097       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.76       |
|    explained_variance   | 1.19e-07    |
|    learning_rate        | 0.0003      |
|    loss                 | 1.79e+04    |
|    n_updates            | 160         |
|    policy_gradient_loss | -0.016      |
|    std                  | 0.963       |
|    value_loss           | 3.72e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.35e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 18          |
|    time_elapsed         | 251         |
|    total_timesteps      | 36864       |
| train/                  |             |
|    approx_kl            | 0.010238191 |
|    clip_fraction        | 0.126       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.75       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 1.82e+04    |
|    n_updates            | 170         |
|    policy_gradient_loss | -0.0178     |
|    std                  | 0.952       |
|    value_loss           | 3.62e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.36e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 19          |
|    time_elapsed         | 265         |
|    total_timesteps      | 38912       |
| train/                  |             |
|    approx_kl            | 0.010769315 |
|    clip_fraction        | 0.113       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.73       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.38e+04    |
|    n_updates            | 180         |
|    policy_gradient_loss | -0.0116     |
|    std                  | 0.94        |
|    value_loss           | 3e+04       |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.36e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 20          |
|    time_elapsed         | 279         |
|    total_timesteps      | 40960       |
| train/                  |             |
|    approx_kl            | 0.011145861 |
|    clip_fraction        | 0.105       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.7        |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.42e+04    |
|    n_updates            | 190         |
|    policy_gradient_loss | -0.0263     |
|    std                  | 0.923       |
|    value_loss           | 2.97e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.37e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 21          |
|    time_elapsed         | 293         |
|    total_timesteps      | 43008       |
| train/                  |             |
|    approx_kl            | 0.015250875 |
|    clip_fraction        | 0.136       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.66       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.64e+04    |
|    n_updates            | 200         |
|    policy_gradient_loss | -0.0171     |
|    std                  | 0.904       |
|    value_loss           | 3.27e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.2e+03    |
|    ep_rew_mean          | 1.37e+04   |
| time/                   |            |
|    fps                  | 146        |
|    iterations           | 22         |
|    time_elapsed         | 307        |
|    total_timesteps      | 45056      |
| train/                  |            |
|    approx_kl            | 0.01354915 |
|    clip_fraction        | 0.162      |
|    clip_range           | 0.2        |
|    entropy_loss         | -2.64      |
|    explained_variance   | 0          |
|    learning_rate        | 0.0003     |
|    loss                 | 1.78e+04   |
|    n_updates            | 210        |
|    policy_gradient_loss | -0.00339   |
|    std                  | 0.905      |
|    value_loss           | 3.64e+04   |
----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.38e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 23          |
|    time_elapsed         | 321         |
|    total_timesteps      | 47104       |
| train/                  |             |
|    approx_kl            | 0.011652257 |
|    clip_fraction        | 0.152       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.63       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 1.39e+04    |
|    n_updates            | 220         |
|    policy_gradient_loss | -0.00208    |
|    std                  | 0.897       |
|    value_loss           | 2.98e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.39e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 24          |
|    time_elapsed         | 335         |
|    total_timesteps      | 49152       |
| train/                  |             |
|    approx_kl            | 0.008541563 |
|    clip_fraction        | 0.0871      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.63       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.72e+04    |
|    n_updates            | 230         |
|    policy_gradient_loss | -0.0154     |
|    std                  | 0.906       |
|    value_loss           | 3.31e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.4e+04     |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 25          |
|    time_elapsed         | 349         |
|    total_timesteps      | 51200       |
| train/                  |             |
|    approx_kl            | 0.009695856 |
|    clip_fraction        | 0.0991      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.64       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 3.03e+04    |
|    n_updates            | 240         |
|    policy_gradient_loss | -0.0225     |
|    std                  | 0.904       |
|    value_loss           | 5.91e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.41e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 26          |
|    time_elapsed         | 363         |
|    total_timesteps      | 53248       |
| train/                  |             |
|    approx_kl            | 0.016079355 |
|    clip_fraction        | 0.22        |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.64       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.34e+04    |
|    n_updates            | 250         |
|    policy_gradient_loss | -0.0105     |
|    std                  | 0.903       |
|    value_loss           | 2.8e+04     |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.41e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 27          |
|    time_elapsed         | 377         |
|    total_timesteps      | 55296       |
| train/                  |             |
|    approx_kl            | 0.012627118 |
|    clip_fraction        | 0.132       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.63       |
|    explained_variance   | 1.19e-07    |
|    learning_rate        | 0.0003      |
|    loss                 | 1.99e+04    |
|    n_updates            | 260         |
|    policy_gradient_loss | -0.00803    |
|    std                  | 0.901       |
|    value_loss           | 4.56e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.42e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 28          |
|    time_elapsed         | 391         |
|    total_timesteps      | 57344       |
| train/                  |             |
|    approx_kl            | 0.014936594 |
|    clip_fraction        | 0.179       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.63       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 1.19e+04    |
|    n_updates            | 270         |
|    policy_gradient_loss | -0.00363    |
|    std                  | 0.901       |
|    value_loss           | 2.54e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.43e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 29          |
|    time_elapsed         | 405         |
|    total_timesteps      | 59392       |
| train/                  |             |
|    approx_kl            | 0.013621929 |
|    clip_fraction        | 0.139       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.63       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.87e+04    |
|    n_updates            | 280         |
|    policy_gradient_loss | -0.0116     |
|    std                  | 0.903       |
|    value_loss           | 5.49e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.46e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 30          |
|    time_elapsed         | 419         |
|    total_timesteps      | 61440       |
| train/                  |             |
|    approx_kl            | 0.014553876 |
|    clip_fraction        | 0.218       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.63       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.18e+04    |
|    n_updates            | 290         |
|    policy_gradient_loss | 0.00823     |
|    std                  | 0.9         |
|    value_loss           | 4.42e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.47e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 31          |
|    time_elapsed         | 433         |
|    total_timesteps      | 63488       |
| train/                  |             |
|    approx_kl            | 0.007278528 |
|    clip_fraction        | 0.09        |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.62       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 3.93e+04    |
|    n_updates            | 300         |
|    policy_gradient_loss | -0.00995    |
|    std                  | 0.895       |
|    value_loss           | 7.37e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.2e+03    |
|    ep_rew_mean          | 1.48e+04   |
| time/                   |            |
|    fps                  | 146        |
|    iterations           | 32         |
|    time_elapsed         | 447        |
|    total_timesteps      | 65536      |
| train/                  |            |
|    approx_kl            | 0.01160966 |
|    clip_fraction        | 0.128      |
|    clip_range           | 0.2        |
|    entropy_loss         | -2.61      |
|    explained_variance   | 0          |
|    learning_rate        | 0.0003     |
|    loss                 | 3.16e+04   |
|    n_updates            | 310        |
|    policy_gradient_loss | -0.00724   |
|    std                  | 0.894      |
|    value_loss           | 6.29e+04   |
----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.5e+04     |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 33          |
|    time_elapsed         | 461         |
|    total_timesteps      | 67584       |
| train/                  |             |
|    approx_kl            | 0.018593464 |
|    clip_fraction        | 0.14        |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.62       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 1.96e+04    |
|    n_updates            | 320         |
|    policy_gradient_loss | -0.0151     |
|    std                  | 0.895       |
|    value_loss           | 3.84e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


---------------------------------------
| rollout/                |           |
|    ep_len_mean          | 1.2e+03   |
|    ep_rew_mean          | 1.51e+04  |
| time/                   |           |
|    fps                  | 146       |
|    iterations           | 34        |
|    time_elapsed         | 475       |
|    total_timesteps      | 69632     |
| train/                  |           |
|    approx_kl            | 0.0150782 |
|    clip_fraction        | 0.151     |
|    clip_range           | 0.2       |
|    entropy_loss         | -2.62     |
|    explained_variance   | 0         |
|    learning_rate        | 0.0003    |
|    loss                 | 3.27e+04  |
|    n_updates            | 330       |
|    policy_gradient_loss | -0.0103   |
|    std                  | 0.894     |
|    value_loss           | 6.71e+04  |
---------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 1.51e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 35           |
|    time_elapsed         | 489          |
|    total_timesteps      | 71680        |
| train/                  |              |
|    approx_kl            | 0.0122095235 |
|    clip_fraction        | 0.136        |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.62        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 2.19e+04     |
|    n_updates            | 340          |
|    policy_gradient_loss | -0.00897     |
|    std                  | 0.893        |
|    value_loss           | 4.53e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.54e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 36          |
|    time_elapsed         | 503         |
|    total_timesteps      | 73728       |
| train/                  |             |
|    approx_kl            | 0.007932127 |
|    clip_fraction        | 0.0719      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.61       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.45e+04    |
|    n_updates            | 350         |
|    policy_gradient_loss | -0.00412    |
|    std                  | 0.893       |
|    value_loss           | 5.21e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.54e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 37          |
|    time_elapsed         | 517         |
|    total_timesteps      | 75776       |
| train/                  |             |
|    approx_kl            | 0.013687752 |
|    clip_fraction        | 0.148       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.62       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 3.75e+04    |
|    n_updates            | 360         |
|    policy_gradient_loss | -0.00648    |
|    std                  | 0.901       |
|    value_loss           | 7.21e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.54e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 38          |
|    time_elapsed         | 531         |
|    total_timesteps      | 77824       |
| train/                  |             |
|    approx_kl            | 0.019635525 |
|    clip_fraction        | 0.196       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.62       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.77e+04    |
|    n_updates            | 370         |
|    policy_gradient_loss | -0.00608    |
|    std                  | 0.894       |
|    value_loss           | 3.67e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.55e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 39          |
|    time_elapsed         | 545         |
|    total_timesteps      | 79872       |
| train/                  |             |
|    approx_kl            | 0.014820069 |
|    clip_fraction        | 0.152       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.6        |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.49e+04    |
|    n_updates            | 380         |
|    policy_gradient_loss | -0.0325     |
|    std                  | 0.884       |
|    value_loss           | 3.3e+04     |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.55e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 40          |
|    time_elapsed         | 559         |
|    total_timesteps      | 81920       |
| train/                  |             |
|    approx_kl            | 0.023059068 |
|    clip_fraction        | 0.237       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.59       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.74e+04    |
|    n_updates            | 390         |
|    policy_gradient_loss | -0.000467   |
|    std                  | 0.881       |
|    value_loss           | 4.08e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.55e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 41          |
|    time_elapsed         | 573         |
|    total_timesteps      | 83968       |
| train/                  |             |
|    approx_kl            | 0.018831586 |
|    clip_fraction        | 0.169       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.58       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.04e+04    |
|    n_updates            | 400         |
|    policy_gradient_loss | -0.0248     |
|    std                  | 0.872       |
|    value_loss           | 4.24e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.56e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 42          |
|    time_elapsed         | 587         |
|    total_timesteps      | 86016       |
| train/                  |             |
|    approx_kl            | 0.023009354 |
|    clip_fraction        | 0.213       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.57       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.63e+04    |
|    n_updates            | 410         |
|    policy_gradient_loss | 0.00402     |
|    std                  | 0.876       |
|    value_loss           | 5.39e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.58e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 43          |
|    time_elapsed         | 601         |
|    total_timesteps      | 88064       |
| train/                  |             |
|    approx_kl            | 0.012054702 |
|    clip_fraction        | 0.149       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.56       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.72e+04    |
|    n_updates            | 420         |
|    policy_gradient_loss | -0.00522    |
|    std                  | 0.866       |
|    value_loss           | 5.18e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.59e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 44          |
|    time_elapsed         | 615         |
|    total_timesteps      | 90112       |
| train/                  |             |
|    approx_kl            | 0.018233374 |
|    clip_fraction        | 0.146       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.54       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 4.14e+04    |
|    n_updates            | 430         |
|    policy_gradient_loss | -0.00968    |
|    std                  | 0.854       |
|    value_loss           | 7.75e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.69e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 45          |
|    time_elapsed         | 629         |
|    total_timesteps      | 92160       |
| train/                  |             |
|    approx_kl            | 0.030004544 |
|    clip_fraction        | 0.289       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.52       |
|    explained_variance   | 1.19e-07    |
|    learning_rate        | 0.0003      |
|    loss                 | 2.45e+04    |
|    n_updates            | 440         |
|    policy_gradient_loss | 0.00773     |
|    std                  | 0.856       |
|    value_loss           | 4.6e+04     |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 1.7e+04      |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 46           |
|    time_elapsed         | 643          |
|    total_timesteps      | 94208        |
| train/                  |              |
|    approx_kl            | 0.0057585663 |
|    clip_fraction        | 0.0339       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.52        |
|    explained_variance   | -2.38e-07    |
|    learning_rate        | 0.0003       |
|    loss                 | 1.04e+06     |
|    n_updates            | 450          |
|    policy_gradient_loss | -0.00344     |
|    std                  | 0.851        |
|    value_loss           | 3.83e+06     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 1.7e+04      |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 47           |
|    time_elapsed         | 656          |
|    total_timesteps      | 96256        |
| train/                  |              |
|    approx_kl            | 0.0145547455 |
|    clip_fraction        | 0.131        |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.49        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.97e+04     |
|    n_updates            | 460          |
|    policy_gradient_loss | -0.0207      |
|    std                  | 0.832        |
|    value_loss           | 4.46e+04     |
------------------------------------------


INFO:root:done


----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.2e+03    |
|    ep_rew_mean          | 1.7e+04    |
| time/                   |            |
|    fps                  | 146        |
|    iterations           | 48         |
|    time_elapsed         | 670        |
|    total_timesteps      | 98304      |
| train/                  |            |
|    approx_kl            | 0.02108854 |
|    clip_fraction        | 0.216      |
|    clip_range           | 0.2        |
|    entropy_loss         | -2.47      |
|    explained_variance   | 0          |
|    learning_rate        | 0.0003     |
|    loss                 | 2.17e+04   |
|    n_updates            | 470        |
|    policy_gradient_loss | -0.000534  |
|    std                  | 0.836      |
|    value_loss           | 4.14e+04   |
----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.7e+04     |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 49          |
|    time_elapsed         | 685         |
|    total_timesteps      | 100352      |
| train/                  |             |
|    approx_kl            | 0.021511838 |
|    clip_fraction        | 0.235       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.48       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.84e+04    |
|    n_updates            | 480         |
|    policy_gradient_loss | 0.00179     |
|    std                  | 0.835       |
|    value_loss           | 3.83e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.71e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 50          |
|    time_elapsed         | 699         |
|    total_timesteps      | 102400      |
| train/                  |             |
|    approx_kl            | 0.022287574 |
|    clip_fraction        | 0.247       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.49       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.49e+04    |
|    n_updates            | 490         |
|    policy_gradient_loss | 0.00136     |
|    std                  | 0.842       |
|    value_loss           | 3.27e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.71e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 51          |
|    time_elapsed         | 713         |
|    total_timesteps      | 104448      |
| train/                  |             |
|    approx_kl            | 0.009410672 |
|    clip_fraction        | 0.0986      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.49       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 3.92e+04    |
|    n_updates            | 500         |
|    policy_gradient_loss | -0.00541    |
|    std                  | 0.836       |
|    value_loss           | 6.97e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.71e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 52          |
|    time_elapsed         | 727         |
|    total_timesteps      | 106496      |
| train/                  |             |
|    approx_kl            | 0.018075552 |
|    clip_fraction        | 0.198       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.48       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.55e+04    |
|    n_updates            | 510         |
|    policy_gradient_loss | -0.011      |
|    std                  | 0.834       |
|    value_loss           | 5.08e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.72e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 53          |
|    time_elapsed         | 741         |
|    total_timesteps      | 108544      |
| train/                  |             |
|    approx_kl            | 0.015388653 |
|    clip_fraction        | 0.179       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.48       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 1.59e+04    |
|    n_updates            | 520         |
|    policy_gradient_loss | -0.0115     |
|    std                  | 0.836       |
|    value_loss           | 3.43e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.73e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 54          |
|    time_elapsed         | 755         |
|    total_timesteps      | 110592      |
| train/                  |             |
|    approx_kl            | 0.011160995 |
|    clip_fraction        | 0.123       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.48       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 3.9e+04     |
|    n_updates            | 530         |
|    policy_gradient_loss | -0.0146     |
|    std                  | 0.832       |
|    value_loss           | 8.16e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.73e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 55          |
|    time_elapsed         | 769         |
|    total_timesteps      | 112640      |
| train/                  |             |
|    approx_kl            | 0.013476456 |
|    clip_fraction        | 0.158       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.48       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 3.69e+04    |
|    n_updates            | 540         |
|    policy_gradient_loss | -0.00493    |
|    std                  | 0.841       |
|    value_loss           | 6.68e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.73e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 56          |
|    time_elapsed         | 783         |
|    total_timesteps      | 114688      |
| train/                  |             |
|    approx_kl            | 0.015881626 |
|    clip_fraction        | 0.173       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.5        |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.83e+04    |
|    n_updates            | 550         |
|    policy_gradient_loss | -0.0252     |
|    std                  | 0.843       |
|    value_loss           | 3.78e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.73e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 57          |
|    time_elapsed         | 797         |
|    total_timesteps      | 116736      |
| train/                  |             |
|    approx_kl            | 0.026833735 |
|    clip_fraction        | 0.234       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.47       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 1.43e+04    |
|    n_updates            | 560         |
|    policy_gradient_loss | -0.00958    |
|    std                  | 0.828       |
|    value_loss           | 3.05e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.73e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 58          |
|    time_elapsed         | 812         |
|    total_timesteps      | 118784      |
| train/                  |             |
|    approx_kl            | 0.028344654 |
|    clip_fraction        | 0.278       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.45       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.4e+04     |
|    n_updates            | 570         |
|    policy_gradient_loss | 0.00196     |
|    std                  | 0.82        |
|    value_loss           | 2.68e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.74e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 59          |
|    time_elapsed         | 825         |
|    total_timesteps      | 120832      |
| train/                  |             |
|    approx_kl            | 0.015825741 |
|    clip_fraction        | 0.156       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.45       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.94e+04    |
|    n_updates            | 580         |
|    policy_gradient_loss | 0.000557    |
|    std                  | 0.826       |
|    value_loss           | 5.74e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.2e+03    |
|    ep_rew_mean          | 1.75e+04   |
| time/                   |            |
|    fps                  | 146        |
|    iterations           | 60         |
|    time_elapsed         | 839        |
|    total_timesteps      | 122880     |
| train/                  |            |
|    approx_kl            | 0.02055395 |
|    clip_fraction        | 0.19       |
|    clip_range           | 0.2        |
|    entropy_loss         | -2.45      |
|    explained_variance   | 0          |
|    learning_rate        | 0.0003     |
|    loss                 | 1.51e+04   |
|    n_updates            | 590        |
|    policy_gradient_loss | 0.0043     |
|    std                  | 0.819      |
|    value_loss           | 3.72e+04   |
----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.76e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 61          |
|    time_elapsed         | 853         |
|    total_timesteps      | 124928      |
| train/                  |             |
|    approx_kl            | 0.013689511 |
|    clip_fraction        | 0.14        |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.44       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.54e+04    |
|    n_updates            | 600         |
|    policy_gradient_loss | -0.021      |
|    std                  | 0.819       |
|    value_loss           | 3.43e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.76e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 62          |
|    time_elapsed         | 867         |
|    total_timesteps      | 126976      |
| train/                  |             |
|    approx_kl            | 0.015221818 |
|    clip_fraction        | 0.168       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.43       |
|    explained_variance   | 1.19e-07    |
|    learning_rate        | 0.0003      |
|    loss                 | 1.61e+04    |
|    n_updates            | 610         |
|    policy_gradient_loss | -0.0285     |
|    std                  | 0.813       |
|    value_loss           | 3.37e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.2e+03    |
|    ep_rew_mean          | 1.76e+04   |
| time/                   |            |
|    fps                  | 146        |
|    iterations           | 63         |
|    time_elapsed         | 881        |
|    total_timesteps      | 129024     |
| train/                  |            |
|    approx_kl            | 0.04071191 |
|    clip_fraction        | 0.319      |
|    clip_range           | 0.2        |
|    entropy_loss         | -2.42      |
|    explained_variance   | 0          |
|    learning_rate        | 0.0003     |
|    loss                 | 9.33e+03   |
|    n_updates            | 620        |
|    policy_gradient_loss | 0.011      |
|    std                  | 0.811      |
|    value_loss           | 1.98e+04   |
----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.77e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 64          |
|    time_elapsed         | 895         |
|    total_timesteps      | 131072      |
| train/                  |             |
|    approx_kl            | 0.017623218 |
|    clip_fraction        | 0.167       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.43       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 8.13e+03    |
|    n_updates            | 630         |
|    policy_gradient_loss | -0.00306    |
|    std                  | 0.814       |
|    value_loss           | 1.64e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.77e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 65          |
|    time_elapsed         | 910         |
|    total_timesteps      | 133120      |
| train/                  |             |
|    approx_kl            | 0.016778994 |
|    clip_fraction        | 0.204       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.43       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 8.33e+03    |
|    n_updates            | 640         |
|    policy_gradient_loss | 0.00403     |
|    std                  | 0.815       |
|    value_loss           | 1.96e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.77e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 66          |
|    time_elapsed         | 924         |
|    total_timesteps      | 135168      |
| train/                  |             |
|    approx_kl            | 0.021337302 |
|    clip_fraction        | 0.164       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.42       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 7.65e+03    |
|    n_updates            | 650         |
|    policy_gradient_loss | 0.00748     |
|    std                  | 0.807       |
|    value_loss           | 1.62e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.77e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 67          |
|    time_elapsed         | 938         |
|    total_timesteps      | 137216      |
| train/                  |             |
|    approx_kl            | 0.008562895 |
|    clip_fraction        | 0.0779      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.4        |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 7.06e+03    |
|    n_updates            | 660         |
|    policy_gradient_loss | -0.00562    |
|    std                  | 0.805       |
|    value_loss           | 1.56e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.78e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 68          |
|    time_elapsed         | 952         |
|    total_timesteps      | 139264      |
| train/                  |             |
|    approx_kl            | 0.009808671 |
|    clip_fraction        | 0.107       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.4        |
|    explained_variance   | 1.19e-07    |
|    learning_rate        | 0.0003      |
|    loss                 | 9.21e+03    |
|    n_updates            | 670         |
|    policy_gradient_loss | -0.0133     |
|    std                  | 0.801       |
|    value_loss           | 2.23e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.78e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 69          |
|    time_elapsed         | 966         |
|    total_timesteps      | 141312      |
| train/                  |             |
|    approx_kl            | 0.012630733 |
|    clip_fraction        | 0.118       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.4        |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.12e+04    |
|    n_updates            | 680         |
|    policy_gradient_loss | -0.00732    |
|    std                  | 0.803       |
|    value_loss           | 2.18e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.79e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 70          |
|    time_elapsed         | 981         |
|    total_timesteps      | 143360      |
| train/                  |             |
|    approx_kl            | 0.012141417 |
|    clip_fraction        | 0.116       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.39       |
|    explained_variance   | 1.19e-07    |
|    learning_rate        | 0.0003      |
|    loss                 | 2.42e+04    |
|    n_updates            | 690         |
|    policy_gradient_loss | -0.0226     |
|    std                  | 0.795       |
|    value_loss           | 5.2e+04     |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.8e+04     |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 71          |
|    time_elapsed         | 995         |
|    total_timesteps      | 145408      |
| train/                  |             |
|    approx_kl            | 0.023457542 |
|    clip_fraction        | 0.255       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.38       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.07e+04    |
|    n_updates            | 700         |
|    policy_gradient_loss | -0.00289    |
|    std                  | 0.796       |
|    value_loss           | 2.84e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.8e+04     |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 72          |
|    time_elapsed         | 1009        |
|    total_timesteps      | 147456      |
| train/                  |             |
|    approx_kl            | 0.011387791 |
|    clip_fraction        | 0.13        |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.38       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.26e+04    |
|    n_updates            | 710         |
|    policy_gradient_loss | -0.00732    |
|    std                  | 0.792       |
|    value_loss           | 4.41e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.81e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 73          |
|    time_elapsed         | 1023        |
|    total_timesteps      | 149504      |
| train/                  |             |
|    approx_kl            | 0.017695563 |
|    clip_fraction        | 0.173       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.36       |
|    explained_variance   | 2.38e-07    |
|    learning_rate        | 0.0003      |
|    loss                 | 8.58e+03    |
|    n_updates            | 720         |
|    policy_gradient_loss | -0.0087     |
|    std                  | 0.788       |
|    value_loss           | 1.87e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.81e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 74          |
|    time_elapsed         | 1037        |
|    total_timesteps      | 151552      |
| train/                  |             |
|    approx_kl            | 0.018687332 |
|    clip_fraction        | 0.163       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.37       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.59e+04    |
|    n_updates            | 730         |
|    policy_gradient_loss | 0.00265     |
|    std                  | 0.794       |
|    value_loss           | 3.09e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.81e+04    |
| time/                   |             |
|    fps                  | 145         |
|    iterations           | 75          |
|    time_elapsed         | 1052        |
|    total_timesteps      | 153600      |
| train/                  |             |
|    approx_kl            | 0.015589951 |
|    clip_fraction        | 0.124       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.38       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.37e+04    |
|    n_updates            | 740         |
|    policy_gradient_loss | -0.00322    |
|    std                  | 0.801       |
|    value_loss           | 2.91e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.82e+04    |
| time/                   |             |
|    fps                  | 145         |
|    iterations           | 76          |
|    time_elapsed         | 1067        |
|    total_timesteps      | 155648      |
| train/                  |             |
|    approx_kl            | 0.026954753 |
|    clip_fraction        | 0.211       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.4        |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 7.6e+03     |
|    n_updates            | 750         |
|    policy_gradient_loss | 0.00466     |
|    std                  | 0.803       |
|    value_loss           | 1.77e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.82e+04    |
| time/                   |             |
|    fps                  | 145         |
|    iterations           | 77          |
|    time_elapsed         | 1081        |
|    total_timesteps      | 157696      |
| train/                  |             |
|    approx_kl            | 0.021868024 |
|    clip_fraction        | 0.171       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.39       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.55e+04    |
|    n_updates            | 760         |
|    policy_gradient_loss | -0.000461   |
|    std                  | 0.798       |
|    value_loss           | 2.71e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.82e+04    |
| time/                   |             |
|    fps                  | 145         |
|    iterations           | 78          |
|    time_elapsed         | 1095        |
|    total_timesteps      | 159744      |
| train/                  |             |
|    approx_kl            | 0.010552238 |
|    clip_fraction        | 0.145       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.39       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.31e+04    |
|    n_updates            | 770         |
|    policy_gradient_loss | -0.000139   |
|    std                  | 0.799       |
|    value_loss           | 2.61e+04    |
-----------------------------------------


INFO:root:done


----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.2e+03    |
|    ep_rew_mean          | 1.82e+04   |
| time/                   |            |
|    fps                  | 145        |
|    iterations           | 79         |
|    time_elapsed         | 1109       |
|    total_timesteps      | 161792     |
| train/                  |            |
|    approx_kl            | 0.01820229 |
|    clip_fraction        | 0.185      |
|    clip_range           | 0.2        |
|    entropy_loss         | -2.38      |
|    explained_variance   | 0          |
|    learning_rate        | 0.0003     |
|    loss                 | 7.76e+03   |
|    n_updates            | 780        |
|    policy_gradient_loss | 0.000961   |
|    std                  | 0.797      |
|    value_loss           | 1.66e+04   |
----------------------------------------


INFO:root:done
INFO:root:done


----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.2e+03    |
|    ep_rew_mean          | 1.83e+04   |
| time/                   |            |
|    fps                  | 145        |
|    iterations           | 80         |
|    time_elapsed         | 1123       |
|    total_timesteps      | 163840     |
| train/                  |            |
|    approx_kl            | 0.01317868 |
|    clip_fraction        | 0.149      |
|    clip_range           | 0.2        |
|    entropy_loss         | -2.37      |
|    explained_variance   | 5.96e-08   |
|    learning_rate        | 0.0003     |
|    loss                 | 1.53e+04   |
|    n_updates            | 790        |
|    policy_gradient_loss | 0.000614   |
|    std                  | 0.787      |
|    value_loss           | 2.74e+04   |
----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.83e+04    |
| time/                   |             |
|    fps                  | 145         |
|    iterations           | 81          |
|    time_elapsed         | 1137        |
|    total_timesteps      | 165888      |
| train/                  |             |
|    approx_kl            | 0.009161064 |
|    clip_fraction        | 0.142       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.35       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 1.01e+04    |
|    n_updates            | 800         |
|    policy_gradient_loss | -0.00327    |
|    std                  | 0.785       |
|    value_loss           | 2.47e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.83e+04    |
| time/                   |             |
|    fps                  | 145         |
|    iterations           | 82          |
|    time_elapsed         | 1151        |
|    total_timesteps      | 167936      |
| train/                  |             |
|    approx_kl            | 0.009845901 |
|    clip_fraction        | 0.154       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.36       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 8.07e+03    |
|    n_updates            | 810         |
|    policy_gradient_loss | 0.000412    |
|    std                  | 0.789       |
|    value_loss           | 1.35e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 1.83e+04     |
| time/                   |              |
|    fps                  | 145          |
|    iterations           | 83           |
|    time_elapsed         | 1165         |
|    total_timesteps      | 169984       |
| train/                  |              |
|    approx_kl            | 0.0045108087 |
|    clip_fraction        | 0.0742       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.37        |
|    explained_variance   | -1.19e-07    |
|    learning_rate        | 0.0003       |
|    loss                 | 1.34e+04     |
|    n_updates            | 820          |
|    policy_gradient_loss | -0.000618    |
|    std                  | 0.793        |
|    value_loss           | 2.69e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.84e+04    |
| time/                   |             |
|    fps                  | 145         |
|    iterations           | 84          |
|    time_elapsed         | 1179        |
|    total_timesteps      | 172032      |
| train/                  |             |
|    approx_kl            | 0.007392233 |
|    clip_fraction        | 0.077       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.39       |
|    explained_variance   | 1.19e-07    |
|    learning_rate        | 0.0003      |
|    loss                 | 7.97e+03    |
|    n_updates            | 830         |
|    policy_gradient_loss | -4.53e-05   |
|    std                  | 0.803       |
|    value_loss           | 1.55e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.85e+04    |
| time/                   |             |
|    fps                  | 145         |
|    iterations           | 85          |
|    time_elapsed         | 1192        |
|    total_timesteps      | 174080      |
| train/                  |             |
|    approx_kl            | 0.007693232 |
|    clip_fraction        | 0.0707      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.4        |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.41e+04    |
|    n_updates            | 840         |
|    policy_gradient_loss | -0.0114     |
|    std                  | 0.805       |
|    value_loss           | 6.44e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.86e+04    |
| time/                   |             |
|    fps                  | 145         |
|    iterations           | 86          |
|    time_elapsed         | 1206        |
|    total_timesteps      | 176128      |
| train/                  |             |
|    approx_kl            | 0.003904311 |
|    clip_fraction        | 0.0364      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.4        |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 3.42e+04    |
|    n_updates            | 850         |
|    policy_gradient_loss | -0.00264    |
|    std                  | 0.805       |
|    value_loss           | 5.99e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.85e+04    |
| time/                   |             |
|    fps                  | 145         |
|    iterations           | 87          |
|    time_elapsed         | 1220        |
|    total_timesteps      | 178176      |
| train/                  |             |
|    approx_kl            | 0.010545602 |
|    clip_fraction        | 0.105       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.39       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 9.32e+03    |
|    n_updates            | 860         |
|    policy_gradient_loss | 0.00275     |
|    std                  | 0.796       |
|    value_loss           | 1.8e+04     |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 1.85e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 88           |
|    time_elapsed         | 1234         |
|    total_timesteps      | 180224       |
| train/                  |              |
|    approx_kl            | 0.0038952979 |
|    clip_fraction        | 0.0241       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.39        |
|    explained_variance   | 1.19e-07     |
|    learning_rate        | 0.0003       |
|    loss                 | 1.68e+04     |
|    n_updates            | 870          |
|    policy_gradient_loss | 0.00032      |
|    std                  | 0.799        |
|    value_loss           | 3.36e+04     |
------------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 1.85e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 89           |
|    time_elapsed         | 1248         |
|    total_timesteps      | 182272       |
| train/                  |              |
|    approx_kl            | 0.0048363013 |
|    clip_fraction        | 0.0596       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.4         |
|    explained_variance   | -1.19e-07    |
|    learning_rate        | 0.0003       |
|    loss                 | 1.55e+04     |
|    n_updates            | 880          |
|    policy_gradient_loss | -0.00258     |
|    std                  | 0.807        |
|    value_loss           | 2.86e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.86e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 90          |
|    time_elapsed         | 1262        |
|    total_timesteps      | 184320      |
| train/                  |             |
|    approx_kl            | 0.005844402 |
|    clip_fraction        | 0.0595      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.4        |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.69e+04    |
|    n_updates            | 890         |
|    policy_gradient_loss | -0.00509    |
|    std                  | 0.799       |
|    value_loss           | 4.7e+04     |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 1.86e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 91           |
|    time_elapsed         | 1276         |
|    total_timesteps      | 186368       |
| train/                  |              |
|    approx_kl            | 0.0035861044 |
|    clip_fraction        | 0.0293       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.39        |
|    explained_variance   | 1.19e-07     |
|    learning_rate        | 0.0003       |
|    loss                 | 2.3e+04      |
|    n_updates            | 900          |
|    policy_gradient_loss | -0.00208     |
|    std                  | 0.796        |
|    value_loss           | 4.29e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.86e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 92          |
|    time_elapsed         | 1290        |
|    total_timesteps      | 188416      |
| train/                  |             |
|    approx_kl            | 0.008172901 |
|    clip_fraction        | 0.0651      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.38       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.9e+04     |
|    n_updates            | 910         |
|    policy_gradient_loss | -0.00517    |
|    std                  | 0.796       |
|    value_loss           | 4.44e+04    |
-----------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 1.87e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 93           |
|    time_elapsed         | 1303         |
|    total_timesteps      | 190464       |
| train/                  |              |
|    approx_kl            | 0.0052236803 |
|    clip_fraction        | 0.0422       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.38        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.46e+04     |
|    n_updates            | 920          |
|    policy_gradient_loss | -0.00326     |
|    std                  | 0.792        |
|    value_loss           | 2.86e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.87e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 94          |
|    time_elapsed         | 1318        |
|    total_timesteps      | 192512      |
| train/                  |             |
|    approx_kl            | 0.006089763 |
|    clip_fraction        | 0.0486      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.38       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.73e+04    |
|    n_updates            | 930         |
|    policy_gradient_loss | -0.0059     |
|    std                  | 0.795       |
|    value_loss           | 6.3e+04     |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.87e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 95          |
|    time_elapsed         | 1332        |
|    total_timesteps      | 194560      |
| train/                  |             |
|    approx_kl            | 0.007236196 |
|    clip_fraction        | 0.0645      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.37       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 3.39e+04    |
|    n_updates            | 940         |
|    policy_gradient_loss | -0.00312    |
|    std                  | 0.785       |
|    value_loss           | 6.63e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.88e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 96          |
|    time_elapsed         | 1345        |
|    total_timesteps      | 196608      |
| train/                  |             |
|    approx_kl            | 0.009198414 |
|    clip_fraction        | 0.122       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.35       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.32e+04    |
|    n_updates            | 950         |
|    policy_gradient_loss | -0.00422    |
|    std                  | 0.782       |
|    value_loss           | 2.8e+04     |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.88e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 97          |
|    time_elapsed         | 1359        |
|    total_timesteps      | 198656      |
| train/                  |             |
|    approx_kl            | 0.011152923 |
|    clip_fraction        | 0.0958      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.35       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.34e+04    |
|    n_updates            | 960         |
|    policy_gradient_loss | -0.00434    |
|    std                  | 0.785       |
|    value_loss           | 4.03e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.89e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 98          |
|    time_elapsed         | 1373        |
|    total_timesteps      | 200704      |
| train/                  |             |
|    approx_kl            | 0.006587811 |
|    clip_fraction        | 0.0738      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.38       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 7.81e+03    |
|    n_updates            | 970         |
|    policy_gradient_loss | -0.00277    |
|    std                  | 0.799       |
|    value_loss           | 1.71e+04    |
-----------------------------------------


INFO:root:done


----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.2e+03    |
|    ep_rew_mean          | 1.9e+04    |
| time/                   |            |
|    fps                  | 146        |
|    iterations           | 99         |
|    time_elapsed         | 1387       |
|    total_timesteps      | 202752     |
| train/                  |            |
|    approx_kl            | 0.01411744 |
|    clip_fraction        | 0.0879     |
|    clip_range           | 0.2        |
|    entropy_loss         | -2.4       |
|    explained_variance   | 0          |
|    learning_rate        | 0.0003     |
|    loss                 | 4.55e+04   |
|    n_updates            | 980        |
|    policy_gradient_loss | -0.00203   |
|    std                  | 0.804      |
|    value_loss           | 7.91e+04   |
----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.9e+04     |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 100         |
|    time_elapsed         | 1401        |
|    total_timesteps      | 204800      |
| train/                  |             |
|    approx_kl            | 0.013300964 |
|    clip_fraction        | 0.139       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.39       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 3.17e+04    |
|    n_updates            | 990         |
|    policy_gradient_loss | -0.0212     |
|    std                  | 0.793       |
|    value_loss           | 6.25e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.89e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 101         |
|    time_elapsed         | 1415        |
|    total_timesteps      | 206848      |
| train/                  |             |
|    approx_kl            | 0.010988854 |
|    clip_fraction        | 0.116       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.38       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 1.79e+04    |
|    n_updates            | 1000        |
|    policy_gradient_loss | -0.000685   |
|    std                  | 0.797       |
|    value_loss           | 3.73e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.89e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 102         |
|    time_elapsed         | 1429        |
|    total_timesteps      | 208896      |
| train/                  |             |
|    approx_kl            | 0.020069811 |
|    clip_fraction        | 0.228       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.38       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 9.58e+03    |
|    n_updates            | 1010        |
|    policy_gradient_loss | 0.00113     |
|    std                  | 0.793       |
|    value_loss           | 1.88e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.9e+04     |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 103         |
|    time_elapsed         | 1442        |
|    total_timesteps      | 210944      |
| train/                  |             |
|    approx_kl            | 0.010540705 |
|    clip_fraction        | 0.141       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.38       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 1.46e+04    |
|    n_updates            | 1020        |
|    policy_gradient_loss | 0.0011      |
|    std                  | 0.796       |
|    value_loss           | 3.87e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.83e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 104         |
|    time_elapsed         | 1456        |
|    total_timesteps      | 212992      |
| train/                  |             |
|    approx_kl            | 0.009418109 |
|    clip_fraction        | 0.115       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.38       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 1.64e+04    |
|    n_updates            | 1030        |
|    policy_gradient_loss | -0.00633    |
|    std                  | 0.791       |
|    value_loss           | 3.95e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.82e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 105         |
|    time_elapsed         | 1471        |
|    total_timesteps      | 215040      |
| train/                  |             |
|    approx_kl            | 0.012258687 |
|    clip_fraction        | 0.126       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.38       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.26e+04    |
|    n_updates            | 1040        |
|    policy_gradient_loss | -0.00352    |
|    std                  | 0.8         |
|    value_loss           | 3.1e+04     |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.82e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 106         |
|    time_elapsed         | 1484        |
|    total_timesteps      | 217088      |
| train/                  |             |
|    approx_kl            | 0.012993254 |
|    clip_fraction        | 0.159       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.39       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 7.52e+03    |
|    n_updates            | 1050        |
|    policy_gradient_loss | -0.00172    |
|    std                  | 0.801       |
|    value_loss           | 1.62e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.83e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 107         |
|    time_elapsed         | 1498        |
|    total_timesteps      | 219136      |
| train/                  |             |
|    approx_kl            | 0.016626261 |
|    clip_fraction        | 0.13        |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.4        |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.26e+04    |
|    n_updates            | 1060        |
|    policy_gradient_loss | -0.00246    |
|    std                  | 0.807       |
|    value_loss           | 2.54e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.83e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 108         |
|    time_elapsed         | 1512        |
|    total_timesteps      | 221184      |
| train/                  |             |
|    approx_kl            | 0.011392436 |
|    clip_fraction        | 0.127       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.26e+04    |
|    n_updates            | 1070        |
|    policy_gradient_loss | -0.0107     |
|    std                  | 0.805       |
|    value_loss           | 2.62e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.83e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 109         |
|    time_elapsed         | 1525        |
|    total_timesteps      | 223232      |
| train/                  |             |
|    approx_kl            | 0.009496073 |
|    clip_fraction        | 0.0987      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.4        |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 1.8e+04     |
|    n_updates            | 1080        |
|    policy_gradient_loss | -0.00546    |
|    std                  | 0.8         |
|    value_loss           | 3.46e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.82e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 110         |
|    time_elapsed         | 1540        |
|    total_timesteps      | 225280      |
| train/                  |             |
|    approx_kl            | 0.012582979 |
|    clip_fraction        | 0.168       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.39       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 1.79e+04    |
|    n_updates            | 1090        |
|    policy_gradient_loss | -0.00456    |
|    std                  | 0.8         |
|    value_loss           | 3.6e+04     |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.83e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 111         |
|    time_elapsed         | 1553        |
|    total_timesteps      | 227328      |
| train/                  |             |
|    approx_kl            | 0.022164816 |
|    clip_fraction        | 0.167       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 6.02e+03    |
|    n_updates            | 1100        |
|    policy_gradient_loss | 0.00299     |
|    std                  | 0.813       |
|    value_loss           | 1.3e+04     |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.82e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 112         |
|    time_elapsed         | 1567        |
|    total_timesteps      | 229376      |
| train/                  |             |
|    approx_kl            | 0.008020125 |
|    clip_fraction        | 0.0919      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.42       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.25e+04    |
|    n_updates            | 1110        |
|    policy_gradient_loss | -0.00131    |
|    std                  | 0.808       |
|    value_loss           | 5.24e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.82e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 113         |
|    time_elapsed         | 1581        |
|    total_timesteps      | 231424      |
| train/                  |             |
|    approx_kl            | 0.007745044 |
|    clip_fraction        | 0.0853      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 1.7e+04     |
|    n_updates            | 1120        |
|    policy_gradient_loss | -0.00879    |
|    std                  | 0.808       |
|    value_loss           | 2.93e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 1.82e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 114          |
|    time_elapsed         | 1596         |
|    total_timesteps      | 233472       |
| train/                  |              |
|    approx_kl            | 0.0050633173 |
|    clip_fraction        | 0.0913       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.39        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.13e+04     |
|    n_updates            | 1130         |
|    policy_gradient_loss | 0.00214      |
|    std                  | 0.794        |
|    value_loss           | 2.24e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.82e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 115         |
|    time_elapsed         | 1610        |
|    total_timesteps      | 235520      |
| train/                  |             |
|    approx_kl            | 0.009911083 |
|    clip_fraction        | 0.113       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.37       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.08e+04    |
|    n_updates            | 1140        |
|    policy_gradient_loss | -0.00607    |
|    std                  | 0.792       |
|    value_loss           | 2.13e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.83e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 116         |
|    time_elapsed         | 1624        |
|    total_timesteps      | 237568      |
| train/                  |             |
|    approx_kl            | 0.013709651 |
|    clip_fraction        | 0.132       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.38       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.92e+04    |
|    n_updates            | 1150        |
|    policy_gradient_loss | -0.018      |
|    std                  | 0.796       |
|    value_loss           | 3.45e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.83e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 117         |
|    time_elapsed         | 1638        |
|    total_timesteps      | 239616      |
| train/                  |             |
|    approx_kl            | 0.012580525 |
|    clip_fraction        | 0.136       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.38       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 1.82e+04    |
|    n_updates            | 1160        |
|    policy_gradient_loss | 0.00117     |
|    std                  | 0.795       |
|    value_loss           | 3.49e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.84e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 118         |
|    time_elapsed         | 1652        |
|    total_timesteps      | 241664      |
| train/                  |             |
|    approx_kl            | 0.012209925 |
|    clip_fraction        | 0.141       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.38       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.32e+04    |
|    n_updates            | 1170        |
|    policy_gradient_loss | -0.00163    |
|    std                  | 0.793       |
|    value_loss           | 2.49e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.85e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 119         |
|    time_elapsed         | 1667        |
|    total_timesteps      | 243712      |
| train/                  |             |
|    approx_kl            | 0.014715998 |
|    clip_fraction        | 0.148       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.37       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.49e+04    |
|    n_updates            | 1180        |
|    policy_gradient_loss | -0.0196     |
|    std                  | 0.787       |
|    value_loss           | 3.04e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.85e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 120         |
|    time_elapsed         | 1681        |
|    total_timesteps      | 245760      |
| train/                  |             |
|    approx_kl            | 0.012587525 |
|    clip_fraction        | 0.0777      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.35       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 3.2e+04     |
|    n_updates            | 1190        |
|    policy_gradient_loss | -0.00513    |
|    std                  | 0.78        |
|    value_loss           | 6.58e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.86e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 121         |
|    time_elapsed         | 1695        |
|    total_timesteps      | 247808      |
| train/                  |             |
|    approx_kl            | 0.017470002 |
|    clip_fraction        | 0.16        |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.35       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.34e+04    |
|    n_updates            | 1200        |
|    policy_gradient_loss | 0.000161    |
|    std                  | 0.787       |
|    value_loss           | 2.82e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.87e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 122         |
|    time_elapsed         | 1710        |
|    total_timesteps      | 249856      |
| train/                  |             |
|    approx_kl            | 0.012832021 |
|    clip_fraction        | 0.123       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.35       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.17e+04    |
|    n_updates            | 1210        |
|    policy_gradient_loss | -0.000444   |
|    std                  | 0.783       |
|    value_loss           | 3.83e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.88e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 123         |
|    time_elapsed         | 1723        |
|    total_timesteps      | 251904      |
| train/                  |             |
|    approx_kl            | 0.014430864 |
|    clip_fraction        | 0.149       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.36       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.04e+04    |
|    n_updates            | 1220        |
|    policy_gradient_loss | -0.00634    |
|    std                  | 0.788       |
|    value_loss           | 1.51e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.89e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 124         |
|    time_elapsed         | 1737        |
|    total_timesteps      | 253952      |
| train/                  |             |
|    approx_kl            | 0.014055605 |
|    clip_fraction        | 0.124       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.36       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.82e+04    |
|    n_updates            | 1230        |
|    policy_gradient_loss | -0.0191     |
|    std                  | 0.785       |
|    value_loss           | 4.33e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.91e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 125         |
|    time_elapsed         | 1751        |
|    total_timesteps      | 256000      |
| train/                  |             |
|    approx_kl            | 0.016250223 |
|    clip_fraction        | 0.169       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.36       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.46e+04    |
|    n_updates            | 1240        |
|    policy_gradient_loss | -0.00511    |
|    std                  | 0.789       |
|    value_loss           | 2.91e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.94e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 126         |
|    time_elapsed         | 1765        |
|    total_timesteps      | 258048      |
| train/                  |             |
|    approx_kl            | 0.011430523 |
|    clip_fraction        | 0.108       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.35       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.07e+04    |
|    n_updates            | 1250        |
|    policy_gradient_loss | 0.000287    |
|    std                  | 0.78        |
|    value_loss           | 4.04e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.94e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 127         |
|    time_elapsed         | 1780        |
|    total_timesteps      | 260096      |
| train/                  |             |
|    approx_kl            | 0.012471996 |
|    clip_fraction        | 0.0835      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.35       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 6.54e+04    |
|    n_updates            | 1260        |
|    policy_gradient_loss | -0.00831    |
|    std                  | 0.784       |
|    value_loss           | 1.33e+05    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.95e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 128         |
|    time_elapsed         | 1794        |
|    total_timesteps      | 262144      |
| train/                  |             |
|    approx_kl            | 0.008992329 |
|    clip_fraction        | 0.0826      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.36       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 1.44e+04    |
|    n_updates            | 1270        |
|    policy_gradient_loss | -0.000448   |
|    std                  | 0.791       |
|    value_loss           | 3.41e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.96e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 129         |
|    time_elapsed         | 1808        |
|    total_timesteps      | 264192      |
| train/                  |             |
|    approx_kl            | 0.011706731 |
|    clip_fraction        | 0.13        |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.36       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.73e+04    |
|    n_updates            | 1280        |
|    policy_gradient_loss | -0.00362    |
|    std                  | 0.785       |
|    value_loss           | 5.66e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.98e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 130         |
|    time_elapsed         | 1822        |
|    total_timesteps      | 266240      |
| train/                  |             |
|    approx_kl            | 0.013437878 |
|    clip_fraction        | 0.155       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.36       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.45e+04    |
|    n_updates            | 1290        |
|    policy_gradient_loss | -0.000298   |
|    std                  | 0.788       |
|    value_loss           | 6.05e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2e+04       |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 131         |
|    time_elapsed         | 1835        |
|    total_timesteps      | 268288      |
| train/                  |             |
|    approx_kl            | 0.006905757 |
|    clip_fraction        | 0.0843      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.36       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 8.57e+04    |
|    n_updates            | 1300        |
|    policy_gradient_loss | -0.0066     |
|    std                  | 0.79        |
|    value_loss           | 1.43e+05    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.03e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 132         |
|    time_elapsed         | 1849        |
|    total_timesteps      | 270336      |
| train/                  |             |
|    approx_kl            | 0.010834164 |
|    clip_fraction        | 0.129       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.36       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.93e+04    |
|    n_updates            | 1310        |
|    policy_gradient_loss | -0.00354    |
|    std                  | 0.786       |
|    value_loss           | 4.28e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.03e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 133         |
|    time_elapsed         | 1862        |
|    total_timesteps      | 272384      |
| train/                  |             |
|    approx_kl            | 0.009356933 |
|    clip_fraction        | 0.118       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.36       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 5.64e+04    |
|    n_updates            | 1320        |
|    policy_gradient_loss | -0.000485   |
|    std                  | 0.79        |
|    value_loss           | 1.04e+05    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.04e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 134         |
|    time_elapsed         | 1876        |
|    total_timesteps      | 274432      |
| train/                  |             |
|    approx_kl            | 0.017256424 |
|    clip_fraction        | 0.203       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.37       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 1.22e+04    |
|    n_updates            | 1330        |
|    policy_gradient_loss | 0.000761    |
|    std                  | 0.79        |
|    value_loss           | 1.97e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.07e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 135         |
|    time_elapsed         | 1890        |
|    total_timesteps      | 276480      |
| train/                  |             |
|    approx_kl            | 0.016726445 |
|    clip_fraction        | 0.161       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.37       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 2.15e+04    |
|    n_updates            | 1340        |
|    policy_gradient_loss | -0.0122     |
|    std                  | 0.791       |
|    value_loss           | 4.34e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.12e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 136         |
|    time_elapsed         | 1904        |
|    total_timesteps      | 278528      |
| train/                  |             |
|    approx_kl            | 0.010385685 |
|    clip_fraction        | 0.0725      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.37       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 5.79e+04    |
|    n_updates            | 1350        |
|    policy_gradient_loss | -0.00434    |
|    std                  | 0.792       |
|    value_loss           | 1.09e+05    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.14e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 137         |
|    time_elapsed         | 1918        |
|    total_timesteps      | 280576      |
| train/                  |             |
|    approx_kl            | 0.007573339 |
|    clip_fraction        | 0.0746      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.36       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.96e+05    |
|    n_updates            | 1360        |
|    policy_gradient_loss | -0.00349    |
|    std                  | 0.787       |
|    value_loss           | 3.02e+05    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.16e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 138          |
|    time_elapsed         | 1931         |
|    total_timesteps      | 282624       |
| train/                  |              |
|    approx_kl            | 0.0070940517 |
|    clip_fraction        | 0.061        |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.37        |
|    explained_variance   | 5.96e-08     |
|    learning_rate        | 0.0003       |
|    loss                 | 5.67e+04     |
|    n_updates            | 1370         |
|    policy_gradient_loss | -0.00315     |
|    std                  | 0.793        |
|    value_loss           | 1.01e+05     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.2e+04     |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 139         |
|    time_elapsed         | 1945        |
|    total_timesteps      | 284672      |
| train/                  |             |
|    approx_kl            | 0.014831897 |
|    clip_fraction        | 0.139       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.37       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 5.4e+04     |
|    n_updates            | 1380        |
|    policy_gradient_loss | -0.0122     |
|    std                  | 0.788       |
|    value_loss           | 9.77e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.22e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 140         |
|    time_elapsed         | 1959        |
|    total_timesteps      | 286720      |
| train/                  |             |
|    approx_kl            | 0.009213081 |
|    clip_fraction        | 0.0839      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.36       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.25e+05    |
|    n_updates            | 1390        |
|    policy_gradient_loss | -0.00645    |
|    std                  | 0.791       |
|    value_loss           | 1.94e+05    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.26e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 141         |
|    time_elapsed         | 1972        |
|    total_timesteps      | 288768      |
| train/                  |             |
|    approx_kl            | 0.006149709 |
|    clip_fraction        | 0.0662      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.36       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 8e+04       |
|    n_updates            | 1400        |
|    policy_gradient_loss | -0.00861    |
|    std                  | 0.788       |
|    value_loss           | 1.55e+05    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.29e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 142         |
|    time_elapsed         | 1986        |
|    total_timesteps      | 290816      |
| train/                  |             |
|    approx_kl            | 0.006930629 |
|    clip_fraction        | 0.0487      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.36       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 5.58e+04    |
|    n_updates            | 1410        |
|    policy_gradient_loss | -0.00344    |
|    std                  | 0.788       |
|    value_loss           | 1.27e+05    |
-----------------------------------------


INFO:root:done
INFO:root:done


----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.2e+03    |
|    ep_rew_mean          | 2.32e+04   |
| time/                   |            |
|    fps                  | 146        |
|    iterations           | 143        |
|    time_elapsed         | 2001       |
|    total_timesteps      | 292864     |
| train/                  |            |
|    approx_kl            | 0.02277663 |
|    clip_fraction        | 0.25       |
|    clip_range           | 0.2        |
|    entropy_loss         | -2.36      |
|    explained_variance   | 0          |
|    learning_rate        | 0.0003     |
|    loss                 | 8.34e+04   |
|    n_updates            | 1420       |
|    policy_gradient_loss | 0.000407   |
|    std                  | 0.787      |
|    value_loss           | 1.83e+05   |
----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.32e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 144         |
|    time_elapsed         | 2015        |
|    total_timesteps      | 294912      |
| train/                  |             |
|    approx_kl            | 0.008937445 |
|    clip_fraction        | 0.0673      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.36       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.12e+05    |
|    n_updates            | 1430        |
|    policy_gradient_loss | -0.0128     |
|    std                  | 0.787       |
|    value_loss           | 2.2e+05     |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.35e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 145         |
|    time_elapsed         | 2029        |
|    total_timesteps      | 296960      |
| train/                  |             |
|    approx_kl            | 0.018521799 |
|    clip_fraction        | 0.169       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.36       |
|    explained_variance   | 1.19e-07    |
|    learning_rate        | 0.0003      |
|    loss                 | 1.56e+04    |
|    n_updates            | 1440        |
|    policy_gradient_loss | 0.00163     |
|    std                  | 0.791       |
|    value_loss           | 2.76e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.37e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 146         |
|    time_elapsed         | 2043        |
|    total_timesteps      | 299008      |
| train/                  |             |
|    approx_kl            | 0.009504773 |
|    clip_fraction        | 0.0929      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.37       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 4.66e+04    |
|    n_updates            | 1450        |
|    policy_gradient_loss | -0.0122     |
|    std                  | 0.791       |
|    value_loss           | 1.29e+05    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.39e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 147         |
|    time_elapsed         | 2057        |
|    total_timesteps      | 301056      |
| train/                  |             |
|    approx_kl            | 0.010224592 |
|    clip_fraction        | 0.0879      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.36       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 5.47e+04    |
|    n_updates            | 1460        |
|    policy_gradient_loss | -0.011      |
|    std                  | 0.786       |
|    value_loss           | 1.05e+05    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.39e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 148          |
|    time_elapsed         | 2071         |
|    total_timesteps      | 303104       |
| train/                  |              |
|    approx_kl            | 0.0090159215 |
|    clip_fraction        | 0.0808       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.35        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 3.04e+04     |
|    n_updates            | 1470         |
|    policy_gradient_loss | -0.00925     |
|    std                  | 0.784        |
|    value_loss           | 7.15e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.4e+04     |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 149         |
|    time_elapsed         | 2086        |
|    total_timesteps      | 305152      |
| train/                  |             |
|    approx_kl            | 0.012324146 |
|    clip_fraction        | 0.104       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.34       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 3.83e+04    |
|    n_updates            | 1480        |
|    policy_gradient_loss | -0.00913    |
|    std                  | 0.778       |
|    value_loss           | 6.28e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.44e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 150         |
|    time_elapsed         | 2100        |
|    total_timesteps      | 307200      |
| train/                  |             |
|    approx_kl            | 0.021044672 |
|    clip_fraction        | 0.224       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.32       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 2.7e+04     |
|    n_updates            | 1490        |
|    policy_gradient_loss | 0.00276     |
|    std                  | 0.769       |
|    value_loss           | 6.01e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.45e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 151         |
|    time_elapsed         | 2114        |
|    total_timesteps      | 309248      |
| train/                  |             |
|    approx_kl            | 0.010620867 |
|    clip_fraction        | 0.0963      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.31       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.11e+05    |
|    n_updates            | 1500        |
|    policy_gradient_loss | -0.00823    |
|    std                  | 0.768       |
|    value_loss           | 1.93e+05    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.45e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 152         |
|    time_elapsed         | 2128        |
|    total_timesteps      | 311296      |
| train/                  |             |
|    approx_kl            | 0.009820145 |
|    clip_fraction        | 0.0984      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.32       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.57e+04    |
|    n_updates            | 1510        |
|    policy_gradient_loss | -0.00385    |
|    std                  | 0.774       |
|    value_loss           | 4.87e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.47e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 153         |
|    time_elapsed         | 2141        |
|    total_timesteps      | 313344      |
| train/                  |             |
|    approx_kl            | 0.039277826 |
|    clip_fraction        | 0.188       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.32       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 4.78e+04    |
|    n_updates            | 1520        |
|    policy_gradient_loss | 0.00633     |
|    std                  | 0.772       |
|    value_loss           | 1.02e+05    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.47e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 154         |
|    time_elapsed         | 2155        |
|    total_timesteps      | 315392      |
| train/                  |             |
|    approx_kl            | 0.022092113 |
|    clip_fraction        | 0.17        |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.32       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 3.24e+04    |
|    n_updates            | 1530        |
|    policy_gradient_loss | 0.00478     |
|    std                  | 0.772       |
|    value_loss           | 5.83e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.5e+04     |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 155         |
|    time_elapsed         | 2168        |
|    total_timesteps      | 317440      |
| train/                  |             |
|    approx_kl            | 0.010579394 |
|    clip_fraction        | 0.125       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.32       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 2.14e+04    |
|    n_updates            | 1540        |
|    policy_gradient_loss | -0.0027     |
|    std                  | 0.774       |
|    value_loss           | 4.66e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.49e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 156         |
|    time_elapsed         | 2183        |
|    total_timesteps      | 319488      |
| train/                  |             |
|    approx_kl            | 0.010778338 |
|    clip_fraction        | 0.0829      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.32       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 5.97e+04    |
|    n_updates            | 1550        |
|    policy_gradient_loss | -0.00432    |
|    std                  | 0.772       |
|    value_loss           | 1.23e+05    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.49e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 157         |
|    time_elapsed         | 2197        |
|    total_timesteps      | 321536      |
| train/                  |             |
|    approx_kl            | 0.017274696 |
|    clip_fraction        | 0.183       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.33       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 8.04e+03    |
|    n_updates            | 1560        |
|    policy_gradient_loss | 0.000794    |
|    std                  | 0.783       |
|    value_loss           | 1.86e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.48e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 158         |
|    time_elapsed         | 2211        |
|    total_timesteps      | 323584      |
| train/                  |             |
|    approx_kl            | 0.034241498 |
|    clip_fraction        | 0.183       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.35       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 5.16e+03    |
|    n_updates            | 1570        |
|    policy_gradient_loss | 0.00284     |
|    std                  | 0.786       |
|    value_loss           | 1.15e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


---------------------------------------
| rollout/                |           |
|    ep_len_mean          | 1.2e+03   |
|    ep_rew_mean          | 2.48e+04  |
| time/                   |           |
|    fps                  | 146       |
|    iterations           | 159       |
|    time_elapsed         | 2225      |
|    total_timesteps      | 325632    |
| train/                  |           |
|    approx_kl            | 0.3389376 |
|    clip_fraction        | 0.471     |
|    clip_range           | 0.2       |
|    entropy_loss         | -2.43     |
|    explained_variance   | 0         |
|    learning_rate        | 0.0003    |
|    loss                 | 1.96e+03  |
|    n_updates            | 1580      |
|    policy_gradient_loss | 0.019     |
|    std                  | 0.835     |
|    value_loss           | 9.1e+03   |
---------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.48e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 160         |
|    time_elapsed         | 2239        |
|    total_timesteps      | 327680      |
| train/                  |             |
|    approx_kl            | 0.005281109 |
|    clip_fraction        | 0.0663      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.47       |
|    explained_variance   | 1.19e-07    |
|    learning_rate        | 0.0003      |
|    loss                 | 1.78e+04    |
|    n_updates            | 1590        |
|    policy_gradient_loss | -0.00419    |
|    std                  | 0.837       |
|    value_loss           | 3.84e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.48e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 161         |
|    time_elapsed         | 2253        |
|    total_timesteps      | 329728      |
| train/                  |             |
|    approx_kl            | 0.005753454 |
|    clip_fraction        | 0.085       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.47       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 4.91e+03    |
|    n_updates            | 1600        |
|    policy_gradient_loss | 0.000773    |
|    std                  | 0.835       |
|    value_loss           | 1.32e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.5e+04      |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 162          |
|    time_elapsed         | 2267         |
|    total_timesteps      | 331776       |
| train/                  |              |
|    approx_kl            | 0.0048351064 |
|    clip_fraction        | 0.0298       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.47        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 2.47e+04     |
|    n_updates            | 1610         |
|    policy_gradient_loss | -0.0025      |
|    std                  | 0.834        |
|    value_loss           | 5.31e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.51e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 163          |
|    time_elapsed         | 2280         |
|    total_timesteps      | 333824       |
| train/                  |              |
|    approx_kl            | 0.0068735047 |
|    clip_fraction        | 0.059        |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.47        |
|    explained_variance   | 1.19e-07     |
|    learning_rate        | 0.0003       |
|    loss                 | 3.23e+04     |
|    n_updates            | 1620         |
|    policy_gradient_loss | -0.00626     |
|    std                  | 0.834        |
|    value_loss           | 7.44e+04     |
------------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.51e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 164         |
|    time_elapsed         | 2294        |
|    total_timesteps      | 335872      |
| train/                  |             |
|    approx_kl            | 0.009292517 |
|    clip_fraction        | 0.0956      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.47       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 1.75e+04    |
|    n_updates            | 1630        |
|    policy_gradient_loss | -0.0124     |
|    std                  | 0.832       |
|    value_loss           | 2.73e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.52e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 165          |
|    time_elapsed         | 2308         |
|    total_timesteps      | 337920       |
| train/                  |              |
|    approx_kl            | 0.0064372486 |
|    clip_fraction        | 0.0664       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.46        |
|    explained_variance   | -1.19e-07    |
|    learning_rate        | 0.0003       |
|    loss                 | 2.31e+04     |
|    n_updates            | 1640         |
|    policy_gradient_loss | -0.0029      |
|    std                  | 0.83         |
|    value_loss           | 5.65e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.54e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 166          |
|    time_elapsed         | 2322         |
|    total_timesteps      | 339968       |
| train/                  |              |
|    approx_kl            | 0.0118397325 |
|    clip_fraction        | 0.183        |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.46        |
|    explained_variance   | -1.19e-07    |
|    learning_rate        | 0.0003       |
|    loss                 | 1.12e+04     |
|    n_updates            | 1650         |
|    policy_gradient_loss | 0.00627      |
|    std                  | 0.833        |
|    value_loss           | 1.55e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.55e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 167         |
|    time_elapsed         | 2337        |
|    total_timesteps      | 342016      |
| train/                  |             |
|    approx_kl            | 0.003156255 |
|    clip_fraction        | 0.0204      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.47       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 8.21e+04    |
|    n_updates            | 1660        |
|    policy_gradient_loss | -0.000906   |
|    std                  | 0.833       |
|    value_loss           | 1.49e+05    |
-----------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.57e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 168          |
|    time_elapsed         | 2351         |
|    total_timesteps      | 344064       |
| train/                  |              |
|    approx_kl            | 0.0041007777 |
|    clip_fraction        | 0.0239       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.47        |
|    explained_variance   | -1.19e-07    |
|    learning_rate        | 0.0003       |
|    loss                 | 4.92e+04     |
|    n_updates            | 1670         |
|    policy_gradient_loss | -0.00197     |
|    std                  | 0.832        |
|    value_loss           | 8.43e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.58e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 169          |
|    time_elapsed         | 2365         |
|    total_timesteps      | 346112       |
| train/                  |              |
|    approx_kl            | 0.0029526413 |
|    clip_fraction        | 0.0184       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.47        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 6.44e+04     |
|    n_updates            | 1680         |
|    policy_gradient_loss | -0.00202     |
|    std                  | 0.833        |
|    value_loss           | 1.13e+05     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.58e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 170         |
|    time_elapsed         | 2379        |
|    total_timesteps      | 348160      |
| train/                  |             |
|    approx_kl            | 0.007881822 |
|    clip_fraction        | 0.0965      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.46       |
|    explained_variance   | -2.38e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 9.15e+03    |
|    n_updates            | 1690        |
|    policy_gradient_loss | -0.00135    |
|    std                  | 0.823       |
|    value_loss           | 2.51e+04    |
-----------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.58e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 171          |
|    time_elapsed         | 2393         |
|    total_timesteps      | 350208       |
| train/                  |              |
|    approx_kl            | 0.0045934375 |
|    clip_fraction        | 0.0451       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.45        |
|    explained_variance   | 5.96e-08     |
|    learning_rate        | 0.0003       |
|    loss                 | 2.02e+04     |
|    n_updates            | 1700         |
|    policy_gradient_loss | 7.48e-05     |
|    std                  | 0.825        |
|    value_loss           | 4.4e+04      |
------------------------------------------


INFO:root:done
INFO:root:done


---------------------------------------
| rollout/                |           |
|    ep_len_mean          | 1.2e+03   |
|    ep_rew_mean          | 2.59e+04  |
| time/                   |           |
|    fps                  | 146       |
|    iterations           | 172       |
|    time_elapsed         | 2407      |
|    total_timesteps      | 352256    |
| train/                  |           |
|    approx_kl            | 0.0055109 |
|    clip_fraction        | 0.0672    |
|    clip_range           | 0.2       |
|    entropy_loss         | -2.44     |
|    explained_variance   | 5.96e-08  |
|    learning_rate        | 0.0003    |
|    loss                 | 1.64e+04  |
|    n_updates            | 1710      |
|    policy_gradient_loss | 0.00243   |
|    std                  | 0.821     |
|    value_loss           | 3.85e+04  |
---------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.62e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 173         |
|    time_elapsed         | 2421        |
|    total_timesteps      | 354304      |
| train/                  |             |
|    approx_kl            | 0.005828525 |
|    clip_fraction        | 0.0809      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.44       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 2.34e+04    |
|    n_updates            | 1720        |
|    policy_gradient_loss | 0.0044      |
|    std                  | 0.822       |
|    value_loss           | 3.74e+04    |
-----------------------------------------


INFO:root:done


----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.2e+03    |
|    ep_rew_mean          | 2.62e+04   |
| time/                   |            |
|    fps                  | 146        |
|    iterations           | 174        |
|    time_elapsed         | 2435       |
|    total_timesteps      | 356352     |
| train/                  |            |
|    approx_kl            | 0.00395523 |
|    clip_fraction        | 0.0248     |
|    clip_range           | 0.2        |
|    entropy_loss         | -2.44      |
|    explained_variance   | 0          |
|    learning_rate        | 0.0003     |
|    loss                 | 7.21e+04   |
|    n_updates            | 1730       |
|    policy_gradient_loss | -0.00267   |
|    std                  | 0.817      |
|    value_loss           | 1.65e+05   |
----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.63e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 175         |
|    time_elapsed         | 2449        |
|    total_timesteps      | 358400      |
| train/                  |             |
|    approx_kl            | 0.006548295 |
|    clip_fraction        | 0.0367      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.43       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 1.54e+04    |
|    n_updates            | 1740        |
|    policy_gradient_loss | -0.00366    |
|    std                  | 0.815       |
|    value_loss           | 2.5e+04     |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.63e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 176          |
|    time_elapsed         | 2463         |
|    total_timesteps      | 360448       |
| train/                  |              |
|    approx_kl            | 0.0050562853 |
|    clip_fraction        | 0.0362       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.42        |
|    explained_variance   | -1.19e-07    |
|    learning_rate        | 0.0003       |
|    loss                 | 3.59e+04     |
|    n_updates            | 1750         |
|    policy_gradient_loss | -0.00158     |
|    std                  | 0.81         |
|    value_loss           | 5.88e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.62e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 177         |
|    time_elapsed         | 2477        |
|    total_timesteps      | 362496      |
| train/                  |             |
|    approx_kl            | 0.046167284 |
|    clip_fraction        | 0.241       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.4        |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 4.45e+03    |
|    n_updates            | 1760        |
|    policy_gradient_loss | 0.00491     |
|    std                  | 0.804       |
|    value_loss           | 1.21e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.61e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 178         |
|    time_elapsed         | 2492        |
|    total_timesteps      | 364544      |
| train/                  |             |
|    approx_kl            | 0.016748011 |
|    clip_fraction        | 0.11        |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.4        |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 7.36e+03    |
|    n_updates            | 1770        |
|    policy_gradient_loss | -0.00313    |
|    std                  | 0.809       |
|    value_loss           | 1.6e+04     |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.65e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 179          |
|    time_elapsed         | 2506         |
|    total_timesteps      | 366592       |
| train/                  |              |
|    approx_kl            | 0.0056960853 |
|    clip_fraction        | 0.0494       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | -1.19e-07    |
|    learning_rate        | 0.0003       |
|    loss                 | 2.12e+04     |
|    n_updates            | 1780         |
|    policy_gradient_loss | -0.00719     |
|    std                  | 0.809        |
|    value_loss           | 4.06e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.67e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 180          |
|    time_elapsed         | 2519         |
|    total_timesteps      | 368640       |
| train/                  |              |
|    approx_kl            | 0.0038355822 |
|    clip_fraction        | 0.017        |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.16e+05     |
|    n_updates            | 1790         |
|    policy_gradient_loss | -0.00269     |
|    std                  | 0.81         |
|    value_loss           | 2.43e+05     |
------------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.71e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 181         |
|    time_elapsed         | 2534        |
|    total_timesteps      | 370688      |
| train/                  |             |
|    approx_kl            | 0.004950725 |
|    clip_fraction        | 0.0298      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 3.29e+04    |
|    n_updates            | 1800        |
|    policy_gradient_loss | -0.00428    |
|    std                  | 0.808       |
|    value_loss           | 9.81e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.69e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 182          |
|    time_elapsed         | 2548         |
|    total_timesteps      | 372736       |
| train/                  |              |
|    approx_kl            | 0.0062711835 |
|    clip_fraction        | 0.0457       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.4         |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 9.28e+04     |
|    n_updates            | 1810         |
|    policy_gradient_loss | -0.00529     |
|    std                  | 0.804        |
|    value_loss           | 2.42e+05     |
------------------------------------------


INFO:root:done
INFO:root:done


----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.2e+03    |
|    ep_rew_mean          | 2.72e+04   |
| time/                   |            |
|    fps                  | 146        |
|    iterations           | 183        |
|    time_elapsed         | 2562       |
|    total_timesteps      | 374784     |
| train/                  |            |
|    approx_kl            | 0.03769949 |
|    clip_fraction        | 0.276      |
|    clip_range           | 0.2        |
|    entropy_loss         | -2.39      |
|    explained_variance   | -1.19e-07  |
|    learning_rate        | 0.0003     |
|    loss                 | 4.11e+03   |
|    n_updates            | 1820       |
|    policy_gradient_loss | 0.017      |
|    std                  | 0.803      |
|    value_loss           | 1.27e+04   |
----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.71e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 184          |
|    time_elapsed         | 2577         |
|    total_timesteps      | 376832       |
| train/                  |              |
|    approx_kl            | 0.0017561743 |
|    clip_fraction        | 0.0173       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.4         |
|    explained_variance   | -1.19e-07    |
|    learning_rate        | 0.0003       |
|    loss                 | 1.12e+05     |
|    n_updates            | 1830         |
|    policy_gradient_loss | -0.0024      |
|    std                  | 0.804        |
|    value_loss           | 2.6e+05      |
------------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.72e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 185         |
|    time_elapsed         | 2591        |
|    total_timesteps      | 378880      |
| train/                  |             |
|    approx_kl            | 0.112695605 |
|    clip_fraction        | 0.332       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 2.72e+03    |
|    n_updates            | 1840        |
|    policy_gradient_loss | 0.0256      |
|    std                  | 0.814       |
|    value_loss           | 1.46e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.71e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 186          |
|    time_elapsed         | 2605         |
|    total_timesteps      | 380928       |
| train/                  |              |
|    approx_kl            | 0.0053791683 |
|    clip_fraction        | 0.0456       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.42        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 6.82e+04     |
|    n_updates            | 1850         |
|    policy_gradient_loss | -0.00408     |
|    std                  | 0.814        |
|    value_loss           | 1.39e+05     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.7e+04     |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 187         |
|    time_elapsed         | 2619        |
|    total_timesteps      | 382976      |
| train/                  |             |
|    approx_kl            | 0.010274031 |
|    clip_fraction        | 0.294       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.42       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 3.92e+03    |
|    n_updates            | 1860        |
|    policy_gradient_loss | 0.0151      |
|    std                  | 0.809       |
|    value_loss           | 1.58e+04    |
-----------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.7e+04      |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 188          |
|    time_elapsed         | 2633         |
|    total_timesteps      | 385024       |
| train/                  |              |
|    approx_kl            | 0.0063446662 |
|    clip_fraction        | 0.0343       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 2.59e+04     |
|    n_updates            | 1870         |
|    policy_gradient_loss | -0.00318     |
|    std                  | 0.808        |
|    value_loss           | 5.11e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.69e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 189         |
|    time_elapsed         | 2647        |
|    total_timesteps      | 387072      |
| train/                  |             |
|    approx_kl            | 0.001311849 |
|    clip_fraction        | 0.00337     |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.88e+04    |
|    n_updates            | 1880        |
|    policy_gradient_loss | -0.0015     |
|    std                  | 0.808       |
|    value_loss           | 6.04e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.7e+04      |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 190          |
|    time_elapsed         | 2661         |
|    total_timesteps      | 389120       |
| train/                  |              |
|    approx_kl            | 0.0020473837 |
|    clip_fraction        | 0.00845      |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 2.45e+04     |
|    n_updates            | 1890         |
|    policy_gradient_loss | -0.000309    |
|    std                  | 0.808        |
|    value_loss           | 3.35e+04     |
------------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.68e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 191          |
|    time_elapsed         | 2675         |
|    total_timesteps      | 391168       |
| train/                  |              |
|    approx_kl            | 0.0038499257 |
|    clip_fraction        | 0.0162       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | -1.19e-07    |
|    learning_rate        | 0.0003       |
|    loss                 | 6.08e+04     |
|    n_updates            | 1900         |
|    policy_gradient_loss | -0.00169     |
|    std                  | 0.809        |
|    value_loss           | 1.22e+05     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.68e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 192          |
|    time_elapsed         | 2689         |
|    total_timesteps      | 393216       |
| train/                  |              |
|    approx_kl            | 0.0040635746 |
|    clip_fraction        | 0.0566       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.4         |
|    explained_variance   | -1.19e-07    |
|    learning_rate        | 0.0003       |
|    loss                 | 749          |
|    n_updates            | 1910         |
|    policy_gradient_loss | 0.00125      |
|    std                  | 0.8          |
|    value_loss           | 6.02e+03     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.69e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 193          |
|    time_elapsed         | 2703         |
|    total_timesteps      | 395264       |
| train/                  |              |
|    approx_kl            | 0.0049852952 |
|    clip_fraction        | 0.0297       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.39        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 4.81e+04     |
|    n_updates            | 1920         |
|    policy_gradient_loss | -0.00322     |
|    std                  | 0.798        |
|    value_loss           | 8.63e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.64e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 194          |
|    time_elapsed         | 2717         |
|    total_timesteps      | 397312       |
| train/                  |              |
|    approx_kl            | 0.0051691593 |
|    clip_fraction        | 0.0332       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.38        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.07e+05     |
|    n_updates            | 1930         |
|    policy_gradient_loss | -0.00202     |
|    std                  | 0.797        |
|    value_loss           | 2.04e+05     |
------------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.65e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 195         |
|    time_elapsed         | 2730        |
|    total_timesteps      | 399360      |
| train/                  |             |
|    approx_kl            | 0.029682703 |
|    clip_fraction        | 0.232       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.39       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 3.45e+03    |
|    n_updates            | 1940        |
|    policy_gradient_loss | 0.00683     |
|    std                  | 0.802       |
|    value_loss           | 1.23e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.65e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 196          |
|    time_elapsed         | 2745         |
|    total_timesteps      | 401408       |
| train/                  |              |
|    approx_kl            | 0.0015565101 |
|    clip_fraction        | 0.000586     |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.39        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.25e+05     |
|    n_updates            | 1950         |
|    policy_gradient_loss | -0.000973    |
|    std                  | 0.803        |
|    value_loss           | 2.14e+05     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.61e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 197          |
|    time_elapsed         | 2759         |
|    total_timesteps      | 403456       |
| train/                  |              |
|    approx_kl            | 0.0031888187 |
|    clip_fraction        | 0.0339       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.39        |
|    explained_variance   | -1.19e-07    |
|    learning_rate        | 0.0003       |
|    loss                 | 3.59e+04     |
|    n_updates            | 1960         |
|    policy_gradient_loss | -0.00151     |
|    std                  | 0.799        |
|    value_loss           | 7.24e+04     |
------------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.58e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 198          |
|    time_elapsed         | 2773         |
|    total_timesteps      | 405504       |
| train/                  |              |
|    approx_kl            | 0.0026603849 |
|    clip_fraction        | 0.0128       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.38        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.31e+04     |
|    n_updates            | 1970         |
|    policy_gradient_loss | -0.00043     |
|    std                  | 0.799        |
|    value_loss           | 1.3e+04      |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.54e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 199         |
|    time_elapsed         | 2786        |
|    total_timesteps      | 407552      |
| train/                  |             |
|    approx_kl            | 0.010369105 |
|    clip_fraction        | 0.222       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.39       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 1.18e+04    |
|    n_updates            | 1980        |
|    policy_gradient_loss | 0.00338     |
|    std                  | 0.811       |
|    value_loss           | 6.25e+03    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.52e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 200          |
|    time_elapsed         | 2800         |
|    total_timesteps      | 409600       |
| train/                  |              |
|    approx_kl            | 0.0053892815 |
|    clip_fraction        | 0.0947       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 9.45e+03     |
|    n_updates            | 1990         |
|    policy_gradient_loss | -0.00246     |
|    std                  | 0.809        |
|    value_loss           | 2.89e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.51e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 201          |
|    time_elapsed         | 2814         |
|    total_timesteps      | 411648       |
| train/                  |              |
|    approx_kl            | 0.0005793912 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | 1.19e-07     |
|    learning_rate        | 0.0003       |
|    loss                 | 3.87e+04     |
|    n_updates            | 2000         |
|    policy_gradient_loss | -0.00027     |
|    std                  | 0.809        |
|    value_loss           | 7.86e+04     |
------------------------------------------


INFO:root:done


-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.2e+03       |
|    ep_rew_mean          | 2.49e+04      |
| time/                   |               |
|    fps                  | 146           |
|    iterations           | 202           |
|    time_elapsed         | 2828          |
|    total_timesteps      | 413696        |
| train/                  |               |
|    approx_kl            | 0.00032858778 |
|    clip_fraction        | 9.77e-05      |
|    clip_range           | 0.2           |
|    entropy_loss         | -2.41         |
|    explained_variance   | 0             |
|    learning_rate        | 0.0003        |
|    loss                 | 3.17e+04      |
|    n_updates            | 2010          |
|    policy_gradient_loss | -0.000896     |
|    std                  | 0.809         |
|    value_loss           | 7.33e+04      |
-------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.49e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 203          |
|    time_elapsed         | 2842         |
|    total_timesteps      | 415744       |
| train/                  |              |
|    approx_kl            | 0.0017202175 |
|    clip_fraction        | 0.00449      |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | -2.38e-07    |
|    learning_rate        | 0.0003       |
|    loss                 | 1.14e+04     |
|    n_updates            | 2020         |
|    policy_gradient_loss | -0.000631    |
|    std                  | 0.81         |
|    value_loss           | 2.05e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.45e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 204         |
|    time_elapsed         | 2856        |
|    total_timesteps      | 417792      |
| train/                  |             |
|    approx_kl            | 0.046429716 |
|    clip_fraction        | 0.167       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.4        |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 1.88e+04    |
|    n_updates            | 2030        |
|    policy_gradient_loss | 0.00882     |
|    std                  | 0.804       |
|    value_loss           | 3.4e+04     |
-----------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.44e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 205          |
|    time_elapsed         | 2870         |
|    total_timesteps      | 419840       |
| train/                  |              |
|    approx_kl            | 0.0034502659 |
|    clip_fraction        | 0.109        |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.39        |
|    explained_variance   | 5.96e-08     |
|    learning_rate        | 0.0003       |
|    loss                 | 9.04e+03     |
|    n_updates            | 2040         |
|    policy_gradient_loss | 0.00265      |
|    std                  | 0.797        |
|    value_loss           | 1.39e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.46e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 206          |
|    time_elapsed         | 2883         |
|    total_timesteps      | 421888       |
| train/                  |              |
|    approx_kl            | 0.0037220747 |
|    clip_fraction        | 0.0311       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.38        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 2.32e+04     |
|    n_updates            | 2050         |
|    policy_gradient_loss | -0.00105     |
|    std                  | 0.796        |
|    value_loss           | 5.83e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.44e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 207          |
|    time_elapsed         | 2897         |
|    total_timesteps      | 423936       |
| train/                  |              |
|    approx_kl            | 0.0004281234 |
|    clip_fraction        | 0.000293     |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.38        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 3.34e+04     |
|    n_updates            | 2060         |
|    policy_gradient_loss | -0.000554    |
|    std                  | 0.796        |
|    value_loss           | 9.22e+04     |
------------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.43e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 208         |
|    time_elapsed         | 2911        |
|    total_timesteps      | 425984      |
| train/                  |             |
|    approx_kl            | 0.028351426 |
|    clip_fraction        | 0.161       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.39       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 7.21e+03    |
|    n_updates            | 2070        |
|    policy_gradient_loss | 0.00645     |
|    std                  | 0.804       |
|    value_loss           | 1.54e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.2e+03       |
|    ep_rew_mean          | 2.41e+04      |
| time/                   |               |
|    fps                  | 146           |
|    iterations           | 209           |
|    time_elapsed         | 2926          |
|    total_timesteps      | 428032        |
| train/                  |               |
|    approx_kl            | 0.00055873254 |
|    clip_fraction        | 0.00405       |
|    clip_range           | 0.2           |
|    entropy_loss         | -2.4          |
|    explained_variance   | 5.96e-08      |
|    learning_rate        | 0.0003        |
|    loss                 | 5.4e+04       |
|    n_updates            | 2080          |
|    policy_gradient_loss | 0.000205      |
|    std                  | 0.804         |
|    value_loss           | 9.32e+04      |
-------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.41e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 210          |
|    time_elapsed         | 2940         |
|    total_timesteps      | 430080       |
| train/                  |              |
|    approx_kl            | 0.0024209775 |
|    clip_fraction        | 0.00566      |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.4         |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 5.19e+03     |
|    n_updates            | 2090         |
|    policy_gradient_loss | -0.000807    |
|    std                  | 0.804        |
|    value_loss           | 1.16e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.2e+03       |
|    ep_rew_mean          | 2.37e+04      |
| time/                   |               |
|    fps                  | 146           |
|    iterations           | 211           |
|    time_elapsed         | 2953          |
|    total_timesteps      | 432128        |
| train/                  |               |
|    approx_kl            | 0.00040300813 |
|    clip_fraction        | 0.00166       |
|    clip_range           | 0.2           |
|    entropy_loss         | -2.4          |
|    explained_variance   | 0             |
|    learning_rate        | 0.0003        |
|    loss                 | 2.68e+04      |
|    n_updates            | 2100          |
|    policy_gradient_loss | -0.00108      |
|    std                  | 0.804         |
|    value_loss           | 6.24e+04      |
-------------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.36e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 212         |
|    time_elapsed         | 2967        |
|    total_timesteps      | 434176      |
| train/                  |             |
|    approx_kl            | 0.015826616 |
|    clip_fraction        | 0.182       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 246         |
|    n_updates            | 2110        |
|    policy_gradient_loss | 0.00561     |
|    std                  | 0.808       |
|    value_loss           | 1.35e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.36e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 213         |
|    time_elapsed         | 2981        |
|    total_timesteps      | 436224      |
| train/                  |             |
|    approx_kl            | 0.012660749 |
|    clip_fraction        | 0.101       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 2.59e+03    |
|    n_updates            | 2120        |
|    policy_gradient_loss | 0.000261    |
|    std                  | 0.811       |
|    value_loss           | 1.27e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.34e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 214          |
|    time_elapsed         | 2995         |
|    total_timesteps      | 438272       |
| train/                  |              |
|    approx_kl            | 0.0036898132 |
|    clip_fraction        | 0.00488      |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.42        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.2e+04      |
|    n_updates            | 2130         |
|    policy_gradient_loss | -0.00151     |
|    std                  | 0.812        |
|    value_loss           | 2.93e+04     |
------------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.33e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 215          |
|    time_elapsed         | 3009         |
|    total_timesteps      | 440320       |
| train/                  |              |
|    approx_kl            | 0.0035534608 |
|    clip_fraction        | 0.0886       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | 5.96e-08     |
|    learning_rate        | 0.0003       |
|    loss                 | 3.25e+03     |
|    n_updates            | 2140         |
|    policy_gradient_loss | 0.0017       |
|    std                  | 0.807        |
|    value_loss           | 1.61e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.34e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 216         |
|    time_elapsed         | 3023        |
|    total_timesteps      | 442368      |
| train/                  |             |
|    approx_kl            | 0.012538008 |
|    clip_fraction        | 0.15        |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.4        |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 3.45e+03    |
|    n_updates            | 2150        |
|    policy_gradient_loss | 9.65e-05    |
|    std                  | 0.809       |
|    value_loss           | 7.32e+03    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.35e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 217          |
|    time_elapsed         | 3037         |
|    total_timesteps      | 444416       |
| train/                  |              |
|    approx_kl            | 0.0019840915 |
|    clip_fraction        | 0.0177       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | -0.000356    |
|    learning_rate        | 0.0003       |
|    loss                 | 2.69e+04     |
|    n_updates            | 2160         |
|    policy_gradient_loss | -0.000967    |
|    std                  | 0.809        |
|    value_loss           | 3.04e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.35e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 218         |
|    time_elapsed         | 3051        |
|    total_timesteps      | 446464      |
| train/                  |             |
|    approx_kl            | 0.001042171 |
|    clip_fraction        | 0.000781    |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.1e+04     |
|    n_updates            | 2170        |
|    policy_gradient_loss | -0.00139    |
|    std                  | 0.809       |
|    value_loss           | 3.16e+04    |
-----------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.35e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 219          |
|    time_elapsed         | 3065         |
|    total_timesteps      | 448512       |
| train/                  |              |
|    approx_kl            | 0.0033211915 |
|    clip_fraction        | 0.0119       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | -1.19e-07    |
|    learning_rate        | 0.0003       |
|    loss                 | 1.18e+04     |
|    n_updates            | 2180         |
|    policy_gradient_loss | -0.00112     |
|    std                  | 0.81         |
|    value_loss           | 1.92e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.33e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 220         |
|    time_elapsed         | 3080        |
|    total_timesteps      | 450560      |
| train/                  |             |
|    approx_kl            | 0.003660666 |
|    clip_fraction        | 0.0357      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 4.07e+03    |
|    n_updates            | 2190        |
|    policy_gradient_loss | -1.56e-05   |
|    std                  | 0.809       |
|    value_loss           | 1.39e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.33e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 221          |
|    time_elapsed         | 3094         |
|    total_timesteps      | 452608       |
| train/                  |              |
|    approx_kl            | 0.0108067915 |
|    clip_fraction        | 0.129        |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.4         |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.08e+04     |
|    n_updates            | 2200         |
|    policy_gradient_loss | 0.00199      |
|    std                  | 0.806        |
|    value_loss           | 1.67e+04     |
------------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.33e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 222          |
|    time_elapsed         | 3108         |
|    total_timesteps      | 454656       |
| train/                  |              |
|    approx_kl            | 0.0047326735 |
|    clip_fraction        | 0.0202       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.4         |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 9.75e+03     |
|    n_updates            | 2210         |
|    policy_gradient_loss | -0.00268     |
|    std                  | 0.807        |
|    value_loss           | 2.33e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.33e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 223          |
|    time_elapsed         | 3122         |
|    total_timesteps      | 456704       |
| train/                  |              |
|    approx_kl            | 0.0014149009 |
|    clip_fraction        | 0.00132      |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.4         |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.72e+04     |
|    n_updates            | 2220         |
|    policy_gradient_loss | -0.00202     |
|    std                  | 0.807        |
|    value_loss           | 3.66e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.34e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 224          |
|    time_elapsed         | 3136         |
|    total_timesteps      | 458752       |
| train/                  |              |
|    approx_kl            | 0.0013034248 |
|    clip_fraction        | 0.0357       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | 5.96e-08     |
|    learning_rate        | 0.0003       |
|    loss                 | 2.16e+04     |
|    n_updates            | 2230         |
|    policy_gradient_loss | 0.00152      |
|    std                  | 0.807        |
|    value_loss           | 2.69e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.32e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 225          |
|    time_elapsed         | 3150         |
|    total_timesteps      | 460800       |
| train/                  |              |
|    approx_kl            | 0.0039016686 |
|    clip_fraction        | 0.00903      |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.4         |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.09e+04     |
|    n_updates            | 2240         |
|    policy_gradient_loss | -0.00199     |
|    std                  | 0.807        |
|    value_loss           | 3.81e+04     |
------------------------------------------


INFO:root:done


---------------------------------------
| rollout/                |           |
|    ep_len_mean          | 1.2e+03   |
|    ep_rew_mean          | 2.32e+04  |
| time/                   |           |
|    fps                  | 146       |
|    iterations           | 226       |
|    time_elapsed         | 3165      |
|    total_timesteps      | 462848    |
| train/                  |           |
|    approx_kl            | 0.0084801 |
|    clip_fraction        | 0.13      |
|    clip_range           | 0.2       |
|    entropy_loss         | -2.4      |
|    explained_variance   | 1.19e-07  |
|    learning_rate        | 0.0003    |
|    loss                 | 6e+03     |
|    n_updates            | 2250      |
|    policy_gradient_loss | 0.00199   |
|    std                  | 0.808     |
|    value_loss           | 2.17e+04  |
---------------------------------------


INFO:root:done
INFO:root:done


-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.2e+03       |
|    ep_rew_mean          | 2.31e+04      |
| time/                   |               |
|    fps                  | 146           |
|    iterations           | 227           |
|    time_elapsed         | 3179          |
|    total_timesteps      | 464896        |
| train/                  |               |
|    approx_kl            | 0.00023483767 |
|    clip_fraction        | 0.000146      |
|    clip_range           | 0.2           |
|    entropy_loss         | -2.41         |
|    explained_variance   | 0             |
|    learning_rate        | 0.0003        |
|    loss                 | 2.13e+04      |
|    n_updates            | 2260          |
|    policy_gradient_loss | -0.000311     |
|    std                  | 0.808         |
|    value_loss           | 4.64e+04      |
-------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.32e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 228         |
|    time_elapsed         | 3194        |
|    total_timesteps      | 466944      |
| train/                  |             |
|    approx_kl            | 0.003948936 |
|    clip_fraction        | 0.0161      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 1.05e+04    |
|    n_updates            | 2270        |
|    policy_gradient_loss | -0.00127    |
|    std                  | 0.808       |
|    value_loss           | 2.96e+04    |
-----------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.32e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 229          |
|    time_elapsed         | 3207         |
|    total_timesteps      | 468992       |
| train/                  |              |
|    approx_kl            | 0.0038660553 |
|    clip_fraction        | 0.0431       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.15e+04     |
|    n_updates            | 2280         |
|    policy_gradient_loss | 0.000561     |
|    std                  | 0.812        |
|    value_loss           | 2.38e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.32e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 230          |
|    time_elapsed         | 3222         |
|    total_timesteps      | 471040       |
| train/                  |              |
|    approx_kl            | 0.0028741036 |
|    clip_fraction        | 0.00298      |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.42        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.35e+04     |
|    n_updates            | 2290         |
|    policy_gradient_loss | -0.000437    |
|    std                  | 0.813        |
|    value_loss           | 3.84e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.33e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 231          |
|    time_elapsed         | 3236         |
|    total_timesteps      | 473088       |
| train/                  |              |
|    approx_kl            | 0.0040713735 |
|    clip_fraction        | 0.018        |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.42        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.46e+04     |
|    n_updates            | 2300         |
|    policy_gradient_loss | -0.00247     |
|    std                  | 0.811        |
|    value_loss           | 4.17e+04     |
------------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.33e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 232         |
|    time_elapsed         | 3249        |
|    total_timesteps      | 475136      |
| train/                  |             |
|    approx_kl            | 0.003803351 |
|    clip_fraction        | 0.0143      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.13e+04    |
|    n_updates            | 2310        |
|    policy_gradient_loss | -0.00162    |
|    std                  | 0.81        |
|    value_loss           | 5.85e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.35e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 233         |
|    time_elapsed         | 3264        |
|    total_timesteps      | 477184      |
| train/                  |             |
|    approx_kl            | 0.003550175 |
|    clip_fraction        | 0.00645     |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 3.27e+04    |
|    n_updates            | 2320        |
|    policy_gradient_loss | -0.00135    |
|    std                  | 0.808       |
|    value_loss           | 9.78e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.35e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 234         |
|    time_elapsed         | 3278        |
|    total_timesteps      | 479232      |
| train/                  |             |
|    approx_kl            | 0.004422415 |
|    clip_fraction        | 0.0224      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.78e+04    |
|    n_updates            | 2330        |
|    policy_gradient_loss | -0.00225    |
|    std                  | 0.81        |
|    value_loss           | 4.07e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.38e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 235         |
|    time_elapsed         | 3292        |
|    total_timesteps      | 481280      |
| train/                  |             |
|    approx_kl            | 0.005243501 |
|    clip_fraction        | 0.0271      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 2.62e+04    |
|    n_updates            | 2340        |
|    policy_gradient_loss | -0.00261    |
|    std                  | 0.808       |
|    value_loss           | 6.23e+04    |
-----------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.38e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 236          |
|    time_elapsed         | 3307         |
|    total_timesteps      | 483328       |
| train/                  |              |
|    approx_kl            | 0.0031656963 |
|    clip_fraction        | 0.00898      |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.4         |
|    explained_variance   | -1.19e-07    |
|    learning_rate        | 0.0003       |
|    loss                 | 3.83e+04     |
|    n_updates            | 2350         |
|    policy_gradient_loss | -0.00145     |
|    std                  | 0.805        |
|    value_loss           | 8.18e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.2e+03    |
|    ep_rew_mean          | 2.38e+04   |
| time/                   |            |
|    fps                  | 146        |
|    iterations           | 237        |
|    time_elapsed         | 3321       |
|    total_timesteps      | 485376     |
| train/                  |            |
|    approx_kl            | 0.02401856 |
|    clip_fraction        | 0.148      |
|    clip_range           | 0.2        |
|    entropy_loss         | -2.4       |
|    explained_variance   | 0          |
|    learning_rate        | 0.0003     |
|    loss                 | 4.8e+03    |
|    n_updates            | 2360       |
|    policy_gradient_loss | 0.00311    |
|    std                  | 0.807      |
|    value_loss           | 1.74e+04   |
----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.34e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 238          |
|    time_elapsed         | 3335         |
|    total_timesteps      | 487424       |
| train/                  |              |
|    approx_kl            | 0.0060438355 |
|    clip_fraction        | 0.0741       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.06e+04     |
|    n_updates            | 2370         |
|    policy_gradient_loss | -0.00169     |
|    std                  | 0.807        |
|    value_loss           | 3.13e+04     |
------------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.33e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 239         |
|    time_elapsed         | 3349        |
|    total_timesteps      | 489472      |
| train/                  |             |
|    approx_kl            | 0.018512787 |
|    clip_fraction        | 0.191       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.81e+03    |
|    n_updates            | 2380        |
|    policy_gradient_loss | 0.00743     |
|    std                  | 0.81        |
|    value_loss           | 1.83e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.3e+04      |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 240          |
|    time_elapsed         | 3363         |
|    total_timesteps      | 491520       |
| train/                  |              |
|    approx_kl            | 0.0036351169 |
|    clip_fraction        | 0.00693      |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.18e+04     |
|    n_updates            | 2390         |
|    policy_gradient_loss | 0.000194     |
|    std                  | 0.811        |
|    value_loss           | 1.35e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.29e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 241          |
|    time_elapsed         | 3378         |
|    total_timesteps      | 493568       |
| train/                  |              |
|    approx_kl            | 0.0012722991 |
|    clip_fraction        | 0.0724       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.42        |
|    explained_variance   | -2.38e-07    |
|    learning_rate        | 0.0003       |
|    loss                 | 4.58e+03     |
|    n_updates            | 2400         |
|    policy_gradient_loss | 0.00193      |
|    std                  | 0.821        |
|    value_loss           | 1.83e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.26e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 242         |
|    time_elapsed         | 3391        |
|    total_timesteps      | 495616      |
| train/                  |             |
|    approx_kl            | 0.007410402 |
|    clip_fraction        | 0.127       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.44       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.23e+04    |
|    n_updates            | 2410        |
|    policy_gradient_loss | -8.05e-05   |
|    std                  | 0.82        |
|    value_loss           | 1.77e+04    |
-----------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.26e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 243          |
|    time_elapsed         | 3406         |
|    total_timesteps      | 497664       |
| train/                  |              |
|    approx_kl            | 0.0041202432 |
|    clip_fraction        | 0.0963       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.43        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 2.45e+03     |
|    n_updates            | 2420         |
|    policy_gradient_loss | 0.00295      |
|    std                  | 0.816        |
|    value_loss           | 1.72e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.24e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 244          |
|    time_elapsed         | 3419         |
|    total_timesteps      | 499712       |
| train/                  |              |
|    approx_kl            | 0.0060717333 |
|    clip_fraction        | 0.0815       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.42        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.66e+03     |
|    n_updates            | 2430         |
|    policy_gradient_loss | 0.00202      |
|    std                  | 0.809        |
|    value_loss           | 1.02e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.23e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 245         |
|    time_elapsed         | 3433        |
|    total_timesteps      | 501760      |
| train/                  |             |
|    approx_kl            | 0.009494521 |
|    clip_fraction        | 0.0968      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | -1.67e-06   |
|    learning_rate        | 0.0003      |
|    loss                 | 1.33e+04    |
|    n_updates            | 2440        |
|    policy_gradient_loss | 0.00231     |
|    std                  | 0.808       |
|    value_loss           | 2.07e+04    |
-----------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.23e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 246          |
|    time_elapsed         | 3447         |
|    total_timesteps      | 503808       |
| train/                  |              |
|    approx_kl            | 0.0074363374 |
|    clip_fraction        | 0.113        |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | 1.19e-07     |
|    learning_rate        | 0.0003       |
|    loss                 | 4.9e+03      |
|    n_updates            | 2450         |
|    policy_gradient_loss | -0.00458     |
|    std                  | 0.809        |
|    value_loss           | 1.94e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.2e+03       |
|    ep_rew_mean          | 2.22e+04      |
| time/                   |               |
|    fps                  | 146           |
|    iterations           | 247           |
|    time_elapsed         | 3462          |
|    total_timesteps      | 505856        |
| train/                  |               |
|    approx_kl            | 0.00016550135 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -2.41         |
|    explained_variance   | 0.0293        |
|    learning_rate        | 0.0003        |
|    loss                 | 1.98e+03      |
|    n_updates            | 2460          |
|    policy_gradient_loss | -0.000727     |
|    std                  | 0.809         |
|    value_loss           | 1.2e+04       |
-------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.22e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 248          |
|    time_elapsed         | 3476         |
|    total_timesteps      | 507904       |
| train/                  |              |
|    approx_kl            | 7.399553e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | 0.00365      |
|    learning_rate        | 0.0003       |
|    loss                 | 3.81e+03     |
|    n_updates            | 2470         |
|    policy_gradient_loss | -0.00032     |
|    std                  | 0.809        |
|    value_loss           | 1.85e+04     |
------------------------------------------


INFO:root:done


-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.2e+03       |
|    ep_rew_mean          | 2.2e+04       |
| time/                   |               |
|    fps                  | 146           |
|    iterations           | 249           |
|    time_elapsed         | 3491          |
|    total_timesteps      | 509952        |
| train/                  |               |
|    approx_kl            | 3.3023127e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -2.41         |
|    explained_variance   | 0.0456        |
|    learning_rate        | 0.0003        |
|    loss                 | 5.78e+03      |
|    n_updates            | 2480          |
|    policy_gradient_loss | -0.000183     |
|    std                  | 0.809         |
|    value_loss           | 1.76e+04      |
-------------------------------------------


INFO:root:done
INFO:root:done


-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.2e+03       |
|    ep_rew_mean          | 2.2e+04       |
| time/                   |               |
|    fps                  | 146           |
|    iterations           | 250           |
|    time_elapsed         | 3506          |
|    total_timesteps      | 512000        |
| train/                  |               |
|    approx_kl            | 0.00059629336 |
|    clip_fraction        | 0.000195      |
|    clip_range           | 0.2           |
|    entropy_loss         | -2.41         |
|    explained_variance   | 0.0449        |
|    learning_rate        | 0.0003        |
|    loss                 | 2.57e+03      |
|    n_updates            | 2490          |
|    policy_gradient_loss | -0.00111      |
|    std                  | 0.809         |
|    value_loss           | 1.22e+04      |
-------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.16e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 251          |
|    time_elapsed         | 3519         |
|    total_timesteps      | 514048       |
| train/                  |              |
|    approx_kl            | 0.0009990113 |
|    clip_fraction        | 0.000586     |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | -0.0359      |
|    learning_rate        | 0.0003       |
|    loss                 | 812          |
|    n_updates            | 2500         |
|    policy_gradient_loss | -0.00156     |
|    std                  | 0.809        |
|    value_loss           | 1.52e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.17e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 252          |
|    time_elapsed         | 3533         |
|    total_timesteps      | 516096       |
| train/                  |              |
|    approx_kl            | 0.0003530182 |
|    clip_fraction        | 4.88e-05     |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | 0.0463       |
|    learning_rate        | 0.0003       |
|    loss                 | 892          |
|    n_updates            | 2510         |
|    policy_gradient_loss | -0.000284    |
|    std                  | 0.809        |
|    value_loss           | 1.64e+04     |
------------------------------------------


INFO:root:done


-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.2e+03       |
|    ep_rew_mean          | 2.18e+04      |
| time/                   |               |
|    fps                  | 146           |
|    iterations           | 253           |
|    time_elapsed         | 3547          |
|    total_timesteps      | 518144        |
| train/                  |               |
|    approx_kl            | 0.00089185615 |
|    clip_fraction        | 0.000879      |
|    clip_range           | 0.2           |
|    entropy_loss         | -2.41         |
|    explained_variance   | 0.103         |
|    learning_rate        | 0.0003        |
|    loss                 | 2.46e+03      |
|    n_updates            | 2520          |
|    policy_gradient_loss | -0.000789     |
|    std                  | 0.809         |
|    value_loss           | 1.8e+04       |
-------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.13e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 254          |
|    time_elapsed         | 3561         |
|    total_timesteps      | 520192       |
| train/                  |              |
|    approx_kl            | 0.0028053296 |
|    clip_fraction        | 0.00186      |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | 0.368        |
|    learning_rate        | 0.0003       |
|    loss                 | 9.63e+03     |
|    n_updates            | 2530         |
|    policy_gradient_loss | -0.000788    |
|    std                  | 0.81         |
|    value_loss           | 1.33e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.14e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 255          |
|    time_elapsed         | 3575         |
|    total_timesteps      | 522240       |
| train/                  |              |
|    approx_kl            | 0.0039466303 |
|    clip_fraction        | 0.0203       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | -0.0361      |
|    learning_rate        | 0.0003       |
|    loss                 | 2.19e+03     |
|    n_updates            | 2540         |
|    policy_gradient_loss | 0.000274     |
|    std                  | 0.809        |
|    value_loss           | 1.9e+04      |
------------------------------------------


INFO:root:done


-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.2e+03       |
|    ep_rew_mean          | 2.15e+04      |
| time/                   |               |
|    fps                  | 146           |
|    iterations           | 256           |
|    time_elapsed         | 3589          |
|    total_timesteps      | 524288        |
| train/                  |               |
|    approx_kl            | 0.00028643274 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -2.41         |
|    explained_variance   | 0.0213        |
|    learning_rate        | 0.0003        |
|    loss                 | 6.52e+03      |
|    n_updates            | 2550          |
|    policy_gradient_loss | 8.64e-05      |
|    std                  | 0.809         |
|    value_loss           | 1.88e+04      |
-------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.16e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 257          |
|    time_elapsed         | 3603         |
|    total_timesteps      | 526336       |
| train/                  |              |
|    approx_kl            | 0.0022042603 |
|    clip_fraction        | 0.000586     |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | -0.089       |
|    learning_rate        | 0.0003       |
|    loss                 | 775          |
|    n_updates            | 2560         |
|    policy_gradient_loss | -0.000991    |
|    std                  | 0.809        |
|    value_loss           | 8.67e+03     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.15e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 258          |
|    time_elapsed         | 3617         |
|    total_timesteps      | 528384       |
| train/                  |              |
|    approx_kl            | 0.0015742909 |
|    clip_fraction        | 9.77e-05     |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | 0.00236      |
|    learning_rate        | 0.0003       |
|    loss                 | 2.01e+04     |
|    n_updates            | 2570         |
|    policy_gradient_loss | -0.000447    |
|    std                  | 0.809        |
|    value_loss           | 2.96e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.15e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 259          |
|    time_elapsed         | 3631         |
|    total_timesteps      | 530432       |
| train/                  |              |
|    approx_kl            | 0.0011505384 |
|    clip_fraction        | 4.88e-05     |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | 0.0671       |
|    learning_rate        | 0.0003       |
|    loss                 | 5.94e+03     |
|    n_updates            | 2580         |
|    policy_gradient_loss | 5.33e-05     |
|    std                  | 0.81         |
|    value_loss           | 2.46e+04     |
------------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.15e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 260          |
|    time_elapsed         | 3645         |
|    total_timesteps      | 532480       |
| train/                  |              |
|    approx_kl            | 0.0020698789 |
|    clip_fraction        | 0.00186      |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | 0.0463       |
|    learning_rate        | 0.0003       |
|    loss                 | 3.04e+04     |
|    n_updates            | 2590         |
|    policy_gradient_loss | -0.000916    |
|    std                  | 0.808        |
|    value_loss           | 3.13e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.15e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 261          |
|    time_elapsed         | 3659         |
|    total_timesteps      | 534528       |
| train/                  |              |
|    approx_kl            | 0.0019356541 |
|    clip_fraction        | 0.000439     |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | 0.105        |
|    learning_rate        | 0.0003       |
|    loss                 | 3.13e+04     |
|    n_updates            | 2600         |
|    policy_gradient_loss | -0.00123     |
|    std                  | 0.809        |
|    value_loss           | 3.38e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.16e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 262         |
|    time_elapsed         | 3673        |
|    total_timesteps      | 536576      |
| train/                  |             |
|    approx_kl            | 0.002667516 |
|    clip_fraction        | 0.00283     |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | 0.0638      |
|    learning_rate        | 0.0003      |
|    loss                 | 1.07e+04    |
|    n_updates            | 2610        |
|    policy_gradient_loss | -0.000874   |
|    std                  | 0.808       |
|    value_loss           | 2.81e+04    |
-----------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.16e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 263          |
|    time_elapsed         | 3687         |
|    total_timesteps      | 538624       |
| train/                  |              |
|    approx_kl            | 0.0012219141 |
|    clip_fraction        | 4.88e-05     |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | -0.00145     |
|    learning_rate        | 0.0003       |
|    loss                 | 3.06e+03     |
|    n_updates            | 2620         |
|    policy_gradient_loss | -0.000616    |
|    std                  | 0.808        |
|    value_loss           | 1.75e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.17e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 264         |
|    time_elapsed         | 3700        |
|    total_timesteps      | 540672      |
| train/                  |             |
|    approx_kl            | 0.005010533 |
|    clip_fraction        | 0.0207      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | -0.147      |
|    learning_rate        | 0.0003      |
|    loss                 | 7.37e+03    |
|    n_updates            | 2630        |
|    policy_gradient_loss | -0.00171    |
|    std                  | 0.806       |
|    value_loss           | 1.31e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.17e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 265          |
|    time_elapsed         | 3714         |
|    total_timesteps      | 542720       |
| train/                  |              |
|    approx_kl            | 0.0048290873 |
|    clip_fraction        | 0.0277       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.4         |
|    explained_variance   | -0.00296     |
|    learning_rate        | 0.0003       |
|    loss                 | 3.21e+04     |
|    n_updates            | 2640         |
|    policy_gradient_loss | -0.00252     |
|    std                  | 0.805        |
|    value_loss           | 4.99e+04     |
------------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.18e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 266         |
|    time_elapsed         | 3727        |
|    total_timesteps      | 544768      |
| train/                  |             |
|    approx_kl            | 0.003666722 |
|    clip_fraction        | 0.0182      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | 0.000949    |
|    learning_rate        | 0.0003      |
|    loss                 | 1.45e+04    |
|    n_updates            | 2650        |
|    policy_gradient_loss | -0.00188    |
|    std                  | 0.807       |
|    value_loss           | 4.53e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.17e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 267          |
|    time_elapsed         | 3741         |
|    total_timesteps      | 546816       |
| train/                  |              |
|    approx_kl            | 0.0023065237 |
|    clip_fraction        | 0.00718      |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | -0.0564      |
|    learning_rate        | 0.0003       |
|    loss                 | 1.37e+04     |
|    n_updates            | 2660         |
|    policy_gradient_loss | -0.00142     |
|    std                  | 0.806        |
|    value_loss           | 3.46e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.19e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 268          |
|    time_elapsed         | 3755         |
|    total_timesteps      | 548864       |
| train/                  |              |
|    approx_kl            | 0.0022016664 |
|    clip_fraction        | 0.0953       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.43        |
|    explained_variance   | 1.13e-05     |
|    learning_rate        | 0.0003       |
|    loss                 | 9.75e+03     |
|    n_updates            | 2670         |
|    policy_gradient_loss | 0.00357      |
|    std                  | 0.818        |
|    value_loss           | 2.46e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.2e+04      |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 269          |
|    time_elapsed         | 3769         |
|    total_timesteps      | 550912       |
| train/                  |              |
|    approx_kl            | 0.0034754355 |
|    clip_fraction        | 0.00435      |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.44        |
|    explained_variance   | 5.17e-05     |
|    learning_rate        | 0.0003       |
|    loss                 | 1.39e+04     |
|    n_updates            | 2680         |
|    policy_gradient_loss | -0.000553    |
|    std                  | 0.821        |
|    value_loss           | 4.52e+04     |
------------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.2e+04     |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 270         |
|    time_elapsed         | 3783        |
|    total_timesteps      | 552960      |
| train/                  |             |
|    approx_kl            | 0.003219577 |
|    clip_fraction        | 0.0194      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.45       |
|    explained_variance   | 8.4e-06     |
|    learning_rate        | 0.0003      |
|    loss                 | 1.15e+04    |
|    n_updates            | 2690        |
|    policy_gradient_loss | -0.00137    |
|    std                  | 0.824       |
|    value_loss           | 3.43e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.21e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 271          |
|    time_elapsed         | 3797         |
|    total_timesteps      | 555008       |
| train/                  |              |
|    approx_kl            | 0.0036321243 |
|    clip_fraction        | 0.0465       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.45        |
|    explained_variance   | -2e-05       |
|    learning_rate        | 0.0003       |
|    loss                 | 6.58e+03     |
|    n_updates            | 2700         |
|    policy_gradient_loss | 0.00056      |
|    std                  | 0.825        |
|    value_loss           | 1.69e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.21e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 272          |
|    time_elapsed         | 3811         |
|    total_timesteps      | 557056       |
| train/                  |              |
|    approx_kl            | 0.0023997384 |
|    clip_fraction        | 0.0219       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.46        |
|    explained_variance   | 3.99e-05     |
|    learning_rate        | 0.0003       |
|    loss                 | 5.82e+03     |
|    n_updates            | 2710         |
|    policy_gradient_loss | -0.000638    |
|    std                  | 0.83         |
|    value_loss           | 2.49e+04     |
------------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.21e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 273          |
|    time_elapsed         | 3825         |
|    total_timesteps      | 559104       |
| train/                  |              |
|    approx_kl            | 0.0010495745 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.46        |
|    explained_variance   | 0.014        |
|    learning_rate        | 0.0003       |
|    loss                 | 2.08e+04     |
|    n_updates            | 2720         |
|    policy_gradient_loss | -0.000137    |
|    std                  | 0.829        |
|    value_loss           | 3.1e+04      |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.23e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 274          |
|    time_elapsed         | 3838         |
|    total_timesteps      | 561152       |
| train/                  |              |
|    approx_kl            | 0.0056377756 |
|    clip_fraction        | 0.0311       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.46        |
|    explained_variance   | -0.013       |
|    learning_rate        | 0.0003       |
|    loss                 | 5.11e+03     |
|    n_updates            | 2730         |
|    policy_gradient_loss | -0.00175     |
|    std                  | 0.826        |
|    value_loss           | 1.65e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.23e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 275          |
|    time_elapsed         | 3852         |
|    total_timesteps      | 563200       |
| train/                  |              |
|    approx_kl            | 0.0036554735 |
|    clip_fraction        | 0.0174       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.45        |
|    explained_variance   | 1.42e-05     |
|    learning_rate        | 0.0003       |
|    loss                 | 5.65e+03     |
|    n_updates            | 2740         |
|    policy_gradient_loss | 1.51e-05     |
|    std                  | 0.824        |
|    value_loss           | 2.55e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.22e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 276         |
|    time_elapsed         | 3866        |
|    total_timesteps      | 565248      |
| train/                  |             |
|    approx_kl            | 0.004131675 |
|    clip_fraction        | 0.0364      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.45       |
|    explained_variance   | -7.01e-05   |
|    learning_rate        | 0.0003      |
|    loss                 | 5.43e+03    |
|    n_updates            | 2750        |
|    policy_gradient_loss | -0.00184    |
|    std                  | 0.823       |
|    value_loss           | 2.59e+04    |
-----------------------------------------


INFO:root:done


-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.2e+03       |
|    ep_rew_mean          | 2.22e+04      |
| time/                   |               |
|    fps                  | 146           |
|    iterations           | 277           |
|    time_elapsed         | 3880          |
|    total_timesteps      | 567296        |
| train/                  |               |
|    approx_kl            | 0.00059960736 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -2.45         |
|    explained_variance   | -0.00831      |
|    learning_rate        | 0.0003        |
|    loss                 | 1.94e+04      |
|    n_updates            | 2760          |
|    policy_gradient_loss | 0.000218      |
|    std                  | 0.824         |
|    value_loss           | 2.32e+04      |
-------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.22e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 278          |
|    time_elapsed         | 3894         |
|    total_timesteps      | 569344       |
| train/                  |              |
|    approx_kl            | 0.0057934704 |
|    clip_fraction        | 0.0404       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.45        |
|    explained_variance   | -0.0353      |
|    learning_rate        | 0.0003       |
|    loss                 | 1.35e+03     |
|    n_updates            | 2770         |
|    policy_gradient_loss | -0.00238     |
|    std                  | 0.824        |
|    value_loss           | 1.19e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.2e+03    |
|    ep_rew_mean          | 2.23e+04   |
| time/                   |            |
|    fps                  | 146        |
|    iterations           | 279        |
|    time_elapsed         | 3907       |
|    total_timesteps      | 571392     |
| train/                  |            |
|    approx_kl            | 0.00539076 |
|    clip_fraction        | 0.00923    |
|    clip_range           | 0.2        |
|    entropy_loss         | -2.45      |
|    explained_variance   | 0.0833     |
|    learning_rate        | 0.0003     |
|    loss                 | 1.64e+04   |
|    n_updates            | 2780       |
|    policy_gradient_loss | -0.00117   |
|    std                  | 0.824      |
|    value_loss           | 2.48e+04   |
----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.23e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 280         |
|    time_elapsed         | 3921        |
|    total_timesteps      | 573440      |
| train/                  |             |
|    approx_kl            | 0.002605407 |
|    clip_fraction        | 0.00332     |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.45       |
|    explained_variance   | -0.0198     |
|    learning_rate        | 0.0003      |
|    loss                 | 3.57e+03    |
|    n_updates            | 2790        |
|    policy_gradient_loss | 0.000197    |
|    std                  | 0.823       |
|    value_loss           | 2.22e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.23e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 281          |
|    time_elapsed         | 3935         |
|    total_timesteps      | 575488       |
| train/                  |              |
|    approx_kl            | 0.0006279402 |
|    clip_fraction        | 0.00107      |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.45        |
|    explained_variance   | -0.0259      |
|    learning_rate        | 0.0003       |
|    loss                 | 3.65e+03     |
|    n_updates            | 2800         |
|    policy_gradient_loss | -0.000513    |
|    std                  | 0.823        |
|    value_loss           | 1.46e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.23e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 282         |
|    time_elapsed         | 3949        |
|    total_timesteps      | 577536      |
| train/                  |             |
|    approx_kl            | 0.007987397 |
|    clip_fraction        | 0.0717      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.44       |
|    explained_variance   | -0.0385     |
|    learning_rate        | 0.0003      |
|    loss                 | 1.87e+04    |
|    n_updates            | 2810        |
|    policy_gradient_loss | -0.0041     |
|    std                  | 0.819       |
|    value_loss           | 3.21e+04    |
-----------------------------------------


INFO:root:done


----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.2e+03    |
|    ep_rew_mean          | 2.23e+04   |
| time/                   |            |
|    fps                  | 146        |
|    iterations           | 283        |
|    time_elapsed         | 3963       |
|    total_timesteps      | 579584     |
| train/                  |            |
|    approx_kl            | 0.00377094 |
|    clip_fraction        | 0.00957    |
|    clip_range           | 0.2        |
|    entropy_loss         | -2.43      |
|    explained_variance   | 0.0229     |
|    learning_rate        | 0.0003     |
|    loss                 | 1.95e+04   |
|    n_updates            | 2820       |
|    policy_gradient_loss | -0.00148   |
|    std                  | 0.816      |
|    value_loss           | 4.5e+04    |
----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.24e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 284          |
|    time_elapsed         | 3976         |
|    total_timesteps      | 581632       |
| train/                  |              |
|    approx_kl            | 0.0011386602 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.43        |
|    explained_variance   | 0.0991       |
|    learning_rate        | 0.0003       |
|    loss                 | 2.85e+03     |
|    n_updates            | 2830         |
|    policy_gradient_loss | 5.24e-05     |
|    std                  | 0.818        |
|    value_loss           | 1.3e+04      |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.24e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 285          |
|    time_elapsed         | 3990         |
|    total_timesteps      | 583680       |
| train/                  |              |
|    approx_kl            | 0.0019187813 |
|    clip_fraction        | 0.0155       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.44        |
|    explained_variance   | -0.0882      |
|    learning_rate        | 0.0003       |
|    loss                 | 8.84e+03     |
|    n_updates            | 2840         |
|    policy_gradient_loss | -0.000212    |
|    std                  | 0.824        |
|    value_loss           | 5.12e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.2e+03    |
|    ep_rew_mean          | 2.24e+04   |
| time/                   |            |
|    fps                  | 146        |
|    iterations           | 286        |
|    time_elapsed         | 4004       |
|    total_timesteps      | 585728     |
| train/                  |            |
|    approx_kl            | 0.01504888 |
|    clip_fraction        | 0.0872     |
|    clip_range           | 0.2        |
|    entropy_loss         | -2.46      |
|    explained_variance   | 4.35e-05   |
|    learning_rate        | 0.0003     |
|    loss                 | 1.23e+04   |
|    n_updates            | 2850       |
|    policy_gradient_loss | -0.00333   |
|    std                  | 0.832      |
|    value_loss           | 4.46e+04   |
----------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.24e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 287          |
|    time_elapsed         | 4018         |
|    total_timesteps      | 587776       |
| train/                  |              |
|    approx_kl            | 0.0076972907 |
|    clip_fraction        | 0.135        |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.46        |
|    explained_variance   | 2.38e-05     |
|    learning_rate        | 0.0003       |
|    loss                 | 2.52e+04     |
|    n_updates            | 2860         |
|    policy_gradient_loss | -0.00125     |
|    std                  | 0.823        |
|    value_loss           | 3.46e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.22e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 288         |
|    time_elapsed         | 4032        |
|    total_timesteps      | 589824      |
| train/                  |             |
|    approx_kl            | 0.004189547 |
|    clip_fraction        | 0.0371      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.44       |
|    explained_variance   | 1.03e-05    |
|    learning_rate        | 0.0003      |
|    loss                 | 909         |
|    n_updates            | 2870        |
|    policy_gradient_loss | 0.000601    |
|    std                  | 0.817       |
|    value_loss           | 1.12e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.21e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 289          |
|    time_elapsed         | 4046         |
|    total_timesteps      | 591872       |
| train/                  |              |
|    approx_kl            | 0.0027379526 |
|    clip_fraction        | 0.000928     |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.44        |
|    explained_variance   | 0.000245     |
|    learning_rate        | 0.0003       |
|    loss                 | 1.69e+04     |
|    n_updates            | 2880         |
|    policy_gradient_loss | -0.000259    |
|    std                  | 0.818        |
|    value_loss           | 1.93e+04     |
------------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.2e+04      |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 290          |
|    time_elapsed         | 4060         |
|    total_timesteps      | 593920       |
| train/                  |              |
|    approx_kl            | 0.0006894174 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.44        |
|    explained_variance   | -0.0175      |
|    learning_rate        | 0.0003       |
|    loss                 | 5.21e+03     |
|    n_updates            | 2890         |
|    policy_gradient_loss | -7.45e-05    |
|    std                  | 0.819        |
|    value_loss           | 2.67e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.17e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 291          |
|    time_elapsed         | 4074         |
|    total_timesteps      | 595968       |
| train/                  |              |
|    approx_kl            | 0.0019507715 |
|    clip_fraction        | 0.000439     |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.43        |
|    explained_variance   | 0.0564       |
|    learning_rate        | 0.0003       |
|    loss                 | 7.47e+03     |
|    n_updates            | 2900         |
|    policy_gradient_loss | -9.65e-05    |
|    std                  | 0.816        |
|    value_loss           | 2.17e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.16e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 292          |
|    time_elapsed         | 4088         |
|    total_timesteps      | 598016       |
| train/                  |              |
|    approx_kl            | 0.0066675055 |
|    clip_fraction        | 0.0463       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.43        |
|    explained_variance   | 0.0459       |
|    learning_rate        | 0.0003       |
|    loss                 | 1.51e+04     |
|    n_updates            | 2910         |
|    policy_gradient_loss | -0.000112    |
|    std                  | 0.813        |
|    value_loss           | 1.8e+04      |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.14e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 293         |
|    time_elapsed         | 4101        |
|    total_timesteps      | 600064      |
| train/                  |             |
|    approx_kl            | 0.004999628 |
|    clip_fraction        | 0.0658      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.42       |
|    explained_variance   | 0.0206      |
|    learning_rate        | 0.0003      |
|    loss                 | 2.29e+03    |
|    n_updates            | 2920        |
|    policy_gradient_loss | -0.00384    |
|    std                  | 0.809       |
|    value_loss           | 2.1e+04     |
-----------------------------------------


In [None]:
# Train a PPO agent on the (Monitor-wrapped) walker environment.
#
# Reads:   `env`, `PPO`, `TrainAndLoggingCallback`, `os`, `datetime` from earlier cells.
# Defines: `now`, `LOG_DIR`, `OPT_DIR`, `SAVE_PATH`, `TOTAL_TIMESTEPS`,
#          `CHECKPOINT_FREQ`, `model`.
# NOTE: the cell closes `env` when it finishes, so the environment cell has to be
# re-run before this cell can be executed a second time.

# Timestamp (minute resolution) that gives every run its own output directories.
now = datetime.now().strftime('%Y-%m-%d_%H%M')

LOG_DIR = f'./tmp/train/logs/{now}/'
OPT_DIR = f'./tmp/train/opt/{now}/'

# NOTE(review): SAVE_PATH is not referenced anywhere in this cell -- the callback
# below writes its checkpoints into LOG_DIR. Kept in case later cells read it;
# confirm which directory the checkpoints are actually meant to go to.
SAVE_PATH = os.path.join(OPT_DIR, 'trial_{}_best_model'.format(1))

# Training budget and checkpoint interval. The interval is counted in callback
# calls (`n_calls`), see TrainAndLoggingCallback._on_step.
TOTAL_TIMESTEPS = 600_000
CHECKPOINT_FREQ = 10_000

model = PPO(
    'MlpPolicy',
    env,
    tensorboard_log=LOG_DIR,
    verbose=1,
)

try:
    model.learn(
        total_timesteps=TOTAL_TIMESTEPS,
        callback=TrainAndLoggingCallback(
            check_freq=CHECKPOINT_FREQ,
            save_path=LOG_DIR,
        ),
    )
finally:
    # Close the environment even when training is interrupted (KeyboardInterrupt)
    # or raises, so it is not left open after a failed run.
    # Presumably this also releases the simulator-side resources -- TODO confirm
    # against CarlaWalkerEnv.close().
    env.close()


Using cuda device
Wrapping the env in a DummyVecEnv.
Logging to ./tmp/train/logs/2022-03-03_1145/PPO_1


INFO:root:done


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 1.2e+03  |
|    ep_rew_mean     | 1.16e+04 |
| time/              |          |
|    fps             | 161      |
|    iterations      | 1        |
|    time_elapsed    | 12       |
|    total_timesteps | 2048     |
---------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.17e+04    |
| time/                   |             |
|    fps                  | 152         |
|    iterations           | 2           |
|    time_elapsed         | 26          |
|    total_timesteps      | 4096        |
| train/                  |             |
|    approx_kl            | 0.004391538 |
|    clip_fraction        | 0.0325      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.85       |
|    explained_variance   | -0.0039     |
|    learning_rate        | 0.0003      |
|    loss                 | 1.11e+04    |
|    n_updates            | 10          |
|    policy_gradient_loss | -0.0065     |
|    std                  | 1.01        |
|    value_loss           | 2.29e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 1.2e+04      |
| time/                   |              |
|    fps                  | 148          |
|    iterations           | 3            |
|    time_elapsed         | 41           |
|    total_timesteps      | 6144         |
| train/                  |              |
|    approx_kl            | 0.0032937697 |
|    clip_fraction        | 0.0124       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.84        |
|    explained_variance   | 1.19e-07     |
|    learning_rate        | 0.0003       |
|    loss                 | 1.18e+04     |
|    n_updates            | 20           |
|    policy_gradient_loss | -0.00566     |
|    std                  | 0.999        |
|    value_loss           | 2.46e+04     |
------------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.21e+04    |
| time/                   |             |
|    fps                  | 148         |
|    iterations           | 4           |
|    time_elapsed         | 55          |
|    total_timesteps      | 8192        |
| train/                  |             |
|    approx_kl            | 0.005230262 |
|    clip_fraction        | 0.0339      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.83       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.32e+04    |
|    n_updates            | 30          |
|    policy_gradient_loss | -0.00683    |
|    std                  | 0.995       |
|    value_loss           | 2.72e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 1.23e+04     |
| time/                   |              |
|    fps                  | 148          |
|    iterations           | 5            |
|    time_elapsed         | 69           |
|    total_timesteps      | 10240        |
| train/                  |              |
|    approx_kl            | 0.0058952486 |
|    clip_fraction        | 0.0416       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.82        |
|    explained_variance   | 5.6e-06      |
|    learning_rate        | 0.0003       |
|    loss                 | 1.33e+04     |
|    n_updates            | 40           |
|    policy_gradient_loss | -0.0103      |
|    std                  | 0.992        |
|    value_loss           | 2.78e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 1.23e+04     |
| time/                   |              |
|    fps                  | 147          |
|    iterations           | 6            |
|    time_elapsed         | 83           |
|    total_timesteps      | 12288        |
| train/                  |              |
|    approx_kl            | 0.0054528527 |
|    clip_fraction        | 0.0701       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.83        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.32e+04     |
|    n_updates            | 50           |
|    policy_gradient_loss | -0.00763     |
|    std                  | 0.997        |
|    value_loss           | 2.84e+04     |
------------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 1.24e+04     |
| time/                   |              |
|    fps                  | 147          |
|    iterations           | 7            |
|    time_elapsed         | 97           |
|    total_timesteps      | 14336        |
| train/                  |              |
|    approx_kl            | 0.0056882296 |
|    clip_fraction        | 0.0507       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.82        |
|    explained_variance   | -8.34e-07    |
|    learning_rate        | 0.0003       |
|    loss                 | 1.34e+04     |
|    n_updates            | 60           |
|    policy_gradient_loss | -0.0167      |
|    std                  | 0.992        |
|    value_loss           | 2.68e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.26e+04    |
| time/                   |             |
|    fps                  | 147         |
|    iterations           | 8           |
|    time_elapsed         | 110         |
|    total_timesteps      | 16384       |
| train/                  |             |
|    approx_kl            | 0.005596227 |
|    clip_fraction        | 0.0539      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.82       |
|    explained_variance   | 1.07e-06    |
|    learning_rate        | 0.0003      |
|    loss                 | 1.56e+04    |
|    n_updates            | 70          |
|    policy_gradient_loss | -0.00549    |
|    std                  | 0.994       |
|    value_loss           | 3.32e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.28e+04    |
| time/                   |             |
|    fps                  | 147         |
|    iterations           | 9           |
|    time_elapsed         | 124         |
|    total_timesteps      | 18432       |
| train/                  |             |
|    approx_kl            | 0.008129839 |
|    clip_fraction        | 0.0799      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.83       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.31e+04    |
|    n_updates            | 80          |
|    policy_gradient_loss | -0.00546    |
|    std                  | 1           |
|    value_loss           | 2.93e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 1.28e+04     |
| time/                   |              |
|    fps                  | 147          |
|    iterations           | 10           |
|    time_elapsed         | 138          |
|    total_timesteps      | 20480        |
| train/                  |              |
|    approx_kl            | 0.0076107667 |
|    clip_fraction        | 0.069        |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.83        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.51e+04     |
|    n_updates            | 90           |
|    policy_gradient_loss | -0.023       |
|    std                  | 0.99         |
|    value_loss           | 3.23e+04     |
------------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.29e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 11          |
|    time_elapsed         | 153         |
|    total_timesteps      | 22528       |
| train/                  |             |
|    approx_kl            | 0.011042925 |
|    clip_fraction        | 0.136       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.8        |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.48e+04    |
|    n_updates            | 100         |
|    policy_gradient_loss | -0.0137     |
|    std                  | 0.979       |
|    value_loss           | 3.05e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.2e+03    |
|    ep_rew_mean          | 1.31e+04   |
| time/                   |            |
|    fps                  | 146        |
|    iterations           | 12         |
|    time_elapsed         | 167        |
|    total_timesteps      | 24576      |
| train/                  |            |
|    approx_kl            | 0.01359958 |
|    clip_fraction        | 0.144      |
|    clip_range           | 0.2        |
|    entropy_loss         | -2.78      |
|    explained_variance   | 0          |
|    learning_rate        | 0.0003     |
|    loss                 | 1.54e+04   |
|    n_updates            | 110        |
|    policy_gradient_loss | -0.00544   |
|    std                  | 0.969      |
|    value_loss           | 3.27e+04   |
----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.32e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 13          |
|    time_elapsed         | 182         |
|    total_timesteps      | 26624       |
| train/                  |             |
|    approx_kl            | 0.004331241 |
|    clip_fraction        | 0.0518      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.77       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 1.67e+04    |
|    n_updates            | 120         |
|    policy_gradient_loss | -0.00361    |
|    std                  | 0.962       |
|    value_loss           | 3.36e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.32e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 14          |
|    time_elapsed         | 195         |
|    total_timesteps      | 28672       |
| train/                  |             |
|    approx_kl            | 0.008661566 |
|    clip_fraction        | 0.136       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.77       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.64e+04    |
|    n_updates            | 130         |
|    policy_gradient_loss | -0.0107     |
|    std                  | 0.967       |
|    value_loss           | 3.51e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.33e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 15          |
|    time_elapsed         | 209         |
|    total_timesteps      | 30720       |
| train/                  |             |
|    approx_kl            | 0.008165269 |
|    clip_fraction        | 0.0993      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.77       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.62e+04    |
|    n_updates            | 140         |
|    policy_gradient_loss | -0.00909    |
|    std                  | 0.967       |
|    value_loss           | 3.1e+04     |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.34e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 16          |
|    time_elapsed         | 223         |
|    total_timesteps      | 32768       |
| train/                  |             |
|    approx_kl            | 0.010763007 |
|    clip_fraction        | 0.116       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.77       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.46e+04    |
|    n_updates            | 150         |
|    policy_gradient_loss | -0.00913    |
|    std                  | 0.965       |
|    value_loss           | 3.02e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.35e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 17          |
|    time_elapsed         | 236         |
|    total_timesteps      | 34816       |
| train/                  |             |
|    approx_kl            | 0.010309635 |
|    clip_fraction        | 0.097       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.76       |
|    explained_variance   | 1.19e-07    |
|    learning_rate        | 0.0003      |
|    loss                 | 1.79e+04    |
|    n_updates            | 160         |
|    policy_gradient_loss | -0.016      |
|    std                  | 0.963       |
|    value_loss           | 3.72e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.35e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 18          |
|    time_elapsed         | 251         |
|    total_timesteps      | 36864       |
| train/                  |             |
|    approx_kl            | 0.010238191 |
|    clip_fraction        | 0.126       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.75       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 1.82e+04    |
|    n_updates            | 170         |
|    policy_gradient_loss | -0.0178     |
|    std                  | 0.952       |
|    value_loss           | 3.62e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.36e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 19          |
|    time_elapsed         | 265         |
|    total_timesteps      | 38912       |
| train/                  |             |
|    approx_kl            | 0.010769315 |
|    clip_fraction        | 0.113       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.73       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.38e+04    |
|    n_updates            | 180         |
|    policy_gradient_loss | -0.0116     |
|    std                  | 0.94        |
|    value_loss           | 3e+04       |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.36e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 20          |
|    time_elapsed         | 279         |
|    total_timesteps      | 40960       |
| train/                  |             |
|    approx_kl            | 0.011145861 |
|    clip_fraction        | 0.105       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.7        |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.42e+04    |
|    n_updates            | 190         |
|    policy_gradient_loss | -0.0263     |
|    std                  | 0.923       |
|    value_loss           | 2.97e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.37e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 21          |
|    time_elapsed         | 293         |
|    total_timesteps      | 43008       |
| train/                  |             |
|    approx_kl            | 0.015250875 |
|    clip_fraction        | 0.136       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.66       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.64e+04    |
|    n_updates            | 200         |
|    policy_gradient_loss | -0.0171     |
|    std                  | 0.904       |
|    value_loss           | 3.27e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.2e+03    |
|    ep_rew_mean          | 1.37e+04   |
| time/                   |            |
|    fps                  | 146        |
|    iterations           | 22         |
|    time_elapsed         | 307        |
|    total_timesteps      | 45056      |
| train/                  |            |
|    approx_kl            | 0.01354915 |
|    clip_fraction        | 0.162      |
|    clip_range           | 0.2        |
|    entropy_loss         | -2.64      |
|    explained_variance   | 0          |
|    learning_rate        | 0.0003     |
|    loss                 | 1.78e+04   |
|    n_updates            | 210        |
|    policy_gradient_loss | -0.00339   |
|    std                  | 0.905      |
|    value_loss           | 3.64e+04   |
----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.38e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 23          |
|    time_elapsed         | 321         |
|    total_timesteps      | 47104       |
| train/                  |             |
|    approx_kl            | 0.011652257 |
|    clip_fraction        | 0.152       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.63       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 1.39e+04    |
|    n_updates            | 220         |
|    policy_gradient_loss | -0.00208    |
|    std                  | 0.897       |
|    value_loss           | 2.98e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.39e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 24          |
|    time_elapsed         | 335         |
|    total_timesteps      | 49152       |
| train/                  |             |
|    approx_kl            | 0.008541563 |
|    clip_fraction        | 0.0871      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.63       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.72e+04    |
|    n_updates            | 230         |
|    policy_gradient_loss | -0.0154     |
|    std                  | 0.906       |
|    value_loss           | 3.31e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.4e+04     |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 25          |
|    time_elapsed         | 349         |
|    total_timesteps      | 51200       |
| train/                  |             |
|    approx_kl            | 0.009695856 |
|    clip_fraction        | 0.0991      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.64       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 3.03e+04    |
|    n_updates            | 240         |
|    policy_gradient_loss | -0.0225     |
|    std                  | 0.904       |
|    value_loss           | 5.91e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.41e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 26          |
|    time_elapsed         | 363         |
|    total_timesteps      | 53248       |
| train/                  |             |
|    approx_kl            | 0.016079355 |
|    clip_fraction        | 0.22        |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.64       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.34e+04    |
|    n_updates            | 250         |
|    policy_gradient_loss | -0.0105     |
|    std                  | 0.903       |
|    value_loss           | 2.8e+04     |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.41e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 27          |
|    time_elapsed         | 377         |
|    total_timesteps      | 55296       |
| train/                  |             |
|    approx_kl            | 0.012627118 |
|    clip_fraction        | 0.132       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.63       |
|    explained_variance   | 1.19e-07    |
|    learning_rate        | 0.0003      |
|    loss                 | 1.99e+04    |
|    n_updates            | 260         |
|    policy_gradient_loss | -0.00803    |
|    std                  | 0.901       |
|    value_loss           | 4.56e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.42e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 28          |
|    time_elapsed         | 391         |
|    total_timesteps      | 57344       |
| train/                  |             |
|    approx_kl            | 0.014936594 |
|    clip_fraction        | 0.179       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.63       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 1.19e+04    |
|    n_updates            | 270         |
|    policy_gradient_loss | -0.00363    |
|    std                  | 0.901       |
|    value_loss           | 2.54e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.43e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 29          |
|    time_elapsed         | 405         |
|    total_timesteps      | 59392       |
| train/                  |             |
|    approx_kl            | 0.013621929 |
|    clip_fraction        | 0.139       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.63       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.87e+04    |
|    n_updates            | 280         |
|    policy_gradient_loss | -0.0116     |
|    std                  | 0.903       |
|    value_loss           | 5.49e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.46e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 30          |
|    time_elapsed         | 419         |
|    total_timesteps      | 61440       |
| train/                  |             |
|    approx_kl            | 0.014553876 |
|    clip_fraction        | 0.218       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.63       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.18e+04    |
|    n_updates            | 290         |
|    policy_gradient_loss | 0.00823     |
|    std                  | 0.9         |
|    value_loss           | 4.42e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.47e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 31          |
|    time_elapsed         | 433         |
|    total_timesteps      | 63488       |
| train/                  |             |
|    approx_kl            | 0.007278528 |
|    clip_fraction        | 0.09        |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.62       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 3.93e+04    |
|    n_updates            | 300         |
|    policy_gradient_loss | -0.00995    |
|    std                  | 0.895       |
|    value_loss           | 7.37e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.2e+03    |
|    ep_rew_mean          | 1.48e+04   |
| time/                   |            |
|    fps                  | 146        |
|    iterations           | 32         |
|    time_elapsed         | 447        |
|    total_timesteps      | 65536      |
| train/                  |            |
|    approx_kl            | 0.01160966 |
|    clip_fraction        | 0.128      |
|    clip_range           | 0.2        |
|    entropy_loss         | -2.61      |
|    explained_variance   | 0          |
|    learning_rate        | 0.0003     |
|    loss                 | 3.16e+04   |
|    n_updates            | 310        |
|    policy_gradient_loss | -0.00724   |
|    std                  | 0.894      |
|    value_loss           | 6.29e+04   |
----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.5e+04     |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 33          |
|    time_elapsed         | 461         |
|    total_timesteps      | 67584       |
| train/                  |             |
|    approx_kl            | 0.018593464 |
|    clip_fraction        | 0.14        |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.62       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 1.96e+04    |
|    n_updates            | 320         |
|    policy_gradient_loss | -0.0151     |
|    std                  | 0.895       |
|    value_loss           | 3.84e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


---------------------------------------
| rollout/                |           |
|    ep_len_mean          | 1.2e+03   |
|    ep_rew_mean          | 1.51e+04  |
| time/                   |           |
|    fps                  | 146       |
|    iterations           | 34        |
|    time_elapsed         | 475       |
|    total_timesteps      | 69632     |
| train/                  |           |
|    approx_kl            | 0.0150782 |
|    clip_fraction        | 0.151     |
|    clip_range           | 0.2       |
|    entropy_loss         | -2.62     |
|    explained_variance   | 0         |
|    learning_rate        | 0.0003    |
|    loss                 | 3.27e+04  |
|    n_updates            | 330       |
|    policy_gradient_loss | -0.0103   |
|    std                  | 0.894     |
|    value_loss           | 6.71e+04  |
---------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 1.51e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 35           |
|    time_elapsed         | 489          |
|    total_timesteps      | 71680        |
| train/                  |              |
|    approx_kl            | 0.0122095235 |
|    clip_fraction        | 0.136        |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.62        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 2.19e+04     |
|    n_updates            | 340          |
|    policy_gradient_loss | -0.00897     |
|    std                  | 0.893        |
|    value_loss           | 4.53e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.54e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 36          |
|    time_elapsed         | 503         |
|    total_timesteps      | 73728       |
| train/                  |             |
|    approx_kl            | 0.007932127 |
|    clip_fraction        | 0.0719      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.61       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.45e+04    |
|    n_updates            | 350         |
|    policy_gradient_loss | -0.00412    |
|    std                  | 0.893       |
|    value_loss           | 5.21e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.54e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 37          |
|    time_elapsed         | 517         |
|    total_timesteps      | 75776       |
| train/                  |             |
|    approx_kl            | 0.013687752 |
|    clip_fraction        | 0.148       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.62       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 3.75e+04    |
|    n_updates            | 360         |
|    policy_gradient_loss | -0.00648    |
|    std                  | 0.901       |
|    value_loss           | 7.21e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.54e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 38          |
|    time_elapsed         | 531         |
|    total_timesteps      | 77824       |
| train/                  |             |
|    approx_kl            | 0.019635525 |
|    clip_fraction        | 0.196       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.62       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.77e+04    |
|    n_updates            | 370         |
|    policy_gradient_loss | -0.00608    |
|    std                  | 0.894       |
|    value_loss           | 3.67e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.55e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 39          |
|    time_elapsed         | 545         |
|    total_timesteps      | 79872       |
| train/                  |             |
|    approx_kl            | 0.014820069 |
|    clip_fraction        | 0.152       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.6        |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.49e+04    |
|    n_updates            | 380         |
|    policy_gradient_loss | -0.0325     |
|    std                  | 0.884       |
|    value_loss           | 3.3e+04     |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.55e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 40          |
|    time_elapsed         | 559         |
|    total_timesteps      | 81920       |
| train/                  |             |
|    approx_kl            | 0.023059068 |
|    clip_fraction        | 0.237       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.59       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.74e+04    |
|    n_updates            | 390         |
|    policy_gradient_loss | -0.000467   |
|    std                  | 0.881       |
|    value_loss           | 4.08e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.55e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 41          |
|    time_elapsed         | 573         |
|    total_timesteps      | 83968       |
| train/                  |             |
|    approx_kl            | 0.018831586 |
|    clip_fraction        | 0.169       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.58       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.04e+04    |
|    n_updates            | 400         |
|    policy_gradient_loss | -0.0248     |
|    std                  | 0.872       |
|    value_loss           | 4.24e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.56e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 42          |
|    time_elapsed         | 587         |
|    total_timesteps      | 86016       |
| train/                  |             |
|    approx_kl            | 0.023009354 |
|    clip_fraction        | 0.213       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.57       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.63e+04    |
|    n_updates            | 410         |
|    policy_gradient_loss | 0.00402     |
|    std                  | 0.876       |
|    value_loss           | 5.39e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.58e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 43          |
|    time_elapsed         | 601         |
|    total_timesteps      | 88064       |
| train/                  |             |
|    approx_kl            | 0.012054702 |
|    clip_fraction        | 0.149       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.56       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.72e+04    |
|    n_updates            | 420         |
|    policy_gradient_loss | -0.00522    |
|    std                  | 0.866       |
|    value_loss           | 5.18e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.59e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 44          |
|    time_elapsed         | 615         |
|    total_timesteps      | 90112       |
| train/                  |             |
|    approx_kl            | 0.018233374 |
|    clip_fraction        | 0.146       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.54       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 4.14e+04    |
|    n_updates            | 430         |
|    policy_gradient_loss | -0.00968    |
|    std                  | 0.854       |
|    value_loss           | 7.75e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.69e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 45          |
|    time_elapsed         | 629         |
|    total_timesteps      | 92160       |
| train/                  |             |
|    approx_kl            | 0.030004544 |
|    clip_fraction        | 0.289       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.52       |
|    explained_variance   | 1.19e-07    |
|    learning_rate        | 0.0003      |
|    loss                 | 2.45e+04    |
|    n_updates            | 440         |
|    policy_gradient_loss | 0.00773     |
|    std                  | 0.856       |
|    value_loss           | 4.6e+04     |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 1.7e+04      |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 46           |
|    time_elapsed         | 643          |
|    total_timesteps      | 94208        |
| train/                  |              |
|    approx_kl            | 0.0057585663 |
|    clip_fraction        | 0.0339       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.52        |
|    explained_variance   | -2.38e-07    |
|    learning_rate        | 0.0003       |
|    loss                 | 1.04e+06     |
|    n_updates            | 450          |
|    policy_gradient_loss | -0.00344     |
|    std                  | 0.851        |
|    value_loss           | 3.83e+06     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 1.7e+04      |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 47           |
|    time_elapsed         | 656          |
|    total_timesteps      | 96256        |
| train/                  |              |
|    approx_kl            | 0.0145547455 |
|    clip_fraction        | 0.131        |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.49        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.97e+04     |
|    n_updates            | 460          |
|    policy_gradient_loss | -0.0207      |
|    std                  | 0.832        |
|    value_loss           | 4.46e+04     |
------------------------------------------


INFO:root:done


----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.2e+03    |
|    ep_rew_mean          | 1.7e+04    |
| time/                   |            |
|    fps                  | 146        |
|    iterations           | 48         |
|    time_elapsed         | 670        |
|    total_timesteps      | 98304      |
| train/                  |            |
|    approx_kl            | 0.02108854 |
|    clip_fraction        | 0.216      |
|    clip_range           | 0.2        |
|    entropy_loss         | -2.47      |
|    explained_variance   | 0          |
|    learning_rate        | 0.0003     |
|    loss                 | 2.17e+04   |
|    n_updates            | 470        |
|    policy_gradient_loss | -0.000534  |
|    std                  | 0.836      |
|    value_loss           | 4.14e+04   |
----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.7e+04     |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 49          |
|    time_elapsed         | 685         |
|    total_timesteps      | 100352      |
| train/                  |             |
|    approx_kl            | 0.021511838 |
|    clip_fraction        | 0.235       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.48       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.84e+04    |
|    n_updates            | 480         |
|    policy_gradient_loss | 0.00179     |
|    std                  | 0.835       |
|    value_loss           | 3.83e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.71e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 50          |
|    time_elapsed         | 699         |
|    total_timesteps      | 102400      |
| train/                  |             |
|    approx_kl            | 0.022287574 |
|    clip_fraction        | 0.247       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.49       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.49e+04    |
|    n_updates            | 490         |
|    policy_gradient_loss | 0.00136     |
|    std                  | 0.842       |
|    value_loss           | 3.27e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.71e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 51          |
|    time_elapsed         | 713         |
|    total_timesteps      | 104448      |
| train/                  |             |
|    approx_kl            | 0.009410672 |
|    clip_fraction        | 0.0986      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.49       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 3.92e+04    |
|    n_updates            | 500         |
|    policy_gradient_loss | -0.00541    |
|    std                  | 0.836       |
|    value_loss           | 6.97e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.71e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 52          |
|    time_elapsed         | 727         |
|    total_timesteps      | 106496      |
| train/                  |             |
|    approx_kl            | 0.018075552 |
|    clip_fraction        | 0.198       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.48       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.55e+04    |
|    n_updates            | 510         |
|    policy_gradient_loss | -0.011      |
|    std                  | 0.834       |
|    value_loss           | 5.08e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.72e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 53          |
|    time_elapsed         | 741         |
|    total_timesteps      | 108544      |
| train/                  |             |
|    approx_kl            | 0.015388653 |
|    clip_fraction        | 0.179       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.48       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 1.59e+04    |
|    n_updates            | 520         |
|    policy_gradient_loss | -0.0115     |
|    std                  | 0.836       |
|    value_loss           | 3.43e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.73e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 54          |
|    time_elapsed         | 755         |
|    total_timesteps      | 110592      |
| train/                  |             |
|    approx_kl            | 0.011160995 |
|    clip_fraction        | 0.123       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.48       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 3.9e+04     |
|    n_updates            | 530         |
|    policy_gradient_loss | -0.0146     |
|    std                  | 0.832       |
|    value_loss           | 8.16e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.73e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 55          |
|    time_elapsed         | 769         |
|    total_timesteps      | 112640      |
| train/                  |             |
|    approx_kl            | 0.013476456 |
|    clip_fraction        | 0.158       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.48       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 3.69e+04    |
|    n_updates            | 540         |
|    policy_gradient_loss | -0.00493    |
|    std                  | 0.841       |
|    value_loss           | 6.68e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.73e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 56          |
|    time_elapsed         | 783         |
|    total_timesteps      | 114688      |
| train/                  |             |
|    approx_kl            | 0.015881626 |
|    clip_fraction        | 0.173       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.5        |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.83e+04    |
|    n_updates            | 550         |
|    policy_gradient_loss | -0.0252     |
|    std                  | 0.843       |
|    value_loss           | 3.78e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.73e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 57          |
|    time_elapsed         | 797         |
|    total_timesteps      | 116736      |
| train/                  |             |
|    approx_kl            | 0.026833735 |
|    clip_fraction        | 0.234       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.47       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 1.43e+04    |
|    n_updates            | 560         |
|    policy_gradient_loss | -0.00958    |
|    std                  | 0.828       |
|    value_loss           | 3.05e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.73e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 58          |
|    time_elapsed         | 812         |
|    total_timesteps      | 118784      |
| train/                  |             |
|    approx_kl            | 0.028344654 |
|    clip_fraction        | 0.278       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.45       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.4e+04     |
|    n_updates            | 570         |
|    policy_gradient_loss | 0.00196     |
|    std                  | 0.82        |
|    value_loss           | 2.68e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.74e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 59          |
|    time_elapsed         | 825         |
|    total_timesteps      | 120832      |
| train/                  |             |
|    approx_kl            | 0.015825741 |
|    clip_fraction        | 0.156       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.45       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.94e+04    |
|    n_updates            | 580         |
|    policy_gradient_loss | 0.000557    |
|    std                  | 0.826       |
|    value_loss           | 5.74e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.2e+03    |
|    ep_rew_mean          | 1.75e+04   |
| time/                   |            |
|    fps                  | 146        |
|    iterations           | 60         |
|    time_elapsed         | 839        |
|    total_timesteps      | 122880     |
| train/                  |            |
|    approx_kl            | 0.02055395 |
|    clip_fraction        | 0.19       |
|    clip_range           | 0.2        |
|    entropy_loss         | -2.45      |
|    explained_variance   | 0          |
|    learning_rate        | 0.0003     |
|    loss                 | 1.51e+04   |
|    n_updates            | 590        |
|    policy_gradient_loss | 0.0043     |
|    std                  | 0.819      |
|    value_loss           | 3.72e+04   |
----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.76e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 61          |
|    time_elapsed         | 853         |
|    total_timesteps      | 124928      |
| train/                  |             |
|    approx_kl            | 0.013689511 |
|    clip_fraction        | 0.14        |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.44       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.54e+04    |
|    n_updates            | 600         |
|    policy_gradient_loss | -0.021      |
|    std                  | 0.819       |
|    value_loss           | 3.43e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.76e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 62          |
|    time_elapsed         | 867         |
|    total_timesteps      | 126976      |
| train/                  |             |
|    approx_kl            | 0.015221818 |
|    clip_fraction        | 0.168       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.43       |
|    explained_variance   | 1.19e-07    |
|    learning_rate        | 0.0003      |
|    loss                 | 1.61e+04    |
|    n_updates            | 610         |
|    policy_gradient_loss | -0.0285     |
|    std                  | 0.813       |
|    value_loss           | 3.37e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.2e+03    |
|    ep_rew_mean          | 1.76e+04   |
| time/                   |            |
|    fps                  | 146        |
|    iterations           | 63         |
|    time_elapsed         | 881        |
|    total_timesteps      | 129024     |
| train/                  |            |
|    approx_kl            | 0.04071191 |
|    clip_fraction        | 0.319      |
|    clip_range           | 0.2        |
|    entropy_loss         | -2.42      |
|    explained_variance   | 0          |
|    learning_rate        | 0.0003     |
|    loss                 | 9.33e+03   |
|    n_updates            | 620        |
|    policy_gradient_loss | 0.011      |
|    std                  | 0.811      |
|    value_loss           | 1.98e+04   |
----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.77e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 64          |
|    time_elapsed         | 895         |
|    total_timesteps      | 131072      |
| train/                  |             |
|    approx_kl            | 0.017623218 |
|    clip_fraction        | 0.167       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.43       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 8.13e+03    |
|    n_updates            | 630         |
|    policy_gradient_loss | -0.00306    |
|    std                  | 0.814       |
|    value_loss           | 1.64e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.77e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 65          |
|    time_elapsed         | 910         |
|    total_timesteps      | 133120      |
| train/                  |             |
|    approx_kl            | 0.016778994 |
|    clip_fraction        | 0.204       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.43       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 8.33e+03    |
|    n_updates            | 640         |
|    policy_gradient_loss | 0.00403     |
|    std                  | 0.815       |
|    value_loss           | 1.96e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.77e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 66          |
|    time_elapsed         | 924         |
|    total_timesteps      | 135168      |
| train/                  |             |
|    approx_kl            | 0.021337302 |
|    clip_fraction        | 0.164       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.42       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 7.65e+03    |
|    n_updates            | 650         |
|    policy_gradient_loss | 0.00748     |
|    std                  | 0.807       |
|    value_loss           | 1.62e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.77e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 67          |
|    time_elapsed         | 938         |
|    total_timesteps      | 137216      |
| train/                  |             |
|    approx_kl            | 0.008562895 |
|    clip_fraction        | 0.0779      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.4        |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 7.06e+03    |
|    n_updates            | 660         |
|    policy_gradient_loss | -0.00562    |
|    std                  | 0.805       |
|    value_loss           | 1.56e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.78e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 68          |
|    time_elapsed         | 952         |
|    total_timesteps      | 139264      |
| train/                  |             |
|    approx_kl            | 0.009808671 |
|    clip_fraction        | 0.107       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.4        |
|    explained_variance   | 1.19e-07    |
|    learning_rate        | 0.0003      |
|    loss                 | 9.21e+03    |
|    n_updates            | 670         |
|    policy_gradient_loss | -0.0133     |
|    std                  | 0.801       |
|    value_loss           | 2.23e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.78e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 69          |
|    time_elapsed         | 966         |
|    total_timesteps      | 141312      |
| train/                  |             |
|    approx_kl            | 0.012630733 |
|    clip_fraction        | 0.118       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.4        |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.12e+04    |
|    n_updates            | 680         |
|    policy_gradient_loss | -0.00732    |
|    std                  | 0.803       |
|    value_loss           | 2.18e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.79e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 70          |
|    time_elapsed         | 981         |
|    total_timesteps      | 143360      |
| train/                  |             |
|    approx_kl            | 0.012141417 |
|    clip_fraction        | 0.116       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.39       |
|    explained_variance   | 1.19e-07    |
|    learning_rate        | 0.0003      |
|    loss                 | 2.42e+04    |
|    n_updates            | 690         |
|    policy_gradient_loss | -0.0226     |
|    std                  | 0.795       |
|    value_loss           | 5.2e+04     |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.8e+04     |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 71          |
|    time_elapsed         | 995         |
|    total_timesteps      | 145408      |
| train/                  |             |
|    approx_kl            | 0.023457542 |
|    clip_fraction        | 0.255       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.38       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.07e+04    |
|    n_updates            | 700         |
|    policy_gradient_loss | -0.00289    |
|    std                  | 0.796       |
|    value_loss           | 2.84e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.8e+04     |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 72          |
|    time_elapsed         | 1009        |
|    total_timesteps      | 147456      |
| train/                  |             |
|    approx_kl            | 0.011387791 |
|    clip_fraction        | 0.13        |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.38       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.26e+04    |
|    n_updates            | 710         |
|    policy_gradient_loss | -0.00732    |
|    std                  | 0.792       |
|    value_loss           | 4.41e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.81e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 73          |
|    time_elapsed         | 1023        |
|    total_timesteps      | 149504      |
| train/                  |             |
|    approx_kl            | 0.017695563 |
|    clip_fraction        | 0.173       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.36       |
|    explained_variance   | 2.38e-07    |
|    learning_rate        | 0.0003      |
|    loss                 | 8.58e+03    |
|    n_updates            | 720         |
|    policy_gradient_loss | -0.0087     |
|    std                  | 0.788       |
|    value_loss           | 1.87e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.81e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 74          |
|    time_elapsed         | 1037        |
|    total_timesteps      | 151552      |
| train/                  |             |
|    approx_kl            | 0.018687332 |
|    clip_fraction        | 0.163       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.37       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.59e+04    |
|    n_updates            | 730         |
|    policy_gradient_loss | 0.00265     |
|    std                  | 0.794       |
|    value_loss           | 3.09e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.81e+04    |
| time/                   |             |
|    fps                  | 145         |
|    iterations           | 75          |
|    time_elapsed         | 1052        |
|    total_timesteps      | 153600      |
| train/                  |             |
|    approx_kl            | 0.015589951 |
|    clip_fraction        | 0.124       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.38       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.37e+04    |
|    n_updates            | 740         |
|    policy_gradient_loss | -0.00322    |
|    std                  | 0.801       |
|    value_loss           | 2.91e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.82e+04    |
| time/                   |             |
|    fps                  | 145         |
|    iterations           | 76          |
|    time_elapsed         | 1067        |
|    total_timesteps      | 155648      |
| train/                  |             |
|    approx_kl            | 0.026954753 |
|    clip_fraction        | 0.211       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.4        |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 7.6e+03     |
|    n_updates            | 750         |
|    policy_gradient_loss | 0.00466     |
|    std                  | 0.803       |
|    value_loss           | 1.77e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.82e+04    |
| time/                   |             |
|    fps                  | 145         |
|    iterations           | 77          |
|    time_elapsed         | 1081        |
|    total_timesteps      | 157696      |
| train/                  |             |
|    approx_kl            | 0.021868024 |
|    clip_fraction        | 0.171       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.39       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.55e+04    |
|    n_updates            | 760         |
|    policy_gradient_loss | -0.000461   |
|    std                  | 0.798       |
|    value_loss           | 2.71e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.82e+04    |
| time/                   |             |
|    fps                  | 145         |
|    iterations           | 78          |
|    time_elapsed         | 1095        |
|    total_timesteps      | 159744      |
| train/                  |             |
|    approx_kl            | 0.010552238 |
|    clip_fraction        | 0.145       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.39       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.31e+04    |
|    n_updates            | 770         |
|    policy_gradient_loss | -0.000139   |
|    std                  | 0.799       |
|    value_loss           | 2.61e+04    |
-----------------------------------------


INFO:root:done


----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.2e+03    |
|    ep_rew_mean          | 1.82e+04   |
| time/                   |            |
|    fps                  | 145        |
|    iterations           | 79         |
|    time_elapsed         | 1109       |
|    total_timesteps      | 161792     |
| train/                  |            |
|    approx_kl            | 0.01820229 |
|    clip_fraction        | 0.185      |
|    clip_range           | 0.2        |
|    entropy_loss         | -2.38      |
|    explained_variance   | 0          |
|    learning_rate        | 0.0003     |
|    loss                 | 7.76e+03   |
|    n_updates            | 780        |
|    policy_gradient_loss | 0.000961   |
|    std                  | 0.797      |
|    value_loss           | 1.66e+04   |
----------------------------------------


INFO:root:done
INFO:root:done


----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.2e+03    |
|    ep_rew_mean          | 1.83e+04   |
| time/                   |            |
|    fps                  | 145        |
|    iterations           | 80         |
|    time_elapsed         | 1123       |
|    total_timesteps      | 163840     |
| train/                  |            |
|    approx_kl            | 0.01317868 |
|    clip_fraction        | 0.149      |
|    clip_range           | 0.2        |
|    entropy_loss         | -2.37      |
|    explained_variance   | 5.96e-08   |
|    learning_rate        | 0.0003     |
|    loss                 | 1.53e+04   |
|    n_updates            | 790        |
|    policy_gradient_loss | 0.000614   |
|    std                  | 0.787      |
|    value_loss           | 2.74e+04   |
----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.83e+04    |
| time/                   |             |
|    fps                  | 145         |
|    iterations           | 81          |
|    time_elapsed         | 1137        |
|    total_timesteps      | 165888      |
| train/                  |             |
|    approx_kl            | 0.009161064 |
|    clip_fraction        | 0.142       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.35       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 1.01e+04    |
|    n_updates            | 800         |
|    policy_gradient_loss | -0.00327    |
|    std                  | 0.785       |
|    value_loss           | 2.47e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.83e+04    |
| time/                   |             |
|    fps                  | 145         |
|    iterations           | 82          |
|    time_elapsed         | 1151        |
|    total_timesteps      | 167936      |
| train/                  |             |
|    approx_kl            | 0.009845901 |
|    clip_fraction        | 0.154       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.36       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 8.07e+03    |
|    n_updates            | 810         |
|    policy_gradient_loss | 0.000412    |
|    std                  | 0.789       |
|    value_loss           | 1.35e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 1.83e+04     |
| time/                   |              |
|    fps                  | 145          |
|    iterations           | 83           |
|    time_elapsed         | 1165         |
|    total_timesteps      | 169984       |
| train/                  |              |
|    approx_kl            | 0.0045108087 |
|    clip_fraction        | 0.0742       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.37        |
|    explained_variance   | -1.19e-07    |
|    learning_rate        | 0.0003       |
|    loss                 | 1.34e+04     |
|    n_updates            | 820          |
|    policy_gradient_loss | -0.000618    |
|    std                  | 0.793        |
|    value_loss           | 2.69e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.84e+04    |
| time/                   |             |
|    fps                  | 145         |
|    iterations           | 84          |
|    time_elapsed         | 1179        |
|    total_timesteps      | 172032      |
| train/                  |             |
|    approx_kl            | 0.007392233 |
|    clip_fraction        | 0.077       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.39       |
|    explained_variance   | 1.19e-07    |
|    learning_rate        | 0.0003      |
|    loss                 | 7.97e+03    |
|    n_updates            | 830         |
|    policy_gradient_loss | -4.53e-05   |
|    std                  | 0.803       |
|    value_loss           | 1.55e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.85e+04    |
| time/                   |             |
|    fps                  | 145         |
|    iterations           | 85          |
|    time_elapsed         | 1192        |
|    total_timesteps      | 174080      |
| train/                  |             |
|    approx_kl            | 0.007693232 |
|    clip_fraction        | 0.0707      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.4        |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.41e+04    |
|    n_updates            | 840         |
|    policy_gradient_loss | -0.0114     |
|    std                  | 0.805       |
|    value_loss           | 6.44e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.86e+04    |
| time/                   |             |
|    fps                  | 145         |
|    iterations           | 86          |
|    time_elapsed         | 1206        |
|    total_timesteps      | 176128      |
| train/                  |             |
|    approx_kl            | 0.003904311 |
|    clip_fraction        | 0.0364      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.4        |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 3.42e+04    |
|    n_updates            | 850         |
|    policy_gradient_loss | -0.00264    |
|    std                  | 0.805       |
|    value_loss           | 5.99e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.85e+04    |
| time/                   |             |
|    fps                  | 145         |
|    iterations           | 87          |
|    time_elapsed         | 1220        |
|    total_timesteps      | 178176      |
| train/                  |             |
|    approx_kl            | 0.010545602 |
|    clip_fraction        | 0.105       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.39       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 9.32e+03    |
|    n_updates            | 860         |
|    policy_gradient_loss | 0.00275     |
|    std                  | 0.796       |
|    value_loss           | 1.8e+04     |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 1.85e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 88           |
|    time_elapsed         | 1234         |
|    total_timesteps      | 180224       |
| train/                  |              |
|    approx_kl            | 0.0038952979 |
|    clip_fraction        | 0.0241       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.39        |
|    explained_variance   | 1.19e-07     |
|    learning_rate        | 0.0003       |
|    loss                 | 1.68e+04     |
|    n_updates            | 870          |
|    policy_gradient_loss | 0.00032      |
|    std                  | 0.799        |
|    value_loss           | 3.36e+04     |
------------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 1.85e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 89           |
|    time_elapsed         | 1248         |
|    total_timesteps      | 182272       |
| train/                  |              |
|    approx_kl            | 0.0048363013 |
|    clip_fraction        | 0.0596       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.4         |
|    explained_variance   | -1.19e-07    |
|    learning_rate        | 0.0003       |
|    loss                 | 1.55e+04     |
|    n_updates            | 880          |
|    policy_gradient_loss | -0.00258     |
|    std                  | 0.807        |
|    value_loss           | 2.86e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.86e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 90          |
|    time_elapsed         | 1262        |
|    total_timesteps      | 184320      |
| train/                  |             |
|    approx_kl            | 0.005844402 |
|    clip_fraction        | 0.0595      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.4        |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.69e+04    |
|    n_updates            | 890         |
|    policy_gradient_loss | -0.00509    |
|    std                  | 0.799       |
|    value_loss           | 4.7e+04     |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 1.86e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 91           |
|    time_elapsed         | 1276         |
|    total_timesteps      | 186368       |
| train/                  |              |
|    approx_kl            | 0.0035861044 |
|    clip_fraction        | 0.0293       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.39        |
|    explained_variance   | 1.19e-07     |
|    learning_rate        | 0.0003       |
|    loss                 | 2.3e+04      |
|    n_updates            | 900          |
|    policy_gradient_loss | -0.00208     |
|    std                  | 0.796        |
|    value_loss           | 4.29e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.86e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 92          |
|    time_elapsed         | 1290        |
|    total_timesteps      | 188416      |
| train/                  |             |
|    approx_kl            | 0.008172901 |
|    clip_fraction        | 0.0651      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.38       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.9e+04     |
|    n_updates            | 910         |
|    policy_gradient_loss | -0.00517    |
|    std                  | 0.796       |
|    value_loss           | 4.44e+04    |
-----------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 1.87e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 93           |
|    time_elapsed         | 1303         |
|    total_timesteps      | 190464       |
| train/                  |              |
|    approx_kl            | 0.0052236803 |
|    clip_fraction        | 0.0422       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.38        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.46e+04     |
|    n_updates            | 920          |
|    policy_gradient_loss | -0.00326     |
|    std                  | 0.792        |
|    value_loss           | 2.86e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.87e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 94          |
|    time_elapsed         | 1318        |
|    total_timesteps      | 192512      |
| train/                  |             |
|    approx_kl            | 0.006089763 |
|    clip_fraction        | 0.0486      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.38       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.73e+04    |
|    n_updates            | 930         |
|    policy_gradient_loss | -0.0059     |
|    std                  | 0.795       |
|    value_loss           | 6.3e+04     |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.87e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 95          |
|    time_elapsed         | 1332        |
|    total_timesteps      | 194560      |
| train/                  |             |
|    approx_kl            | 0.007236196 |
|    clip_fraction        | 0.0645      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.37       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 3.39e+04    |
|    n_updates            | 940         |
|    policy_gradient_loss | -0.00312    |
|    std                  | 0.785       |
|    value_loss           | 6.63e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.88e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 96          |
|    time_elapsed         | 1345        |
|    total_timesteps      | 196608      |
| train/                  |             |
|    approx_kl            | 0.009198414 |
|    clip_fraction        | 0.122       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.35       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.32e+04    |
|    n_updates            | 950         |
|    policy_gradient_loss | -0.00422    |
|    std                  | 0.782       |
|    value_loss           | 2.8e+04     |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.88e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 97          |
|    time_elapsed         | 1359        |
|    total_timesteps      | 198656      |
| train/                  |             |
|    approx_kl            | 0.011152923 |
|    clip_fraction        | 0.0958      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.35       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.34e+04    |
|    n_updates            | 960         |
|    policy_gradient_loss | -0.00434    |
|    std                  | 0.785       |
|    value_loss           | 4.03e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.89e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 98          |
|    time_elapsed         | 1373        |
|    total_timesteps      | 200704      |
| train/                  |             |
|    approx_kl            | 0.006587811 |
|    clip_fraction        | 0.0738      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.38       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 7.81e+03    |
|    n_updates            | 970         |
|    policy_gradient_loss | -0.00277    |
|    std                  | 0.799       |
|    value_loss           | 1.71e+04    |
-----------------------------------------


INFO:root:done


----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.2e+03    |
|    ep_rew_mean          | 1.9e+04    |
| time/                   |            |
|    fps                  | 146        |
|    iterations           | 99         |
|    time_elapsed         | 1387       |
|    total_timesteps      | 202752     |
| train/                  |            |
|    approx_kl            | 0.01411744 |
|    clip_fraction        | 0.0879     |
|    clip_range           | 0.2        |
|    entropy_loss         | -2.4       |
|    explained_variance   | 0          |
|    learning_rate        | 0.0003     |
|    loss                 | 4.55e+04   |
|    n_updates            | 980        |
|    policy_gradient_loss | -0.00203   |
|    std                  | 0.804      |
|    value_loss           | 7.91e+04   |
----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.9e+04     |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 100         |
|    time_elapsed         | 1401        |
|    total_timesteps      | 204800      |
| train/                  |             |
|    approx_kl            | 0.013300964 |
|    clip_fraction        | 0.139       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.39       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 3.17e+04    |
|    n_updates            | 990         |
|    policy_gradient_loss | -0.0212     |
|    std                  | 0.793       |
|    value_loss           | 6.25e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.89e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 101         |
|    time_elapsed         | 1415        |
|    total_timesteps      | 206848      |
| train/                  |             |
|    approx_kl            | 0.010988854 |
|    clip_fraction        | 0.116       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.38       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 1.79e+04    |
|    n_updates            | 1000        |
|    policy_gradient_loss | -0.000685   |
|    std                  | 0.797       |
|    value_loss           | 3.73e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.89e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 102         |
|    time_elapsed         | 1429        |
|    total_timesteps      | 208896      |
| train/                  |             |
|    approx_kl            | 0.020069811 |
|    clip_fraction        | 0.228       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.38       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 9.58e+03    |
|    n_updates            | 1010        |
|    policy_gradient_loss | 0.00113     |
|    std                  | 0.793       |
|    value_loss           | 1.88e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.9e+04     |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 103         |
|    time_elapsed         | 1442        |
|    total_timesteps      | 210944      |
| train/                  |             |
|    approx_kl            | 0.010540705 |
|    clip_fraction        | 0.141       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.38       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 1.46e+04    |
|    n_updates            | 1020        |
|    policy_gradient_loss | 0.0011      |
|    std                  | 0.796       |
|    value_loss           | 3.87e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.83e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 104         |
|    time_elapsed         | 1456        |
|    total_timesteps      | 212992      |
| train/                  |             |
|    approx_kl            | 0.009418109 |
|    clip_fraction        | 0.115       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.38       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 1.64e+04    |
|    n_updates            | 1030        |
|    policy_gradient_loss | -0.00633    |
|    std                  | 0.791       |
|    value_loss           | 3.95e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.82e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 105         |
|    time_elapsed         | 1471        |
|    total_timesteps      | 215040      |
| train/                  |             |
|    approx_kl            | 0.012258687 |
|    clip_fraction        | 0.126       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.38       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.26e+04    |
|    n_updates            | 1040        |
|    policy_gradient_loss | -0.00352    |
|    std                  | 0.8         |
|    value_loss           | 3.1e+04     |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.82e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 106         |
|    time_elapsed         | 1484        |
|    total_timesteps      | 217088      |
| train/                  |             |
|    approx_kl            | 0.012993254 |
|    clip_fraction        | 0.159       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.39       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 7.52e+03    |
|    n_updates            | 1050        |
|    policy_gradient_loss | -0.00172    |
|    std                  | 0.801       |
|    value_loss           | 1.62e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.83e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 107         |
|    time_elapsed         | 1498        |
|    total_timesteps      | 219136      |
| train/                  |             |
|    approx_kl            | 0.016626261 |
|    clip_fraction        | 0.13        |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.4        |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.26e+04    |
|    n_updates            | 1060        |
|    policy_gradient_loss | -0.00246    |
|    std                  | 0.807       |
|    value_loss           | 2.54e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.83e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 108         |
|    time_elapsed         | 1512        |
|    total_timesteps      | 221184      |
| train/                  |             |
|    approx_kl            | 0.011392436 |
|    clip_fraction        | 0.127       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.26e+04    |
|    n_updates            | 1070        |
|    policy_gradient_loss | -0.0107     |
|    std                  | 0.805       |
|    value_loss           | 2.62e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.83e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 109         |
|    time_elapsed         | 1525        |
|    total_timesteps      | 223232      |
| train/                  |             |
|    approx_kl            | 0.009496073 |
|    clip_fraction        | 0.0987      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.4        |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 1.8e+04     |
|    n_updates            | 1080        |
|    policy_gradient_loss | -0.00546    |
|    std                  | 0.8         |
|    value_loss           | 3.46e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.82e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 110         |
|    time_elapsed         | 1540        |
|    total_timesteps      | 225280      |
| train/                  |             |
|    approx_kl            | 0.012582979 |
|    clip_fraction        | 0.168       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.39       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 1.79e+04    |
|    n_updates            | 1090        |
|    policy_gradient_loss | -0.00456    |
|    std                  | 0.8         |
|    value_loss           | 3.6e+04     |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.83e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 111         |
|    time_elapsed         | 1553        |
|    total_timesteps      | 227328      |
| train/                  |             |
|    approx_kl            | 0.022164816 |
|    clip_fraction        | 0.167       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 6.02e+03    |
|    n_updates            | 1100        |
|    policy_gradient_loss | 0.00299     |
|    std                  | 0.813       |
|    value_loss           | 1.3e+04     |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.82e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 112         |
|    time_elapsed         | 1567        |
|    total_timesteps      | 229376      |
| train/                  |             |
|    approx_kl            | 0.008020125 |
|    clip_fraction        | 0.0919      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.42       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.25e+04    |
|    n_updates            | 1110        |
|    policy_gradient_loss | -0.00131    |
|    std                  | 0.808       |
|    value_loss           | 5.24e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.82e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 113         |
|    time_elapsed         | 1581        |
|    total_timesteps      | 231424      |
| train/                  |             |
|    approx_kl            | 0.007745044 |
|    clip_fraction        | 0.0853      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 1.7e+04     |
|    n_updates            | 1120        |
|    policy_gradient_loss | -0.00879    |
|    std                  | 0.808       |
|    value_loss           | 2.93e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 1.82e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 114          |
|    time_elapsed         | 1596         |
|    total_timesteps      | 233472       |
| train/                  |              |
|    approx_kl            | 0.0050633173 |
|    clip_fraction        | 0.0913       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.39        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.13e+04     |
|    n_updates            | 1130         |
|    policy_gradient_loss | 0.00214      |
|    std                  | 0.794        |
|    value_loss           | 2.24e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.82e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 115         |
|    time_elapsed         | 1610        |
|    total_timesteps      | 235520      |
| train/                  |             |
|    approx_kl            | 0.009911083 |
|    clip_fraction        | 0.113       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.37       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.08e+04    |
|    n_updates            | 1140        |
|    policy_gradient_loss | -0.00607    |
|    std                  | 0.792       |
|    value_loss           | 2.13e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.83e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 116         |
|    time_elapsed         | 1624        |
|    total_timesteps      | 237568      |
| train/                  |             |
|    approx_kl            | 0.013709651 |
|    clip_fraction        | 0.132       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.38       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.92e+04    |
|    n_updates            | 1150        |
|    policy_gradient_loss | -0.018      |
|    std                  | 0.796       |
|    value_loss           | 3.45e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.83e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 117         |
|    time_elapsed         | 1638        |
|    total_timesteps      | 239616      |
| train/                  |             |
|    approx_kl            | 0.012580525 |
|    clip_fraction        | 0.136       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.38       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 1.82e+04    |
|    n_updates            | 1160        |
|    policy_gradient_loss | 0.00117     |
|    std                  | 0.795       |
|    value_loss           | 3.49e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.84e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 118         |
|    time_elapsed         | 1652        |
|    total_timesteps      | 241664      |
| train/                  |             |
|    approx_kl            | 0.012209925 |
|    clip_fraction        | 0.141       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.38       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.32e+04    |
|    n_updates            | 1170        |
|    policy_gradient_loss | -0.00163    |
|    std                  | 0.793       |
|    value_loss           | 2.49e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.85e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 119         |
|    time_elapsed         | 1667        |
|    total_timesteps      | 243712      |
| train/                  |             |
|    approx_kl            | 0.014715998 |
|    clip_fraction        | 0.148       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.37       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.49e+04    |
|    n_updates            | 1180        |
|    policy_gradient_loss | -0.0196     |
|    std                  | 0.787       |
|    value_loss           | 3.04e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.85e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 120         |
|    time_elapsed         | 1681        |
|    total_timesteps      | 245760      |
| train/                  |             |
|    approx_kl            | 0.012587525 |
|    clip_fraction        | 0.0777      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.35       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 3.2e+04     |
|    n_updates            | 1190        |
|    policy_gradient_loss | -0.00513    |
|    std                  | 0.78        |
|    value_loss           | 6.58e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.86e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 121         |
|    time_elapsed         | 1695        |
|    total_timesteps      | 247808      |
| train/                  |             |
|    approx_kl            | 0.017470002 |
|    clip_fraction        | 0.16        |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.35       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.34e+04    |
|    n_updates            | 1200        |
|    policy_gradient_loss | 0.000161    |
|    std                  | 0.787       |
|    value_loss           | 2.82e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.87e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 122         |
|    time_elapsed         | 1710        |
|    total_timesteps      | 249856      |
| train/                  |             |
|    approx_kl            | 0.012832021 |
|    clip_fraction        | 0.123       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.35       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.17e+04    |
|    n_updates            | 1210        |
|    policy_gradient_loss | -0.000444   |
|    std                  | 0.783       |
|    value_loss           | 3.83e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.88e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 123         |
|    time_elapsed         | 1723        |
|    total_timesteps      | 251904      |
| train/                  |             |
|    approx_kl            | 0.014430864 |
|    clip_fraction        | 0.149       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.36       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.04e+04    |
|    n_updates            | 1220        |
|    policy_gradient_loss | -0.00634    |
|    std                  | 0.788       |
|    value_loss           | 1.51e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.89e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 124         |
|    time_elapsed         | 1737        |
|    total_timesteps      | 253952      |
| train/                  |             |
|    approx_kl            | 0.014055605 |
|    clip_fraction        | 0.124       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.36       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.82e+04    |
|    n_updates            | 1230        |
|    policy_gradient_loss | -0.0191     |
|    std                  | 0.785       |
|    value_loss           | 4.33e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.91e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 125         |
|    time_elapsed         | 1751        |
|    total_timesteps      | 256000      |
| train/                  |             |
|    approx_kl            | 0.016250223 |
|    clip_fraction        | 0.169       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.36       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.46e+04    |
|    n_updates            | 1240        |
|    policy_gradient_loss | -0.00511    |
|    std                  | 0.789       |
|    value_loss           | 2.91e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.94e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 126         |
|    time_elapsed         | 1765        |
|    total_timesteps      | 258048      |
| train/                  |             |
|    approx_kl            | 0.011430523 |
|    clip_fraction        | 0.108       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.35       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.07e+04    |
|    n_updates            | 1250        |
|    policy_gradient_loss | 0.000287    |
|    std                  | 0.78        |
|    value_loss           | 4.04e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.94e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 127         |
|    time_elapsed         | 1780        |
|    total_timesteps      | 260096      |
| train/                  |             |
|    approx_kl            | 0.012471996 |
|    clip_fraction        | 0.0835      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.35       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 6.54e+04    |
|    n_updates            | 1260        |
|    policy_gradient_loss | -0.00831    |
|    std                  | 0.784       |
|    value_loss           | 1.33e+05    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.95e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 128         |
|    time_elapsed         | 1794        |
|    total_timesteps      | 262144      |
| train/                  |             |
|    approx_kl            | 0.008992329 |
|    clip_fraction        | 0.0826      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.36       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 1.44e+04    |
|    n_updates            | 1270        |
|    policy_gradient_loss | -0.000448   |
|    std                  | 0.791       |
|    value_loss           | 3.41e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.96e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 129         |
|    time_elapsed         | 1808        |
|    total_timesteps      | 264192      |
| train/                  |             |
|    approx_kl            | 0.011706731 |
|    clip_fraction        | 0.13        |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.36       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.73e+04    |
|    n_updates            | 1280        |
|    policy_gradient_loss | -0.00362    |
|    std                  | 0.785       |
|    value_loss           | 5.66e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 1.98e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 130         |
|    time_elapsed         | 1822        |
|    total_timesteps      | 266240      |
| train/                  |             |
|    approx_kl            | 0.013437878 |
|    clip_fraction        | 0.155       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.36       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.45e+04    |
|    n_updates            | 1290        |
|    policy_gradient_loss | -0.000298   |
|    std                  | 0.788       |
|    value_loss           | 6.05e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2e+04       |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 131         |
|    time_elapsed         | 1835        |
|    total_timesteps      | 268288      |
| train/                  |             |
|    approx_kl            | 0.006905757 |
|    clip_fraction        | 0.0843      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.36       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 8.57e+04    |
|    n_updates            | 1300        |
|    policy_gradient_loss | -0.0066     |
|    std                  | 0.79        |
|    value_loss           | 1.43e+05    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.03e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 132         |
|    time_elapsed         | 1849        |
|    total_timesteps      | 270336      |
| train/                  |             |
|    approx_kl            | 0.010834164 |
|    clip_fraction        | 0.129       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.36       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.93e+04    |
|    n_updates            | 1310        |
|    policy_gradient_loss | -0.00354    |
|    std                  | 0.786       |
|    value_loss           | 4.28e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.03e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 133         |
|    time_elapsed         | 1862        |
|    total_timesteps      | 272384      |
| train/                  |             |
|    approx_kl            | 0.009356933 |
|    clip_fraction        | 0.118       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.36       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 5.64e+04    |
|    n_updates            | 1320        |
|    policy_gradient_loss | -0.000485   |
|    std                  | 0.79        |
|    value_loss           | 1.04e+05    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.04e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 134         |
|    time_elapsed         | 1876        |
|    total_timesteps      | 274432      |
| train/                  |             |
|    approx_kl            | 0.017256424 |
|    clip_fraction        | 0.203       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.37       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 1.22e+04    |
|    n_updates            | 1330        |
|    policy_gradient_loss | 0.000761    |
|    std                  | 0.79        |
|    value_loss           | 1.97e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.07e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 135         |
|    time_elapsed         | 1890        |
|    total_timesteps      | 276480      |
| train/                  |             |
|    approx_kl            | 0.016726445 |
|    clip_fraction        | 0.161       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.37       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 2.15e+04    |
|    n_updates            | 1340        |
|    policy_gradient_loss | -0.0122     |
|    std                  | 0.791       |
|    value_loss           | 4.34e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.12e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 136         |
|    time_elapsed         | 1904        |
|    total_timesteps      | 278528      |
| train/                  |             |
|    approx_kl            | 0.010385685 |
|    clip_fraction        | 0.0725      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.37       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 5.79e+04    |
|    n_updates            | 1350        |
|    policy_gradient_loss | -0.00434    |
|    std                  | 0.792       |
|    value_loss           | 1.09e+05    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.14e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 137         |
|    time_elapsed         | 1918        |
|    total_timesteps      | 280576      |
| train/                  |             |
|    approx_kl            | 0.007573339 |
|    clip_fraction        | 0.0746      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.36       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.96e+05    |
|    n_updates            | 1360        |
|    policy_gradient_loss | -0.00349    |
|    std                  | 0.787       |
|    value_loss           | 3.02e+05    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.16e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 138          |
|    time_elapsed         | 1931         |
|    total_timesteps      | 282624       |
| train/                  |              |
|    approx_kl            | 0.0070940517 |
|    clip_fraction        | 0.061        |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.37        |
|    explained_variance   | 5.96e-08     |
|    learning_rate        | 0.0003       |
|    loss                 | 5.67e+04     |
|    n_updates            | 1370         |
|    policy_gradient_loss | -0.00315     |
|    std                  | 0.793        |
|    value_loss           | 1.01e+05     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.2e+04     |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 139         |
|    time_elapsed         | 1945        |
|    total_timesteps      | 284672      |
| train/                  |             |
|    approx_kl            | 0.014831897 |
|    clip_fraction        | 0.139       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.37       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 5.4e+04     |
|    n_updates            | 1380        |
|    policy_gradient_loss | -0.0122     |
|    std                  | 0.788       |
|    value_loss           | 9.77e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.22e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 140         |
|    time_elapsed         | 1959        |
|    total_timesteps      | 286720      |
| train/                  |             |
|    approx_kl            | 0.009213081 |
|    clip_fraction        | 0.0839      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.36       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.25e+05    |
|    n_updates            | 1390        |
|    policy_gradient_loss | -0.00645    |
|    std                  | 0.791       |
|    value_loss           | 1.94e+05    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.26e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 141         |
|    time_elapsed         | 1972        |
|    total_timesteps      | 288768      |
| train/                  |             |
|    approx_kl            | 0.006149709 |
|    clip_fraction        | 0.0662      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.36       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 8e+04       |
|    n_updates            | 1400        |
|    policy_gradient_loss | -0.00861    |
|    std                  | 0.788       |
|    value_loss           | 1.55e+05    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.29e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 142         |
|    time_elapsed         | 1986        |
|    total_timesteps      | 290816      |
| train/                  |             |
|    approx_kl            | 0.006930629 |
|    clip_fraction        | 0.0487      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.36       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 5.58e+04    |
|    n_updates            | 1410        |
|    policy_gradient_loss | -0.00344    |
|    std                  | 0.788       |
|    value_loss           | 1.27e+05    |
-----------------------------------------


INFO:root:done
INFO:root:done


----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.2e+03    |
|    ep_rew_mean          | 2.32e+04   |
| time/                   |            |
|    fps                  | 146        |
|    iterations           | 143        |
|    time_elapsed         | 2001       |
|    total_timesteps      | 292864     |
| train/                  |            |
|    approx_kl            | 0.02277663 |
|    clip_fraction        | 0.25       |
|    clip_range           | 0.2        |
|    entropy_loss         | -2.36      |
|    explained_variance   | 0          |
|    learning_rate        | 0.0003     |
|    loss                 | 8.34e+04   |
|    n_updates            | 1420       |
|    policy_gradient_loss | 0.000407   |
|    std                  | 0.787      |
|    value_loss           | 1.83e+05   |
----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.32e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 144         |
|    time_elapsed         | 2015        |
|    total_timesteps      | 294912      |
| train/                  |             |
|    approx_kl            | 0.008937445 |
|    clip_fraction        | 0.0673      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.36       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.12e+05    |
|    n_updates            | 1430        |
|    policy_gradient_loss | -0.0128     |
|    std                  | 0.787       |
|    value_loss           | 2.2e+05     |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.35e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 145         |
|    time_elapsed         | 2029        |
|    total_timesteps      | 296960      |
| train/                  |             |
|    approx_kl            | 0.018521799 |
|    clip_fraction        | 0.169       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.36       |
|    explained_variance   | 1.19e-07    |
|    learning_rate        | 0.0003      |
|    loss                 | 1.56e+04    |
|    n_updates            | 1440        |
|    policy_gradient_loss | 0.00163     |
|    std                  | 0.791       |
|    value_loss           | 2.76e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.37e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 146         |
|    time_elapsed         | 2043        |
|    total_timesteps      | 299008      |
| train/                  |             |
|    approx_kl            | 0.009504773 |
|    clip_fraction        | 0.0929      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.37       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 4.66e+04    |
|    n_updates            | 1450        |
|    policy_gradient_loss | -0.0122     |
|    std                  | 0.791       |
|    value_loss           | 1.29e+05    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.39e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 147         |
|    time_elapsed         | 2057        |
|    total_timesteps      | 301056      |
| train/                  |             |
|    approx_kl            | 0.010224592 |
|    clip_fraction        | 0.0879      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.36       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 5.47e+04    |
|    n_updates            | 1460        |
|    policy_gradient_loss | -0.011      |
|    std                  | 0.786       |
|    value_loss           | 1.05e+05    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.39e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 148          |
|    time_elapsed         | 2071         |
|    total_timesteps      | 303104       |
| train/                  |              |
|    approx_kl            | 0.0090159215 |
|    clip_fraction        | 0.0808       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.35        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 3.04e+04     |
|    n_updates            | 1470         |
|    policy_gradient_loss | -0.00925     |
|    std                  | 0.784        |
|    value_loss           | 7.15e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.4e+04     |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 149         |
|    time_elapsed         | 2086        |
|    total_timesteps      | 305152      |
| train/                  |             |
|    approx_kl            | 0.012324146 |
|    clip_fraction        | 0.104       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.34       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 3.83e+04    |
|    n_updates            | 1480        |
|    policy_gradient_loss | -0.00913    |
|    std                  | 0.778       |
|    value_loss           | 6.28e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.44e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 150         |
|    time_elapsed         | 2100        |
|    total_timesteps      | 307200      |
| train/                  |             |
|    approx_kl            | 0.021044672 |
|    clip_fraction        | 0.224       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.32       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 2.7e+04     |
|    n_updates            | 1490        |
|    policy_gradient_loss | 0.00276     |
|    std                  | 0.769       |
|    value_loss           | 6.01e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.45e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 151         |
|    time_elapsed         | 2114        |
|    total_timesteps      | 309248      |
| train/                  |             |
|    approx_kl            | 0.010620867 |
|    clip_fraction        | 0.0963      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.31       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.11e+05    |
|    n_updates            | 1500        |
|    policy_gradient_loss | -0.00823    |
|    std                  | 0.768       |
|    value_loss           | 1.93e+05    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.45e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 152         |
|    time_elapsed         | 2128        |
|    total_timesteps      | 311296      |
| train/                  |             |
|    approx_kl            | 0.009820145 |
|    clip_fraction        | 0.0984      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.32       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.57e+04    |
|    n_updates            | 1510        |
|    policy_gradient_loss | -0.00385    |
|    std                  | 0.774       |
|    value_loss           | 4.87e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.47e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 153         |
|    time_elapsed         | 2141        |
|    total_timesteps      | 313344      |
| train/                  |             |
|    approx_kl            | 0.039277826 |
|    clip_fraction        | 0.188       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.32       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 4.78e+04    |
|    n_updates            | 1520        |
|    policy_gradient_loss | 0.00633     |
|    std                  | 0.772       |
|    value_loss           | 1.02e+05    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.47e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 154         |
|    time_elapsed         | 2155        |
|    total_timesteps      | 315392      |
| train/                  |             |
|    approx_kl            | 0.022092113 |
|    clip_fraction        | 0.17        |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.32       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 3.24e+04    |
|    n_updates            | 1530        |
|    policy_gradient_loss | 0.00478     |
|    std                  | 0.772       |
|    value_loss           | 5.83e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.5e+04     |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 155         |
|    time_elapsed         | 2168        |
|    total_timesteps      | 317440      |
| train/                  |             |
|    approx_kl            | 0.010579394 |
|    clip_fraction        | 0.125       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.32       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 2.14e+04    |
|    n_updates            | 1540        |
|    policy_gradient_loss | -0.0027     |
|    std                  | 0.774       |
|    value_loss           | 4.66e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.49e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 156         |
|    time_elapsed         | 2183        |
|    total_timesteps      | 319488      |
| train/                  |             |
|    approx_kl            | 0.010778338 |
|    clip_fraction        | 0.0829      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.32       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 5.97e+04    |
|    n_updates            | 1550        |
|    policy_gradient_loss | -0.00432    |
|    std                  | 0.772       |
|    value_loss           | 1.23e+05    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.49e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 157         |
|    time_elapsed         | 2197        |
|    total_timesteps      | 321536      |
| train/                  |             |
|    approx_kl            | 0.017274696 |
|    clip_fraction        | 0.183       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.33       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 8.04e+03    |
|    n_updates            | 1560        |
|    policy_gradient_loss | 0.000794    |
|    std                  | 0.783       |
|    value_loss           | 1.86e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.48e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 158         |
|    time_elapsed         | 2211        |
|    total_timesteps      | 323584      |
| train/                  |             |
|    approx_kl            | 0.034241498 |
|    clip_fraction        | 0.183       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.35       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 5.16e+03    |
|    n_updates            | 1570        |
|    policy_gradient_loss | 0.00284     |
|    std                  | 0.786       |
|    value_loss           | 1.15e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


---------------------------------------
| rollout/                |           |
|    ep_len_mean          | 1.2e+03   |
|    ep_rew_mean          | 2.48e+04  |
| time/                   |           |
|    fps                  | 146       |
|    iterations           | 159       |
|    time_elapsed         | 2225      |
|    total_timesteps      | 325632    |
| train/                  |           |
|    approx_kl            | 0.3389376 |
|    clip_fraction        | 0.471     |
|    clip_range           | 0.2       |
|    entropy_loss         | -2.43     |
|    explained_variance   | 0         |
|    learning_rate        | 0.0003    |
|    loss                 | 1.96e+03  |
|    n_updates            | 1580      |
|    policy_gradient_loss | 0.019     |
|    std                  | 0.835     |
|    value_loss           | 9.1e+03   |
---------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.48e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 160         |
|    time_elapsed         | 2239        |
|    total_timesteps      | 327680      |
| train/                  |             |
|    approx_kl            | 0.005281109 |
|    clip_fraction        | 0.0663      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.47       |
|    explained_variance   | 1.19e-07    |
|    learning_rate        | 0.0003      |
|    loss                 | 1.78e+04    |
|    n_updates            | 1590        |
|    policy_gradient_loss | -0.00419    |
|    std                  | 0.837       |
|    value_loss           | 3.84e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.48e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 161         |
|    time_elapsed         | 2253        |
|    total_timesteps      | 329728      |
| train/                  |             |
|    approx_kl            | 0.005753454 |
|    clip_fraction        | 0.085       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.47       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 4.91e+03    |
|    n_updates            | 1600        |
|    policy_gradient_loss | 0.000773    |
|    std                  | 0.835       |
|    value_loss           | 1.32e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.5e+04      |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 162          |
|    time_elapsed         | 2267         |
|    total_timesteps      | 331776       |
| train/                  |              |
|    approx_kl            | 0.0048351064 |
|    clip_fraction        | 0.0298       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.47        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 2.47e+04     |
|    n_updates            | 1610         |
|    policy_gradient_loss | -0.0025      |
|    std                  | 0.834        |
|    value_loss           | 5.31e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.51e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 163          |
|    time_elapsed         | 2280         |
|    total_timesteps      | 333824       |
| train/                  |              |
|    approx_kl            | 0.0068735047 |
|    clip_fraction        | 0.059        |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.47        |
|    explained_variance   | 1.19e-07     |
|    learning_rate        | 0.0003       |
|    loss                 | 3.23e+04     |
|    n_updates            | 1620         |
|    policy_gradient_loss | -0.00626     |
|    std                  | 0.834        |
|    value_loss           | 7.44e+04     |
------------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.51e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 164         |
|    time_elapsed         | 2294        |
|    total_timesteps      | 335872      |
| train/                  |             |
|    approx_kl            | 0.009292517 |
|    clip_fraction        | 0.0956      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.47       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 1.75e+04    |
|    n_updates            | 1630        |
|    policy_gradient_loss | -0.0124     |
|    std                  | 0.832       |
|    value_loss           | 2.73e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.52e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 165          |
|    time_elapsed         | 2308         |
|    total_timesteps      | 337920       |
| train/                  |              |
|    approx_kl            | 0.0064372486 |
|    clip_fraction        | 0.0664       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.46        |
|    explained_variance   | -1.19e-07    |
|    learning_rate        | 0.0003       |
|    loss                 | 2.31e+04     |
|    n_updates            | 1640         |
|    policy_gradient_loss | -0.0029      |
|    std                  | 0.83         |
|    value_loss           | 5.65e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.54e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 166          |
|    time_elapsed         | 2322         |
|    total_timesteps      | 339968       |
| train/                  |              |
|    approx_kl            | 0.0118397325 |
|    clip_fraction        | 0.183        |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.46        |
|    explained_variance   | -1.19e-07    |
|    learning_rate        | 0.0003       |
|    loss                 | 1.12e+04     |
|    n_updates            | 1650         |
|    policy_gradient_loss | 0.00627      |
|    std                  | 0.833        |
|    value_loss           | 1.55e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.55e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 167         |
|    time_elapsed         | 2337        |
|    total_timesteps      | 342016      |
| train/                  |             |
|    approx_kl            | 0.003156255 |
|    clip_fraction        | 0.0204      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.47       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 8.21e+04    |
|    n_updates            | 1660        |
|    policy_gradient_loss | -0.000906   |
|    std                  | 0.833       |
|    value_loss           | 1.49e+05    |
-----------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.57e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 168          |
|    time_elapsed         | 2351         |
|    total_timesteps      | 344064       |
| train/                  |              |
|    approx_kl            | 0.0041007777 |
|    clip_fraction        | 0.0239       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.47        |
|    explained_variance   | -1.19e-07    |
|    learning_rate        | 0.0003       |
|    loss                 | 4.92e+04     |
|    n_updates            | 1670         |
|    policy_gradient_loss | -0.00197     |
|    std                  | 0.832        |
|    value_loss           | 8.43e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.58e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 169          |
|    time_elapsed         | 2365         |
|    total_timesteps      | 346112       |
| train/                  |              |
|    approx_kl            | 0.0029526413 |
|    clip_fraction        | 0.0184       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.47        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 6.44e+04     |
|    n_updates            | 1680         |
|    policy_gradient_loss | -0.00202     |
|    std                  | 0.833        |
|    value_loss           | 1.13e+05     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.58e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 170         |
|    time_elapsed         | 2379        |
|    total_timesteps      | 348160      |
| train/                  |             |
|    approx_kl            | 0.007881822 |
|    clip_fraction        | 0.0965      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.46       |
|    explained_variance   | -2.38e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 9.15e+03    |
|    n_updates            | 1690        |
|    policy_gradient_loss | -0.00135    |
|    std                  | 0.823       |
|    value_loss           | 2.51e+04    |
-----------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.58e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 171          |
|    time_elapsed         | 2393         |
|    total_timesteps      | 350208       |
| train/                  |              |
|    approx_kl            | 0.0045934375 |
|    clip_fraction        | 0.0451       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.45        |
|    explained_variance   | 5.96e-08     |
|    learning_rate        | 0.0003       |
|    loss                 | 2.02e+04     |
|    n_updates            | 1700         |
|    policy_gradient_loss | 7.48e-05     |
|    std                  | 0.825        |
|    value_loss           | 4.4e+04      |
------------------------------------------


INFO:root:done
INFO:root:done


---------------------------------------
| rollout/                |           |
|    ep_len_mean          | 1.2e+03   |
|    ep_rew_mean          | 2.59e+04  |
| time/                   |           |
|    fps                  | 146       |
|    iterations           | 172       |
|    time_elapsed         | 2407      |
|    total_timesteps      | 352256    |
| train/                  |           |
|    approx_kl            | 0.0055109 |
|    clip_fraction        | 0.0672    |
|    clip_range           | 0.2       |
|    entropy_loss         | -2.44     |
|    explained_variance   | 5.96e-08  |
|    learning_rate        | 0.0003    |
|    loss                 | 1.64e+04  |
|    n_updates            | 1710      |
|    policy_gradient_loss | 0.00243   |
|    std                  | 0.821     |
|    value_loss           | 3.85e+04  |
---------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.62e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 173         |
|    time_elapsed         | 2421        |
|    total_timesteps      | 354304      |
| train/                  |             |
|    approx_kl            | 0.005828525 |
|    clip_fraction        | 0.0809      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.44       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 2.34e+04    |
|    n_updates            | 1720        |
|    policy_gradient_loss | 0.0044      |
|    std                  | 0.822       |
|    value_loss           | 3.74e+04    |
-----------------------------------------


INFO:root:done


----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.2e+03    |
|    ep_rew_mean          | 2.62e+04   |
| time/                   |            |
|    fps                  | 146        |
|    iterations           | 174        |
|    time_elapsed         | 2435       |
|    total_timesteps      | 356352     |
| train/                  |            |
|    approx_kl            | 0.00395523 |
|    clip_fraction        | 0.0248     |
|    clip_range           | 0.2        |
|    entropy_loss         | -2.44      |
|    explained_variance   | 0          |
|    learning_rate        | 0.0003     |
|    loss                 | 7.21e+04   |
|    n_updates            | 1730       |
|    policy_gradient_loss | -0.00267   |
|    std                  | 0.817      |
|    value_loss           | 1.65e+05   |
----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.63e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 175         |
|    time_elapsed         | 2449        |
|    total_timesteps      | 358400      |
| train/                  |             |
|    approx_kl            | 0.006548295 |
|    clip_fraction        | 0.0367      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.43       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 1.54e+04    |
|    n_updates            | 1740        |
|    policy_gradient_loss | -0.00366    |
|    std                  | 0.815       |
|    value_loss           | 2.5e+04     |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.63e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 176          |
|    time_elapsed         | 2463         |
|    total_timesteps      | 360448       |
| train/                  |              |
|    approx_kl            | 0.0050562853 |
|    clip_fraction        | 0.0362       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.42        |
|    explained_variance   | -1.19e-07    |
|    learning_rate        | 0.0003       |
|    loss                 | 3.59e+04     |
|    n_updates            | 1750         |
|    policy_gradient_loss | -0.00158     |
|    std                  | 0.81         |
|    value_loss           | 5.88e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.62e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 177         |
|    time_elapsed         | 2477        |
|    total_timesteps      | 362496      |
| train/                  |             |
|    approx_kl            | 0.046167284 |
|    clip_fraction        | 0.241       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.4        |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 4.45e+03    |
|    n_updates            | 1760        |
|    policy_gradient_loss | 0.00491     |
|    std                  | 0.804       |
|    value_loss           | 1.21e+04    |
-----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.61e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 178         |
|    time_elapsed         | 2492        |
|    total_timesteps      | 364544      |
| train/                  |             |
|    approx_kl            | 0.016748011 |
|    clip_fraction        | 0.11        |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.4        |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 7.36e+03    |
|    n_updates            | 1770        |
|    policy_gradient_loss | -0.00313    |
|    std                  | 0.809       |
|    value_loss           | 1.6e+04     |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.65e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 179          |
|    time_elapsed         | 2506         |
|    total_timesteps      | 366592       |
| train/                  |              |
|    approx_kl            | 0.0056960853 |
|    clip_fraction        | 0.0494       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | -1.19e-07    |
|    learning_rate        | 0.0003       |
|    loss                 | 2.12e+04     |
|    n_updates            | 1780         |
|    policy_gradient_loss | -0.00719     |
|    std                  | 0.809        |
|    value_loss           | 4.06e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.67e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 180          |
|    time_elapsed         | 2519         |
|    total_timesteps      | 368640       |
| train/                  |              |
|    approx_kl            | 0.0038355822 |
|    clip_fraction        | 0.017        |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.16e+05     |
|    n_updates            | 1790         |
|    policy_gradient_loss | -0.00269     |
|    std                  | 0.81         |
|    value_loss           | 2.43e+05     |
------------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.71e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 181         |
|    time_elapsed         | 2534        |
|    total_timesteps      | 370688      |
| train/                  |             |
|    approx_kl            | 0.004950725 |
|    clip_fraction        | 0.0298      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 3.29e+04    |
|    n_updates            | 1800        |
|    policy_gradient_loss | -0.00428    |
|    std                  | 0.808       |
|    value_loss           | 9.81e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.69e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 182          |
|    time_elapsed         | 2548         |
|    total_timesteps      | 372736       |
| train/                  |              |
|    approx_kl            | 0.0062711835 |
|    clip_fraction        | 0.0457       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.4         |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 9.28e+04     |
|    n_updates            | 1810         |
|    policy_gradient_loss | -0.00529     |
|    std                  | 0.804        |
|    value_loss           | 2.42e+05     |
------------------------------------------


INFO:root:done
INFO:root:done


----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.2e+03    |
|    ep_rew_mean          | 2.72e+04   |
| time/                   |            |
|    fps                  | 146        |
|    iterations           | 183        |
|    time_elapsed         | 2562       |
|    total_timesteps      | 374784     |
| train/                  |            |
|    approx_kl            | 0.03769949 |
|    clip_fraction        | 0.276      |
|    clip_range           | 0.2        |
|    entropy_loss         | -2.39      |
|    explained_variance   | -1.19e-07  |
|    learning_rate        | 0.0003     |
|    loss                 | 4.11e+03   |
|    n_updates            | 1820       |
|    policy_gradient_loss | 0.017      |
|    std                  | 0.803      |
|    value_loss           | 1.27e+04   |
----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.71e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 184          |
|    time_elapsed         | 2577         |
|    total_timesteps      | 376832       |
| train/                  |              |
|    approx_kl            | 0.0017561743 |
|    clip_fraction        | 0.0173       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.4         |
|    explained_variance   | -1.19e-07    |
|    learning_rate        | 0.0003       |
|    loss                 | 1.12e+05     |
|    n_updates            | 1830         |
|    policy_gradient_loss | -0.0024      |
|    std                  | 0.804        |
|    value_loss           | 2.6e+05      |
------------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.72e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 185         |
|    time_elapsed         | 2591        |
|    total_timesteps      | 378880      |
| train/                  |             |
|    approx_kl            | 0.112695605 |
|    clip_fraction        | 0.332       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 2.72e+03    |
|    n_updates            | 1840        |
|    policy_gradient_loss | 0.0256      |
|    std                  | 0.814       |
|    value_loss           | 1.46e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.71e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 186          |
|    time_elapsed         | 2605         |
|    total_timesteps      | 380928       |
| train/                  |              |
|    approx_kl            | 0.0053791683 |
|    clip_fraction        | 0.0456       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.42        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 6.82e+04     |
|    n_updates            | 1850         |
|    policy_gradient_loss | -0.00408     |
|    std                  | 0.814        |
|    value_loss           | 1.39e+05     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.7e+04     |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 187         |
|    time_elapsed         | 2619        |
|    total_timesteps      | 382976      |
| train/                  |             |
|    approx_kl            | 0.010274031 |
|    clip_fraction        | 0.294       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.42       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 3.92e+03    |
|    n_updates            | 1860        |
|    policy_gradient_loss | 0.0151      |
|    std                  | 0.809       |
|    value_loss           | 1.58e+04    |
-----------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.7e+04      |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 188          |
|    time_elapsed         | 2633         |
|    total_timesteps      | 385024       |
| train/                  |              |
|    approx_kl            | 0.0063446662 |
|    clip_fraction        | 0.0343       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 2.59e+04     |
|    n_updates            | 1870         |
|    policy_gradient_loss | -0.00318     |
|    std                  | 0.808        |
|    value_loss           | 5.11e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.69e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 189         |
|    time_elapsed         | 2647        |
|    total_timesteps      | 387072      |
| train/                  |             |
|    approx_kl            | 0.001311849 |
|    clip_fraction        | 0.00337     |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.88e+04    |
|    n_updates            | 1880        |
|    policy_gradient_loss | -0.0015     |
|    std                  | 0.808       |
|    value_loss           | 6.04e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.7e+04      |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 190          |
|    time_elapsed         | 2661         |
|    total_timesteps      | 389120       |
| train/                  |              |
|    approx_kl            | 0.0020473837 |
|    clip_fraction        | 0.00845      |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 2.45e+04     |
|    n_updates            | 1890         |
|    policy_gradient_loss | -0.000309    |
|    std                  | 0.808        |
|    value_loss           | 3.35e+04     |
------------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.68e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 191          |
|    time_elapsed         | 2675         |
|    total_timesteps      | 391168       |
| train/                  |              |
|    approx_kl            | 0.0038499257 |
|    clip_fraction        | 0.0162       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | -1.19e-07    |
|    learning_rate        | 0.0003       |
|    loss                 | 6.08e+04     |
|    n_updates            | 1900         |
|    policy_gradient_loss | -0.00169     |
|    std                  | 0.809        |
|    value_loss           | 1.22e+05     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.68e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 192          |
|    time_elapsed         | 2689         |
|    total_timesteps      | 393216       |
| train/                  |              |
|    approx_kl            | 0.0040635746 |
|    clip_fraction        | 0.0566       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.4         |
|    explained_variance   | -1.19e-07    |
|    learning_rate        | 0.0003       |
|    loss                 | 749          |
|    n_updates            | 1910         |
|    policy_gradient_loss | 0.00125      |
|    std                  | 0.8          |
|    value_loss           | 6.02e+03     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.69e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 193          |
|    time_elapsed         | 2703         |
|    total_timesteps      | 395264       |
| train/                  |              |
|    approx_kl            | 0.0049852952 |
|    clip_fraction        | 0.0297       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.39        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 4.81e+04     |
|    n_updates            | 1920         |
|    policy_gradient_loss | -0.00322     |
|    std                  | 0.798        |
|    value_loss           | 8.63e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.64e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 194          |
|    time_elapsed         | 2717         |
|    total_timesteps      | 397312       |
| train/                  |              |
|    approx_kl            | 0.0051691593 |
|    clip_fraction        | 0.0332       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.38        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.07e+05     |
|    n_updates            | 1930         |
|    policy_gradient_loss | -0.00202     |
|    std                  | 0.797        |
|    value_loss           | 2.04e+05     |
------------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.65e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 195         |
|    time_elapsed         | 2730        |
|    total_timesteps      | 399360      |
| train/                  |             |
|    approx_kl            | 0.029682703 |
|    clip_fraction        | 0.232       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.39       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 3.45e+03    |
|    n_updates            | 1940        |
|    policy_gradient_loss | 0.00683     |
|    std                  | 0.802       |
|    value_loss           | 1.23e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.65e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 196          |
|    time_elapsed         | 2745         |
|    total_timesteps      | 401408       |
| train/                  |              |
|    approx_kl            | 0.0015565101 |
|    clip_fraction        | 0.000586     |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.39        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.25e+05     |
|    n_updates            | 1950         |
|    policy_gradient_loss | -0.000973    |
|    std                  | 0.803        |
|    value_loss           | 2.14e+05     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.61e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 197          |
|    time_elapsed         | 2759         |
|    total_timesteps      | 403456       |
| train/                  |              |
|    approx_kl            | 0.0031888187 |
|    clip_fraction        | 0.0339       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.39        |
|    explained_variance   | -1.19e-07    |
|    learning_rate        | 0.0003       |
|    loss                 | 3.59e+04     |
|    n_updates            | 1960         |
|    policy_gradient_loss | -0.00151     |
|    std                  | 0.799        |
|    value_loss           | 7.24e+04     |
------------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.58e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 198          |
|    time_elapsed         | 2773         |
|    total_timesteps      | 405504       |
| train/                  |              |
|    approx_kl            | 0.0026603849 |
|    clip_fraction        | 0.0128       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.38        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.31e+04     |
|    n_updates            | 1970         |
|    policy_gradient_loss | -0.00043     |
|    std                  | 0.799        |
|    value_loss           | 1.3e+04      |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.54e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 199         |
|    time_elapsed         | 2786        |
|    total_timesteps      | 407552      |
| train/                  |             |
|    approx_kl            | 0.010369105 |
|    clip_fraction        | 0.222       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.39       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 1.18e+04    |
|    n_updates            | 1980        |
|    policy_gradient_loss | 0.00338     |
|    std                  | 0.811       |
|    value_loss           | 6.25e+03    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.52e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 200          |
|    time_elapsed         | 2800         |
|    total_timesteps      | 409600       |
| train/                  |              |
|    approx_kl            | 0.0053892815 |
|    clip_fraction        | 0.0947       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 9.45e+03     |
|    n_updates            | 1990         |
|    policy_gradient_loss | -0.00246     |
|    std                  | 0.809        |
|    value_loss           | 2.89e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.51e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 201          |
|    time_elapsed         | 2814         |
|    total_timesteps      | 411648       |
| train/                  |              |
|    approx_kl            | 0.0005793912 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | 1.19e-07     |
|    learning_rate        | 0.0003       |
|    loss                 | 3.87e+04     |
|    n_updates            | 2000         |
|    policy_gradient_loss | -0.00027     |
|    std                  | 0.809        |
|    value_loss           | 7.86e+04     |
------------------------------------------


INFO:root:done


-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.2e+03       |
|    ep_rew_mean          | 2.49e+04      |
| time/                   |               |
|    fps                  | 146           |
|    iterations           | 202           |
|    time_elapsed         | 2828          |
|    total_timesteps      | 413696        |
| train/                  |               |
|    approx_kl            | 0.00032858778 |
|    clip_fraction        | 9.77e-05      |
|    clip_range           | 0.2           |
|    entropy_loss         | -2.41         |
|    explained_variance   | 0             |
|    learning_rate        | 0.0003        |
|    loss                 | 3.17e+04      |
|    n_updates            | 2010          |
|    policy_gradient_loss | -0.000896     |
|    std                  | 0.809         |
|    value_loss           | 7.33e+04      |
-------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.49e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 203          |
|    time_elapsed         | 2842         |
|    total_timesteps      | 415744       |
| train/                  |              |
|    approx_kl            | 0.0017202175 |
|    clip_fraction        | 0.00449      |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | -2.38e-07    |
|    learning_rate        | 0.0003       |
|    loss                 | 1.14e+04     |
|    n_updates            | 2020         |
|    policy_gradient_loss | -0.000631    |
|    std                  | 0.81         |
|    value_loss           | 2.05e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.45e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 204         |
|    time_elapsed         | 2856        |
|    total_timesteps      | 417792      |
| train/                  |             |
|    approx_kl            | 0.046429716 |
|    clip_fraction        | 0.167       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.4        |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 1.88e+04    |
|    n_updates            | 2030        |
|    policy_gradient_loss | 0.00882     |
|    std                  | 0.804       |
|    value_loss           | 3.4e+04     |
-----------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.44e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 205          |
|    time_elapsed         | 2870         |
|    total_timesteps      | 419840       |
| train/                  |              |
|    approx_kl            | 0.0034502659 |
|    clip_fraction        | 0.109        |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.39        |
|    explained_variance   | 5.96e-08     |
|    learning_rate        | 0.0003       |
|    loss                 | 9.04e+03     |
|    n_updates            | 2040         |
|    policy_gradient_loss | 0.00265      |
|    std                  | 0.797        |
|    value_loss           | 1.39e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.46e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 206          |
|    time_elapsed         | 2883         |
|    total_timesteps      | 421888       |
| train/                  |              |
|    approx_kl            | 0.0037220747 |
|    clip_fraction        | 0.0311       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.38        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 2.32e+04     |
|    n_updates            | 2050         |
|    policy_gradient_loss | -0.00105     |
|    std                  | 0.796        |
|    value_loss           | 5.83e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.44e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 207          |
|    time_elapsed         | 2897         |
|    total_timesteps      | 423936       |
| train/                  |              |
|    approx_kl            | 0.0004281234 |
|    clip_fraction        | 0.000293     |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.38        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 3.34e+04     |
|    n_updates            | 2060         |
|    policy_gradient_loss | -0.000554    |
|    std                  | 0.796        |
|    value_loss           | 9.22e+04     |
------------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.43e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 208         |
|    time_elapsed         | 2911        |
|    total_timesteps      | 425984      |
| train/                  |             |
|    approx_kl            | 0.028351426 |
|    clip_fraction        | 0.161       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.39       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 7.21e+03    |
|    n_updates            | 2070        |
|    policy_gradient_loss | 0.00645     |
|    std                  | 0.804       |
|    value_loss           | 1.54e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.2e+03       |
|    ep_rew_mean          | 2.41e+04      |
| time/                   |               |
|    fps                  | 146           |
|    iterations           | 209           |
|    time_elapsed         | 2926          |
|    total_timesteps      | 428032        |
| train/                  |               |
|    approx_kl            | 0.00055873254 |
|    clip_fraction        | 0.00405       |
|    clip_range           | 0.2           |
|    entropy_loss         | -2.4          |
|    explained_variance   | 5.96e-08      |
|    learning_rate        | 0.0003        |
|    loss                 | 5.4e+04       |
|    n_updates            | 2080          |
|    policy_gradient_loss | 0.000205      |
|    std                  | 0.804         |
|    value_loss           | 9.32e+04      |
-------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.41e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 210          |
|    time_elapsed         | 2940         |
|    total_timesteps      | 430080       |
| train/                  |              |
|    approx_kl            | 0.0024209775 |
|    clip_fraction        | 0.00566      |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.4         |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 5.19e+03     |
|    n_updates            | 2090         |
|    policy_gradient_loss | -0.000807    |
|    std                  | 0.804        |
|    value_loss           | 1.16e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.2e+03       |
|    ep_rew_mean          | 2.37e+04      |
| time/                   |               |
|    fps                  | 146           |
|    iterations           | 211           |
|    time_elapsed         | 2953          |
|    total_timesteps      | 432128        |
| train/                  |               |
|    approx_kl            | 0.00040300813 |
|    clip_fraction        | 0.00166       |
|    clip_range           | 0.2           |
|    entropy_loss         | -2.4          |
|    explained_variance   | 0             |
|    learning_rate        | 0.0003        |
|    loss                 | 2.68e+04      |
|    n_updates            | 2100          |
|    policy_gradient_loss | -0.00108      |
|    std                  | 0.804         |
|    value_loss           | 6.24e+04      |
-------------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.36e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 212         |
|    time_elapsed         | 2967        |
|    total_timesteps      | 434176      |
| train/                  |             |
|    approx_kl            | 0.015826616 |
|    clip_fraction        | 0.182       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 246         |
|    n_updates            | 2110        |
|    policy_gradient_loss | 0.00561     |
|    std                  | 0.808       |
|    value_loss           | 1.35e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.36e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 213         |
|    time_elapsed         | 2981        |
|    total_timesteps      | 436224      |
| train/                  |             |
|    approx_kl            | 0.012660749 |
|    clip_fraction        | 0.101       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 2.59e+03    |
|    n_updates            | 2120        |
|    policy_gradient_loss | 0.000261    |
|    std                  | 0.811       |
|    value_loss           | 1.27e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.34e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 214          |
|    time_elapsed         | 2995         |
|    total_timesteps      | 438272       |
| train/                  |              |
|    approx_kl            | 0.0036898132 |
|    clip_fraction        | 0.00488      |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.42        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.2e+04      |
|    n_updates            | 2130         |
|    policy_gradient_loss | -0.00151     |
|    std                  | 0.812        |
|    value_loss           | 2.93e+04     |
------------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.33e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 215          |
|    time_elapsed         | 3009         |
|    total_timesteps      | 440320       |
| train/                  |              |
|    approx_kl            | 0.0035534608 |
|    clip_fraction        | 0.0886       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | 5.96e-08     |
|    learning_rate        | 0.0003       |
|    loss                 | 3.25e+03     |
|    n_updates            | 2140         |
|    policy_gradient_loss | 0.0017       |
|    std                  | 0.807        |
|    value_loss           | 1.61e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.34e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 216         |
|    time_elapsed         | 3023        |
|    total_timesteps      | 442368      |
| train/                  |             |
|    approx_kl            | 0.012538008 |
|    clip_fraction        | 0.15        |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.4        |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 3.45e+03    |
|    n_updates            | 2150        |
|    policy_gradient_loss | 9.65e-05    |
|    std                  | 0.809       |
|    value_loss           | 7.32e+03    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.35e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 217          |
|    time_elapsed         | 3037         |
|    total_timesteps      | 444416       |
| train/                  |              |
|    approx_kl            | 0.0019840915 |
|    clip_fraction        | 0.0177       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | -0.000356    |
|    learning_rate        | 0.0003       |
|    loss                 | 2.69e+04     |
|    n_updates            | 2160         |
|    policy_gradient_loss | -0.000967    |
|    std                  | 0.809        |
|    value_loss           | 3.04e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.35e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 218         |
|    time_elapsed         | 3051        |
|    total_timesteps      | 446464      |
| train/                  |             |
|    approx_kl            | 0.001042171 |
|    clip_fraction        | 0.000781    |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.1e+04     |
|    n_updates            | 2170        |
|    policy_gradient_loss | -0.00139    |
|    std                  | 0.809       |
|    value_loss           | 3.16e+04    |
-----------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.35e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 219          |
|    time_elapsed         | 3065         |
|    total_timesteps      | 448512       |
| train/                  |              |
|    approx_kl            | 0.0033211915 |
|    clip_fraction        | 0.0119       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | -1.19e-07    |
|    learning_rate        | 0.0003       |
|    loss                 | 1.18e+04     |
|    n_updates            | 2180         |
|    policy_gradient_loss | -0.00112     |
|    std                  | 0.81         |
|    value_loss           | 1.92e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.33e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 220         |
|    time_elapsed         | 3080        |
|    total_timesteps      | 450560      |
| train/                  |             |
|    approx_kl            | 0.003660666 |
|    clip_fraction        | 0.0357      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | 5.96e-08    |
|    learning_rate        | 0.0003      |
|    loss                 | 4.07e+03    |
|    n_updates            | 2190        |
|    policy_gradient_loss | -1.56e-05   |
|    std                  | 0.809       |
|    value_loss           | 1.39e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.33e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 221          |
|    time_elapsed         | 3094         |
|    total_timesteps      | 452608       |
| train/                  |              |
|    approx_kl            | 0.0108067915 |
|    clip_fraction        | 0.129        |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.4         |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.08e+04     |
|    n_updates            | 2200         |
|    policy_gradient_loss | 0.00199      |
|    std                  | 0.806        |
|    value_loss           | 1.67e+04     |
------------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.33e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 222          |
|    time_elapsed         | 3108         |
|    total_timesteps      | 454656       |
| train/                  |              |
|    approx_kl            | 0.0047326735 |
|    clip_fraction        | 0.0202       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.4         |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 9.75e+03     |
|    n_updates            | 2210         |
|    policy_gradient_loss | -0.00268     |
|    std                  | 0.807        |
|    value_loss           | 2.33e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.33e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 223          |
|    time_elapsed         | 3122         |
|    total_timesteps      | 456704       |
| train/                  |              |
|    approx_kl            | 0.0014149009 |
|    clip_fraction        | 0.00132      |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.4         |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.72e+04     |
|    n_updates            | 2220         |
|    policy_gradient_loss | -0.00202     |
|    std                  | 0.807        |
|    value_loss           | 3.66e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.34e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 224          |
|    time_elapsed         | 3136         |
|    total_timesteps      | 458752       |
| train/                  |              |
|    approx_kl            | 0.0013034248 |
|    clip_fraction        | 0.0357       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | 5.96e-08     |
|    learning_rate        | 0.0003       |
|    loss                 | 2.16e+04     |
|    n_updates            | 2230         |
|    policy_gradient_loss | 0.00152      |
|    std                  | 0.807        |
|    value_loss           | 2.69e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.32e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 225          |
|    time_elapsed         | 3150         |
|    total_timesteps      | 460800       |
| train/                  |              |
|    approx_kl            | 0.0039016686 |
|    clip_fraction        | 0.00903      |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.4         |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.09e+04     |
|    n_updates            | 2240         |
|    policy_gradient_loss | -0.00199     |
|    std                  | 0.807        |
|    value_loss           | 3.81e+04     |
------------------------------------------


INFO:root:done


---------------------------------------
| rollout/                |           |
|    ep_len_mean          | 1.2e+03   |
|    ep_rew_mean          | 2.32e+04  |
| time/                   |           |
|    fps                  | 146       |
|    iterations           | 226       |
|    time_elapsed         | 3165      |
|    total_timesteps      | 462848    |
| train/                  |           |
|    approx_kl            | 0.0084801 |
|    clip_fraction        | 0.13      |
|    clip_range           | 0.2       |
|    entropy_loss         | -2.4      |
|    explained_variance   | 1.19e-07  |
|    learning_rate        | 0.0003    |
|    loss                 | 6e+03     |
|    n_updates            | 2250      |
|    policy_gradient_loss | 0.00199   |
|    std                  | 0.808     |
|    value_loss           | 2.17e+04  |
---------------------------------------


INFO:root:done
INFO:root:done


-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.2e+03       |
|    ep_rew_mean          | 2.31e+04      |
| time/                   |               |
|    fps                  | 146           |
|    iterations           | 227           |
|    time_elapsed         | 3179          |
|    total_timesteps      | 464896        |
| train/                  |               |
|    approx_kl            | 0.00023483767 |
|    clip_fraction        | 0.000146      |
|    clip_range           | 0.2           |
|    entropy_loss         | -2.41         |
|    explained_variance   | 0             |
|    learning_rate        | 0.0003        |
|    loss                 | 2.13e+04      |
|    n_updates            | 2260          |
|    policy_gradient_loss | -0.000311     |
|    std                  | 0.808         |
|    value_loss           | 4.64e+04      |
-------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.32e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 228         |
|    time_elapsed         | 3194        |
|    total_timesteps      | 466944      |
| train/                  |             |
|    approx_kl            | 0.003948936 |
|    clip_fraction        | 0.0161      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 1.05e+04    |
|    n_updates            | 2270        |
|    policy_gradient_loss | -0.00127    |
|    std                  | 0.808       |
|    value_loss           | 2.96e+04    |
-----------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.32e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 229          |
|    time_elapsed         | 3207         |
|    total_timesteps      | 468992       |
| train/                  |              |
|    approx_kl            | 0.0038660553 |
|    clip_fraction        | 0.0431       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.15e+04     |
|    n_updates            | 2280         |
|    policy_gradient_loss | 0.000561     |
|    std                  | 0.812        |
|    value_loss           | 2.38e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.32e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 230          |
|    time_elapsed         | 3222         |
|    total_timesteps      | 471040       |
| train/                  |              |
|    approx_kl            | 0.0028741036 |
|    clip_fraction        | 0.00298      |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.42        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.35e+04     |
|    n_updates            | 2290         |
|    policy_gradient_loss | -0.000437    |
|    std                  | 0.813        |
|    value_loss           | 3.84e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.33e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 231          |
|    time_elapsed         | 3236         |
|    total_timesteps      | 473088       |
| train/                  |              |
|    approx_kl            | 0.0040713735 |
|    clip_fraction        | 0.018        |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.42        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.46e+04     |
|    n_updates            | 2300         |
|    policy_gradient_loss | -0.00247     |
|    std                  | 0.811        |
|    value_loss           | 4.17e+04     |
------------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.33e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 232         |
|    time_elapsed         | 3249        |
|    total_timesteps      | 475136      |
| train/                  |             |
|    approx_kl            | 0.003803351 |
|    clip_fraction        | 0.0143      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 2.13e+04    |
|    n_updates            | 2310        |
|    policy_gradient_loss | -0.00162    |
|    std                  | 0.81        |
|    value_loss           | 5.85e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.35e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 233         |
|    time_elapsed         | 3264        |
|    total_timesteps      | 477184      |
| train/                  |             |
|    approx_kl            | 0.003550175 |
|    clip_fraction        | 0.00645     |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 3.27e+04    |
|    n_updates            | 2320        |
|    policy_gradient_loss | -0.00135    |
|    std                  | 0.808       |
|    value_loss           | 9.78e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.35e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 234         |
|    time_elapsed         | 3278        |
|    total_timesteps      | 479232      |
| train/                  |             |
|    approx_kl            | 0.004422415 |
|    clip_fraction        | 0.0224      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.78e+04    |
|    n_updates            | 2330        |
|    policy_gradient_loss | -0.00225    |
|    std                  | 0.81        |
|    value_loss           | 4.07e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.38e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 235         |
|    time_elapsed         | 3292        |
|    total_timesteps      | 481280      |
| train/                  |             |
|    approx_kl            | 0.005243501 |
|    clip_fraction        | 0.0271      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | -1.19e-07   |
|    learning_rate        | 0.0003      |
|    loss                 | 2.62e+04    |
|    n_updates            | 2340        |
|    policy_gradient_loss | -0.00261    |
|    std                  | 0.808       |
|    value_loss           | 6.23e+04    |
-----------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.38e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 236          |
|    time_elapsed         | 3307         |
|    total_timesteps      | 483328       |
| train/                  |              |
|    approx_kl            | 0.0031656963 |
|    clip_fraction        | 0.00898      |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.4         |
|    explained_variance   | -1.19e-07    |
|    learning_rate        | 0.0003       |
|    loss                 | 3.83e+04     |
|    n_updates            | 2350         |
|    policy_gradient_loss | -0.00145     |
|    std                  | 0.805        |
|    value_loss           | 8.18e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.2e+03    |
|    ep_rew_mean          | 2.38e+04   |
| time/                   |            |
|    fps                  | 146        |
|    iterations           | 237        |
|    time_elapsed         | 3321       |
|    total_timesteps      | 485376     |
| train/                  |            |
|    approx_kl            | 0.02401856 |
|    clip_fraction        | 0.148      |
|    clip_range           | 0.2        |
|    entropy_loss         | -2.4       |
|    explained_variance   | 0          |
|    learning_rate        | 0.0003     |
|    loss                 | 4.8e+03    |
|    n_updates            | 2360       |
|    policy_gradient_loss | 0.00311    |
|    std                  | 0.807      |
|    value_loss           | 1.74e+04   |
----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.34e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 238          |
|    time_elapsed         | 3335         |
|    total_timesteps      | 487424       |
| train/                  |              |
|    approx_kl            | 0.0060438355 |
|    clip_fraction        | 0.0741       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.06e+04     |
|    n_updates            | 2370         |
|    policy_gradient_loss | -0.00169     |
|    std                  | 0.807        |
|    value_loss           | 3.13e+04     |
------------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.33e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 239         |
|    time_elapsed         | 3349        |
|    total_timesteps      | 489472      |
| train/                  |             |
|    approx_kl            | 0.018512787 |
|    clip_fraction        | 0.191       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.81e+03    |
|    n_updates            | 2380        |
|    policy_gradient_loss | 0.00743     |
|    std                  | 0.81        |
|    value_loss           | 1.83e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.3e+04      |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 240          |
|    time_elapsed         | 3363         |
|    total_timesteps      | 491520       |
| train/                  |              |
|    approx_kl            | 0.0036351169 |
|    clip_fraction        | 0.00693      |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.18e+04     |
|    n_updates            | 2390         |
|    policy_gradient_loss | 0.000194     |
|    std                  | 0.811        |
|    value_loss           | 1.35e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.29e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 241          |
|    time_elapsed         | 3378         |
|    total_timesteps      | 493568       |
| train/                  |              |
|    approx_kl            | 0.0012722991 |
|    clip_fraction        | 0.0724       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.42        |
|    explained_variance   | -2.38e-07    |
|    learning_rate        | 0.0003       |
|    loss                 | 4.58e+03     |
|    n_updates            | 2400         |
|    policy_gradient_loss | 0.00193      |
|    std                  | 0.821        |
|    value_loss           | 1.83e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.26e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 242         |
|    time_elapsed         | 3391        |
|    total_timesteps      | 495616      |
| train/                  |             |
|    approx_kl            | 0.007410402 |
|    clip_fraction        | 0.127       |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.44       |
|    explained_variance   | 0           |
|    learning_rate        | 0.0003      |
|    loss                 | 1.23e+04    |
|    n_updates            | 2410        |
|    policy_gradient_loss | -8.05e-05   |
|    std                  | 0.82        |
|    value_loss           | 1.77e+04    |
-----------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.26e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 243          |
|    time_elapsed         | 3406         |
|    total_timesteps      | 497664       |
| train/                  |              |
|    approx_kl            | 0.0041202432 |
|    clip_fraction        | 0.0963       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.43        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 2.45e+03     |
|    n_updates            | 2420         |
|    policy_gradient_loss | 0.00295      |
|    std                  | 0.816        |
|    value_loss           | 1.72e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.24e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 244          |
|    time_elapsed         | 3419         |
|    total_timesteps      | 499712       |
| train/                  |              |
|    approx_kl            | 0.0060717333 |
|    clip_fraction        | 0.0815       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.42        |
|    explained_variance   | 0            |
|    learning_rate        | 0.0003       |
|    loss                 | 1.66e+03     |
|    n_updates            | 2430         |
|    policy_gradient_loss | 0.00202      |
|    std                  | 0.809        |
|    value_loss           | 1.02e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.23e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 245         |
|    time_elapsed         | 3433        |
|    total_timesteps      | 501760      |
| train/                  |             |
|    approx_kl            | 0.009494521 |
|    clip_fraction        | 0.0968      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | -1.67e-06   |
|    learning_rate        | 0.0003      |
|    loss                 | 1.33e+04    |
|    n_updates            | 2440        |
|    policy_gradient_loss | 0.00231     |
|    std                  | 0.808       |
|    value_loss           | 2.07e+04    |
-----------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.23e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 246          |
|    time_elapsed         | 3447         |
|    total_timesteps      | 503808       |
| train/                  |              |
|    approx_kl            | 0.0074363374 |
|    clip_fraction        | 0.113        |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | 1.19e-07     |
|    learning_rate        | 0.0003       |
|    loss                 | 4.9e+03      |
|    n_updates            | 2450         |
|    policy_gradient_loss | -0.00458     |
|    std                  | 0.809        |
|    value_loss           | 1.94e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.2e+03       |
|    ep_rew_mean          | 2.22e+04      |
| time/                   |               |
|    fps                  | 146           |
|    iterations           | 247           |
|    time_elapsed         | 3462          |
|    total_timesteps      | 505856        |
| train/                  |               |
|    approx_kl            | 0.00016550135 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -2.41         |
|    explained_variance   | 0.0293        |
|    learning_rate        | 0.0003        |
|    loss                 | 1.98e+03      |
|    n_updates            | 2460          |
|    policy_gradient_loss | -0.000727     |
|    std                  | 0.809         |
|    value_loss           | 1.2e+04       |
-------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.22e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 248          |
|    time_elapsed         | 3476         |
|    total_timesteps      | 507904       |
| train/                  |              |
|    approx_kl            | 7.399553e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | 0.00365      |
|    learning_rate        | 0.0003       |
|    loss                 | 3.81e+03     |
|    n_updates            | 2470         |
|    policy_gradient_loss | -0.00032     |
|    std                  | 0.809        |
|    value_loss           | 1.85e+04     |
------------------------------------------


INFO:root:done


-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.2e+03       |
|    ep_rew_mean          | 2.2e+04       |
| time/                   |               |
|    fps                  | 146           |
|    iterations           | 249           |
|    time_elapsed         | 3491          |
|    total_timesteps      | 509952        |
| train/                  |               |
|    approx_kl            | 3.3023127e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -2.41         |
|    explained_variance   | 0.0456        |
|    learning_rate        | 0.0003        |
|    loss                 | 5.78e+03      |
|    n_updates            | 2480          |
|    policy_gradient_loss | -0.000183     |
|    std                  | 0.809         |
|    value_loss           | 1.76e+04      |
-------------------------------------------


INFO:root:done
INFO:root:done


-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.2e+03       |
|    ep_rew_mean          | 2.2e+04       |
| time/                   |               |
|    fps                  | 146           |
|    iterations           | 250           |
|    time_elapsed         | 3506          |
|    total_timesteps      | 512000        |
| train/                  |               |
|    approx_kl            | 0.00059629336 |
|    clip_fraction        | 0.000195      |
|    clip_range           | 0.2           |
|    entropy_loss         | -2.41         |
|    explained_variance   | 0.0449        |
|    learning_rate        | 0.0003        |
|    loss                 | 2.57e+03      |
|    n_updates            | 2490          |
|    policy_gradient_loss | -0.00111      |
|    std                  | 0.809         |
|    value_loss           | 1.22e+04      |
-------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.16e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 251          |
|    time_elapsed         | 3519         |
|    total_timesteps      | 514048       |
| train/                  |              |
|    approx_kl            | 0.0009990113 |
|    clip_fraction        | 0.000586     |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | -0.0359      |
|    learning_rate        | 0.0003       |
|    loss                 | 812          |
|    n_updates            | 2500         |
|    policy_gradient_loss | -0.00156     |
|    std                  | 0.809        |
|    value_loss           | 1.52e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.17e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 252          |
|    time_elapsed         | 3533         |
|    total_timesteps      | 516096       |
| train/                  |              |
|    approx_kl            | 0.0003530182 |
|    clip_fraction        | 4.88e-05     |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | 0.0463       |
|    learning_rate        | 0.0003       |
|    loss                 | 892          |
|    n_updates            | 2510         |
|    policy_gradient_loss | -0.000284    |
|    std                  | 0.809        |
|    value_loss           | 1.64e+04     |
------------------------------------------


INFO:root:done


-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.2e+03       |
|    ep_rew_mean          | 2.18e+04      |
| time/                   |               |
|    fps                  | 146           |
|    iterations           | 253           |
|    time_elapsed         | 3547          |
|    total_timesteps      | 518144        |
| train/                  |               |
|    approx_kl            | 0.00089185615 |
|    clip_fraction        | 0.000879      |
|    clip_range           | 0.2           |
|    entropy_loss         | -2.41         |
|    explained_variance   | 0.103         |
|    learning_rate        | 0.0003        |
|    loss                 | 2.46e+03      |
|    n_updates            | 2520          |
|    policy_gradient_loss | -0.000789     |
|    std                  | 0.809         |
|    value_loss           | 1.8e+04       |
-------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.13e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 254          |
|    time_elapsed         | 3561         |
|    total_timesteps      | 520192       |
| train/                  |              |
|    approx_kl            | 0.0028053296 |
|    clip_fraction        | 0.00186      |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | 0.368        |
|    learning_rate        | 0.0003       |
|    loss                 | 9.63e+03     |
|    n_updates            | 2530         |
|    policy_gradient_loss | -0.000788    |
|    std                  | 0.81         |
|    value_loss           | 1.33e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.14e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 255          |
|    time_elapsed         | 3575         |
|    total_timesteps      | 522240       |
| train/                  |              |
|    approx_kl            | 0.0039466303 |
|    clip_fraction        | 0.0203       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | -0.0361      |
|    learning_rate        | 0.0003       |
|    loss                 | 2.19e+03     |
|    n_updates            | 2540         |
|    policy_gradient_loss | 0.000274     |
|    std                  | 0.809        |
|    value_loss           | 1.9e+04      |
------------------------------------------


INFO:root:done


-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.2e+03       |
|    ep_rew_mean          | 2.15e+04      |
| time/                   |               |
|    fps                  | 146           |
|    iterations           | 256           |
|    time_elapsed         | 3589          |
|    total_timesteps      | 524288        |
| train/                  |               |
|    approx_kl            | 0.00028643274 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -2.41         |
|    explained_variance   | 0.0213        |
|    learning_rate        | 0.0003        |
|    loss                 | 6.52e+03      |
|    n_updates            | 2550          |
|    policy_gradient_loss | 8.64e-05      |
|    std                  | 0.809         |
|    value_loss           | 1.88e+04      |
-------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.16e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 257          |
|    time_elapsed         | 3603         |
|    total_timesteps      | 526336       |
| train/                  |              |
|    approx_kl            | 0.0022042603 |
|    clip_fraction        | 0.000586     |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | -0.089       |
|    learning_rate        | 0.0003       |
|    loss                 | 775          |
|    n_updates            | 2560         |
|    policy_gradient_loss | -0.000991    |
|    std                  | 0.809        |
|    value_loss           | 8.67e+03     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.15e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 258          |
|    time_elapsed         | 3617         |
|    total_timesteps      | 528384       |
| train/                  |              |
|    approx_kl            | 0.0015742909 |
|    clip_fraction        | 9.77e-05     |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | 0.00236      |
|    learning_rate        | 0.0003       |
|    loss                 | 2.01e+04     |
|    n_updates            | 2570         |
|    policy_gradient_loss | -0.000447    |
|    std                  | 0.809        |
|    value_loss           | 2.96e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.15e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 259          |
|    time_elapsed         | 3631         |
|    total_timesteps      | 530432       |
| train/                  |              |
|    approx_kl            | 0.0011505384 |
|    clip_fraction        | 4.88e-05     |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | 0.0671       |
|    learning_rate        | 0.0003       |
|    loss                 | 5.94e+03     |
|    n_updates            | 2580         |
|    policy_gradient_loss | 5.33e-05     |
|    std                  | 0.81         |
|    value_loss           | 2.46e+04     |
------------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.15e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 260          |
|    time_elapsed         | 3645         |
|    total_timesteps      | 532480       |
| train/                  |              |
|    approx_kl            | 0.0020698789 |
|    clip_fraction        | 0.00186      |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | 0.0463       |
|    learning_rate        | 0.0003       |
|    loss                 | 3.04e+04     |
|    n_updates            | 2590         |
|    policy_gradient_loss | -0.000916    |
|    std                  | 0.808        |
|    value_loss           | 3.13e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.15e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 261          |
|    time_elapsed         | 3659         |
|    total_timesteps      | 534528       |
| train/                  |              |
|    approx_kl            | 0.0019356541 |
|    clip_fraction        | 0.000439     |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | 0.105        |
|    learning_rate        | 0.0003       |
|    loss                 | 3.13e+04     |
|    n_updates            | 2600         |
|    policy_gradient_loss | -0.00123     |
|    std                  | 0.809        |
|    value_loss           | 3.38e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.16e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 262         |
|    time_elapsed         | 3673        |
|    total_timesteps      | 536576      |
| train/                  |             |
|    approx_kl            | 0.002667516 |
|    clip_fraction        | 0.00283     |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | 0.0638      |
|    learning_rate        | 0.0003      |
|    loss                 | 1.07e+04    |
|    n_updates            | 2610        |
|    policy_gradient_loss | -0.000874   |
|    std                  | 0.808       |
|    value_loss           | 2.81e+04    |
-----------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.16e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 263          |
|    time_elapsed         | 3687         |
|    total_timesteps      | 538624       |
| train/                  |              |
|    approx_kl            | 0.0012219141 |
|    clip_fraction        | 4.88e-05     |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | -0.00145     |
|    learning_rate        | 0.0003       |
|    loss                 | 3.06e+03     |
|    n_updates            | 2620         |
|    policy_gradient_loss | -0.000616    |
|    std                  | 0.808        |
|    value_loss           | 1.75e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.17e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 264         |
|    time_elapsed         | 3700        |
|    total_timesteps      | 540672      |
| train/                  |             |
|    approx_kl            | 0.005010533 |
|    clip_fraction        | 0.0207      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | -0.147      |
|    learning_rate        | 0.0003      |
|    loss                 | 7.37e+03    |
|    n_updates            | 2630        |
|    policy_gradient_loss | -0.00171    |
|    std                  | 0.806       |
|    value_loss           | 1.31e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.17e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 265          |
|    time_elapsed         | 3714         |
|    total_timesteps      | 542720       |
| train/                  |              |
|    approx_kl            | 0.0048290873 |
|    clip_fraction        | 0.0277       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.4         |
|    explained_variance   | -0.00296     |
|    learning_rate        | 0.0003       |
|    loss                 | 3.21e+04     |
|    n_updates            | 2640         |
|    policy_gradient_loss | -0.00252     |
|    std                  | 0.805        |
|    value_loss           | 4.99e+04     |
------------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.18e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 266         |
|    time_elapsed         | 3727        |
|    total_timesteps      | 544768      |
| train/                  |             |
|    approx_kl            | 0.003666722 |
|    clip_fraction        | 0.0182      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.41       |
|    explained_variance   | 0.000949    |
|    learning_rate        | 0.0003      |
|    loss                 | 1.45e+04    |
|    n_updates            | 2650        |
|    policy_gradient_loss | -0.00188    |
|    std                  | 0.807       |
|    value_loss           | 4.53e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.17e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 267          |
|    time_elapsed         | 3741         |
|    total_timesteps      | 546816       |
| train/                  |              |
|    approx_kl            | 0.0023065237 |
|    clip_fraction        | 0.00718      |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.41        |
|    explained_variance   | -0.0564      |
|    learning_rate        | 0.0003       |
|    loss                 | 1.37e+04     |
|    n_updates            | 2660         |
|    policy_gradient_loss | -0.00142     |
|    std                  | 0.806        |
|    value_loss           | 3.46e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.19e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 268          |
|    time_elapsed         | 3755         |
|    total_timesteps      | 548864       |
| train/                  |              |
|    approx_kl            | 0.0022016664 |
|    clip_fraction        | 0.0953       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.43        |
|    explained_variance   | 1.13e-05     |
|    learning_rate        | 0.0003       |
|    loss                 | 9.75e+03     |
|    n_updates            | 2670         |
|    policy_gradient_loss | 0.00357      |
|    std                  | 0.818        |
|    value_loss           | 2.46e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.2e+04      |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 269          |
|    time_elapsed         | 3769         |
|    total_timesteps      | 550912       |
| train/                  |              |
|    approx_kl            | 0.0034754355 |
|    clip_fraction        | 0.00435      |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.44        |
|    explained_variance   | 5.17e-05     |
|    learning_rate        | 0.0003       |
|    loss                 | 1.39e+04     |
|    n_updates            | 2680         |
|    policy_gradient_loss | -0.000553    |
|    std                  | 0.821        |
|    value_loss           | 4.52e+04     |
------------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.2e+04     |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 270         |
|    time_elapsed         | 3783        |
|    total_timesteps      | 552960      |
| train/                  |             |
|    approx_kl            | 0.003219577 |
|    clip_fraction        | 0.0194      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.45       |
|    explained_variance   | 8.4e-06     |
|    learning_rate        | 0.0003      |
|    loss                 | 1.15e+04    |
|    n_updates            | 2690        |
|    policy_gradient_loss | -0.00137    |
|    std                  | 0.824       |
|    value_loss           | 3.43e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.21e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 271          |
|    time_elapsed         | 3797         |
|    total_timesteps      | 555008       |
| train/                  |              |
|    approx_kl            | 0.0036321243 |
|    clip_fraction        | 0.0465       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.45        |
|    explained_variance   | -2e-05       |
|    learning_rate        | 0.0003       |
|    loss                 | 6.58e+03     |
|    n_updates            | 2700         |
|    policy_gradient_loss | 0.00056      |
|    std                  | 0.825        |
|    value_loss           | 1.69e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.21e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 272          |
|    time_elapsed         | 3811         |
|    total_timesteps      | 557056       |
| train/                  |              |
|    approx_kl            | 0.0023997384 |
|    clip_fraction        | 0.0219       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.46        |
|    explained_variance   | 3.99e-05     |
|    learning_rate        | 0.0003       |
|    loss                 | 5.82e+03     |
|    n_updates            | 2710         |
|    policy_gradient_loss | -0.000638    |
|    std                  | 0.83         |
|    value_loss           | 2.49e+04     |
------------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.21e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 273          |
|    time_elapsed         | 3825         |
|    total_timesteps      | 559104       |
| train/                  |              |
|    approx_kl            | 0.0010495745 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.46        |
|    explained_variance   | 0.014        |
|    learning_rate        | 0.0003       |
|    loss                 | 2.08e+04     |
|    n_updates            | 2720         |
|    policy_gradient_loss | -0.000137    |
|    std                  | 0.829        |
|    value_loss           | 3.1e+04      |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.23e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 274          |
|    time_elapsed         | 3838         |
|    total_timesteps      | 561152       |
| train/                  |              |
|    approx_kl            | 0.0056377756 |
|    clip_fraction        | 0.0311       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.46        |
|    explained_variance   | -0.013       |
|    learning_rate        | 0.0003       |
|    loss                 | 5.11e+03     |
|    n_updates            | 2730         |
|    policy_gradient_loss | -0.00175     |
|    std                  | 0.826        |
|    value_loss           | 1.65e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.23e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 275          |
|    time_elapsed         | 3852         |
|    total_timesteps      | 563200       |
| train/                  |              |
|    approx_kl            | 0.0036554735 |
|    clip_fraction        | 0.0174       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.45        |
|    explained_variance   | 1.42e-05     |
|    learning_rate        | 0.0003       |
|    loss                 | 5.65e+03     |
|    n_updates            | 2740         |
|    policy_gradient_loss | 1.51e-05     |
|    std                  | 0.824        |
|    value_loss           | 2.55e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.22e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 276         |
|    time_elapsed         | 3866        |
|    total_timesteps      | 565248      |
| train/                  |             |
|    approx_kl            | 0.004131675 |
|    clip_fraction        | 0.0364      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.45       |
|    explained_variance   | -7.01e-05   |
|    learning_rate        | 0.0003      |
|    loss                 | 5.43e+03    |
|    n_updates            | 2750        |
|    policy_gradient_loss | -0.00184    |
|    std                  | 0.823       |
|    value_loss           | 2.59e+04    |
-----------------------------------------


INFO:root:done


-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.2e+03       |
|    ep_rew_mean          | 2.22e+04      |
| time/                   |               |
|    fps                  | 146           |
|    iterations           | 277           |
|    time_elapsed         | 3880          |
|    total_timesteps      | 567296        |
| train/                  |               |
|    approx_kl            | 0.00059960736 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -2.45         |
|    explained_variance   | -0.00831      |
|    learning_rate        | 0.0003        |
|    loss                 | 1.94e+04      |
|    n_updates            | 2760          |
|    policy_gradient_loss | 0.000218      |
|    std                  | 0.824         |
|    value_loss           | 2.32e+04      |
-------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.22e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 278          |
|    time_elapsed         | 3894         |
|    total_timesteps      | 569344       |
| train/                  |              |
|    approx_kl            | 0.0057934704 |
|    clip_fraction        | 0.0404       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.45        |
|    explained_variance   | -0.0353      |
|    learning_rate        | 0.0003       |
|    loss                 | 1.35e+03     |
|    n_updates            | 2770         |
|    policy_gradient_loss | -0.00238     |
|    std                  | 0.824        |
|    value_loss           | 1.19e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.2e+03    |
|    ep_rew_mean          | 2.23e+04   |
| time/                   |            |
|    fps                  | 146        |
|    iterations           | 279        |
|    time_elapsed         | 3907       |
|    total_timesteps      | 571392     |
| train/                  |            |
|    approx_kl            | 0.00539076 |
|    clip_fraction        | 0.00923    |
|    clip_range           | 0.2        |
|    entropy_loss         | -2.45      |
|    explained_variance   | 0.0833     |
|    learning_rate        | 0.0003     |
|    loss                 | 1.64e+04   |
|    n_updates            | 2780       |
|    policy_gradient_loss | -0.00117   |
|    std                  | 0.824      |
|    value_loss           | 2.48e+04   |
----------------------------------------


INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.23e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 280         |
|    time_elapsed         | 3921        |
|    total_timesteps      | 573440      |
| train/                  |             |
|    approx_kl            | 0.002605407 |
|    clip_fraction        | 0.00332     |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.45       |
|    explained_variance   | -0.0198     |
|    learning_rate        | 0.0003      |
|    loss                 | 3.57e+03    |
|    n_updates            | 2790        |
|    policy_gradient_loss | 0.000197    |
|    std                  | 0.823       |
|    value_loss           | 2.22e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.23e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 281          |
|    time_elapsed         | 3935         |
|    total_timesteps      | 575488       |
| train/                  |              |
|    approx_kl            | 0.0006279402 |
|    clip_fraction        | 0.00107      |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.45        |
|    explained_variance   | -0.0259      |
|    learning_rate        | 0.0003       |
|    loss                 | 3.65e+03     |
|    n_updates            | 2800         |
|    policy_gradient_loss | -0.000513    |
|    std                  | 0.823        |
|    value_loss           | 1.46e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.23e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 282         |
|    time_elapsed         | 3949        |
|    total_timesteps      | 577536      |
| train/                  |             |
|    approx_kl            | 0.007987397 |
|    clip_fraction        | 0.0717      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.44       |
|    explained_variance   | -0.0385     |
|    learning_rate        | 0.0003      |
|    loss                 | 1.87e+04    |
|    n_updates            | 2810        |
|    policy_gradient_loss | -0.0041     |
|    std                  | 0.819       |
|    value_loss           | 3.21e+04    |
-----------------------------------------


INFO:root:done


----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.2e+03    |
|    ep_rew_mean          | 2.23e+04   |
| time/                   |            |
|    fps                  | 146        |
|    iterations           | 283        |
|    time_elapsed         | 3963       |
|    total_timesteps      | 579584     |
| train/                  |            |
|    approx_kl            | 0.00377094 |
|    clip_fraction        | 0.00957    |
|    clip_range           | 0.2        |
|    entropy_loss         | -2.43      |
|    explained_variance   | 0.0229     |
|    learning_rate        | 0.0003     |
|    loss                 | 1.95e+04   |
|    n_updates            | 2820       |
|    policy_gradient_loss | -0.00148   |
|    std                  | 0.816      |
|    value_loss           | 4.5e+04    |
----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.24e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 284          |
|    time_elapsed         | 3976         |
|    total_timesteps      | 581632       |
| train/                  |              |
|    approx_kl            | 0.0011386602 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.43        |
|    explained_variance   | 0.0991       |
|    learning_rate        | 0.0003       |
|    loss                 | 2.85e+03     |
|    n_updates            | 2830         |
|    policy_gradient_loss | 5.24e-05     |
|    std                  | 0.818        |
|    value_loss           | 1.3e+04      |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.24e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 285          |
|    time_elapsed         | 3990         |
|    total_timesteps      | 583680       |
| train/                  |              |
|    approx_kl            | 0.0019187813 |
|    clip_fraction        | 0.0155       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.44        |
|    explained_variance   | -0.0882      |
|    learning_rate        | 0.0003       |
|    loss                 | 8.84e+03     |
|    n_updates            | 2840         |
|    policy_gradient_loss | -0.000212    |
|    std                  | 0.824        |
|    value_loss           | 5.12e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.2e+03    |
|    ep_rew_mean          | 2.24e+04   |
| time/                   |            |
|    fps                  | 146        |
|    iterations           | 286        |
|    time_elapsed         | 4004       |
|    total_timesteps      | 585728     |
| train/                  |            |
|    approx_kl            | 0.01504888 |
|    clip_fraction        | 0.0872     |
|    clip_range           | 0.2        |
|    entropy_loss         | -2.46      |
|    explained_variance   | 4.35e-05   |
|    learning_rate        | 0.0003     |
|    loss                 | 1.23e+04   |
|    n_updates            | 2850       |
|    policy_gradient_loss | -0.00333   |
|    std                  | 0.832      |
|    value_loss           | 4.46e+04   |
----------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.24e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 287          |
|    time_elapsed         | 4018         |
|    total_timesteps      | 587776       |
| train/                  |              |
|    approx_kl            | 0.0076972907 |
|    clip_fraction        | 0.135        |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.46        |
|    explained_variance   | 2.38e-05     |
|    learning_rate        | 0.0003       |
|    loss                 | 2.52e+04     |
|    n_updates            | 2860         |
|    policy_gradient_loss | -0.00125     |
|    std                  | 0.823        |
|    value_loss           | 3.46e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.22e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 288         |
|    time_elapsed         | 4032        |
|    total_timesteps      | 589824      |
| train/                  |             |
|    approx_kl            | 0.004189547 |
|    clip_fraction        | 0.0371      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.44       |
|    explained_variance   | 1.03e-05    |
|    learning_rate        | 0.0003      |
|    loss                 | 909         |
|    n_updates            | 2870        |
|    policy_gradient_loss | 0.000601    |
|    std                  | 0.817       |
|    value_loss           | 1.12e+04    |
-----------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.21e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 289          |
|    time_elapsed         | 4046         |
|    total_timesteps      | 591872       |
| train/                  |              |
|    approx_kl            | 0.0027379526 |
|    clip_fraction        | 0.000928     |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.44        |
|    explained_variance   | 0.000245     |
|    learning_rate        | 0.0003       |
|    loss                 | 1.69e+04     |
|    n_updates            | 2880         |
|    policy_gradient_loss | -0.000259    |
|    std                  | 0.818        |
|    value_loss           | 1.93e+04     |
------------------------------------------


INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.2e+04      |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 290          |
|    time_elapsed         | 4060         |
|    total_timesteps      | 593920       |
| train/                  |              |
|    approx_kl            | 0.0006894174 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.44        |
|    explained_variance   | -0.0175      |
|    learning_rate        | 0.0003       |
|    loss                 | 5.21e+03     |
|    n_updates            | 2890         |
|    policy_gradient_loss | -7.45e-05    |
|    std                  | 0.819        |
|    value_loss           | 2.67e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.17e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 291          |
|    time_elapsed         | 4074         |
|    total_timesteps      | 595968       |
| train/                  |              |
|    approx_kl            | 0.0019507715 |
|    clip_fraction        | 0.000439     |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.43        |
|    explained_variance   | 0.0564       |
|    learning_rate        | 0.0003       |
|    loss                 | 7.47e+03     |
|    n_updates            | 2900         |
|    policy_gradient_loss | -9.65e-05    |
|    std                  | 0.816        |
|    value_loss           | 2.17e+04     |
------------------------------------------


INFO:root:done
INFO:root:done


------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.16e+04     |
| time/                   |              |
|    fps                  | 146          |
|    iterations           | 292          |
|    time_elapsed         | 4088         |
|    total_timesteps      | 598016       |
| train/                  |              |
|    approx_kl            | 0.0066675055 |
|    clip_fraction        | 0.0463       |
|    clip_range           | 0.2          |
|    entropy_loss         | -2.43        |
|    explained_variance   | 0.0459       |
|    learning_rate        | 0.0003       |
|    loss                 | 1.51e+04     |
|    n_updates            | 2910         |
|    policy_gradient_loss | -0.000112    |
|    std                  | 0.813        |
|    value_loss           | 1.8e+04      |
------------------------------------------


INFO:root:done
INFO:root:done


-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.14e+04    |
| time/                   |             |
|    fps                  | 146         |
|    iterations           | 293         |
|    time_elapsed         | 4101        |
|    total_timesteps      | 600064      |
| train/                  |             |
|    approx_kl            | 0.004999628 |
|    clip_fraction        | 0.0658      |
|    clip_range           | 0.2         |
|    entropy_loss         | -2.42       |
|    explained_variance   | 0.0206      |
|    learning_rate        | 0.0003      |
|    loss                 | 2.29e+03    |
|    n_updates            | 2920        |
|    policy_gradient_loss | -0.00384    |
|    std                  | 0.809       |
|    value_loss           | 2.1e+04     |
-----------------------------------------


### Optuna


In [8]:
# Close the environment left over from the training run above before the Optuna section starts.
env.close()


In [None]:
# Import the optimization framework (Optuna) used for hyperparameter optimization (HPO)
import optuna
# PPO algo for RL
from stable_baselines3 import PPO
# Bring in the eval policy method for metric calculation
from stable_baselines3.common.evaluation import evaluate_policy

# Import the vec wrappers to vectorize and frame stack
from stable_baselines3.common.vec_env import DummyVecEnv, VecFrameStack
# Import os to deal with filepaths
import os


# Function to return test hyperparameters - define the objective function

# One timestamp per run, shared by both output folders so logs and saved trials line up.
now = datetime.now().strftime('%Y-%m-%d_%H%M')

LOG_DIR = f'./train/logs/{now}/'
OPT_DIR = f'./train/opt/{now}/'

def optimize_ppo(trial):
    """Sample one set of PPO hyperparameters from an Optuna trial.

    Uses ``suggest_float`` (with ``log=True`` where a log-scaled search is
    wanted) instead of the deprecated ``suggest_uniform`` /
    ``suggest_loguniform``, and passes ``step`` by keyword to ``suggest_int``.

    Args:
        trial: Optuna trial, or any object exposing compatible
            ``suggest_int`` and ``suggest_float`` methods.

    Returns:
        dict: keyword arguments for the ``PPO`` constructor with the keys
        ``n_steps``, ``gamma``, ``learning_rate``, ``clip_range`` and
        ``gae_lambda``.
    """
    return {
        # 256..8192 in increments of 64
        'n_steps': trial.suggest_int('n_steps', 256, 8192, step=64),
        # gamma and learning_rate are searched on a log scale
        'gamma': trial.suggest_float('gamma', 0.8, 0.9999, log=True),
        'learning_rate': trial.suggest_float('learning_rate', 1e-5, 1e-2, log=True),
        # clip_range and gae_lambda are searched on a linear scale
        'clip_range': trial.suggest_float('clip_range', 0.1, 0.4),
        'gae_lambda': trial.suggest_float('gae_lambda', 0.8, 0.99),
    }
    
# Module-level default save location (trial 1); optimize_agent derives its own per-trial path.
SAVE_PATH = os.path.join(
    OPT_DIR,
    'trial_{}_best_model'.format(1),
)

# Run a training loop and return mean reward 
def optimize_agent(trial):
    """Optuna objective: train PPO with sampled hyperparameters and score it.

    Every trial gets its own environment, which is closed when the trial
    ends (also on failure). The notebook-global ``env`` is deliberately not
    touched: closing a shared environment inside the objective would leave
    every later trial with an already closed environment.

    Args:
        trial: Optuna trial used to sample the hyperparameters and to number
            the saved model file.

    Returns:
        The mean episode reward over 30 evaluation episodes, as returned by
        ``evaluate_policy``.
    """
    # Get hyperparameters
    model_params = optimize_ppo(trial)

    # Create a dedicated environment for this trial (same setup as the other cells)
    trial_env = CarlaWalkerEnv(verbose=False, host=read_IP_from_file(file_name='../ip-host.txt'))
    trial_env.max_tick_count = 20*60
    trial_env = Monitor(trial_env)

    try:
        # Create algo
        model = PPO(
            'MlpPolicy',
            trial_env,
            tensorboard_log=LOG_DIR,
            verbose=0,
            **model_params)
        model.learn(total_timesteps=100_000)

        # Evaluate model
        mean_reward, _ = evaluate_policy(model, trial_env, n_eval_episodes=30)
    finally:
        # Always close the per-trial environment, even if training or evaluation raised
        trial_env.close()

    # Local name on purpose: do not shadow the module-level SAVE_PATH
    save_path = os.path.join(OPT_DIR, 'trial_{}_best_model'.format(trial.number))
    model.save(save_path)

    return mean_reward

    
# Create the study and search for the hyperparameters that maximize the mean reward.
study = optuna.create_study(direction='maximize')
study.optimize(
    optimize_agent,
    n_trials=1_000,
    timeout=60*60*12,  # seconds (12 h): stop the search after this long even if n_trials was not reached
    show_progress_bar=True,
)

# A bare expression in the middle of a cell is never displayed, so print the results explicitly.
print('Best params:', study.best_params)
print('Best trial:', study.best_trial)

print('Finished', datetime.now().strftime('%Y-%m-%d_%H%M'))

In [None]:
# Display the hyperparameters of the best trial found by the study.
study.best_params


In [None]:
# Display the index of the best trial; the model-loading cell below uses it to pick the saved file.
study.best_trial.number

In [None]:
import plotly

In [None]:

# Plot the study as a parallel-coordinate chart.
# The availability guard is commented out, so this cell raises if plotly cannot be imported.
# if optuna.visualization.is_available():
from plotly.offline import init_notebook_mode, iplot
init_notebook_mode(connected=True)
fig = optuna.visualization.plot_parallel_coordinate(study)
fig.show()

In [None]:
# Plot the hyperparameter importances, but only when Optuna reports its visualization module as available.
if optuna.visualization.is_available():
    fig = optuna.visualization.plot_param_importances(study)
    fig.show()

In [None]:
import joblib

# Persist the complete study object inside this run's optimization folder.
joblib.dump(study, os.path.join(OPT_DIR, 'study.pkl'))

In [None]:
# Reload the model saved by the best Optuna trial.
load_path = os.path.join(OPT_DIR, 'trial_{}_best_model.zip'.format(study.best_trial.number))

# The shared `env` was closed by the env.close() cell at the start of the Optuna
# section, so build a fresh environment (same setup as the other cells) before
# attaching it to the loaded model.
env = CarlaWalkerEnv(verbose=False, host=read_IP_from_file(file_name='../ip-host.txt'))
env.max_tick_count = 20*60
env = Monitor(env)

model = PPO.load(
    path=load_path,
    env=env,
)

# Sanity check: show the spaces the loaded model was built for.
print(model.action_space)
print(model.observation_space)


In [None]:
# Display the loaded model object.
model

In [None]:
# Continue training the reloaded model; the callback saves a checkpoint into LOG_DIR
# every 10_000 callback calls.
model.learn(
    callback=TrainAndLoggingCallback(save_path=LOG_DIR, check_freq=10_000),
    total_timesteps=500_000,
)

In [None]:
# Disabled training cell: the code below is wrapped in a string literal, so none of it executes.
# It targets the 'SW2DDynGoal' environment name rather than the CARLA walker setup used in the other cells.
"""
env_name = 'SW2DDynGoal'

CHECKPOINT_DIR = './train/train_' + env_name
LOG_DIR = './train/log_' + env_name

callback = TrainAndLoggingCallback(check_freq=10_000, save_path=CHECKPOINT_DIR)

log_path = os.path.join('Training', 'Logs')

model = PPO(
    "MlpPolicy", 
    env, 
    verbose=0, 
    tensorboard_log=log_path,
    #learning_rate=0.0001,
    #n_steps =2048
    )
logger.setLevel(logging.INFO)

model.learn(
    total_timesteps=300_000, 
    callback = callback
    )

model.save('PPO')

logger.setLevel(logging.DEBUG)
"""

## Test Model

In [None]:
# from stable_baselines3 import PPO
# from SimpleWalk2D import SimpleWalk2DDynGoal

#env = SimpleWalk2DDynGoal()


In [19]:

# Test prediction: roll out the current model for a few episodes with debug logging enabled.
logger.setLevel(logging.DEBUG)

env = CarlaWalkerEnv(verbose=False, host=read_IP_from_file(file_name='../ip-host.txt'))
env.max_tick_count = 20*60
env = Monitor(env)

episodes = 10
try:
    for episode in range(episodes):
        # Drive the policy with the observations returned by reset()/step()
        # rather than reading an internal attribute off the environment.
        obs = env.reset()
        done = False

        while not done:
            action, _states = model.predict(obs)
            obs, rewards, done, info = env.step(action)

        print('done')
        print("info", info)
        env.render()
finally:
    # Close the environment even if an episode raises.
    env.close()

DEBUG:root:waiting for server
DEBUG:root:server connected
INFO:root:We want to use Town01, but the map is named Carla/Maps/Town10HD_Opt


IP: 137.250.121.29


INFO:root:Map Carla/Maps/Town01 loaded
DEBUG:root:spawning walker at Location(x=88.619980, y=285.393005, z=0.300000)
DEBUG:root:created walker.pedestrian.0012
DEBUG:root:created sensor.camera.semantic_segmentation
DEBUG:root:render per default during init
DEBUG:root:rendering
DEBUG:root:tick in reset


AttributeError: 'CarlaWalkerEnv' object has no attribute 'state'

DEBUG:root:=== creating observation ===
DEBUG:root:=== observation created ===
DEBUG:root:=== creating observation ===
DEBUG:root:=== observation created ===


In [7]:
from stable_baselines3.common.evaluation import evaluate_policy

# Evaluate the current model for 10 episodes without rendering. The cell output is the
# returned tuple; the first element is the mean reward, the second is presumably the
# reward standard deviation (confirm against the SB3 docs).
evaluate_policy(model, env, n_eval_episodes=10, render=False)

# TODO render doesn't work

INFO:root:done
INFO:root:done
INFO:root:done
INFO:root:done
INFO:root:done
INFO:root:done
INFO:root:done
INFO:root:done
INFO:root:done
INFO:root:done


(6768.83109, 910.1836190940685)