### Import Required Libraries

In [1]:
!pip install gym_super_mario_bros==7.3.0 nes_py
# Install pytorch
!pip install torch==1.10.1+cu113 torchvision==0.11.2+cu113 torchaudio===0.10.1+cu113 -f https://download.pytorch.org/whl/cu113/torch_stable.html
# Installation of stable baselines for Reinforced Learning
!pip install stable-baselines3[extra]

Collecting gym_super_mario_bros==7.3.0
  Downloading gym_super_mario_bros-7.3.0-py2.py3-none-any.whl (198 kB)
Collecting nes_py
  Downloading nes_py-8.1.8.tar.gz (76 kB)
Collecting gym>=0.17.2
  Downloading gym-0.23.1.tar.gz (626 kB)
  Installing build dependencies: started
  Installing build dependencies: finished with status 'done'
  Getting requirements to build wheel: started
  Getting requirements to build wheel: finished with status 'done'
    Preparing wheel metadata: started
    Preparing wheel metadata: finished with status 'done'
Collecting pyglet<=1.5.11,>=1.4.0
  Downloading pyglet-1.5.11-py3-none-any.whl (1.1 MB)
Collecting gym-notices>=0.0.4
  Downloading gym_notices-0.0.6-py3-none-any.whl (2.7 kB)
Collecting importlib-metadata>=4.10.0
  Downloading importlib_metadata-4.11.4-py3-none-any.whl (18 kB)
Building wheels for collected packages: nes-py, gym
  Building wheel for nes-py (setup.py): started
  Building wheel for nes-py (setup.py): finished with status 'done'
  Creat

In [2]:
# importing the game from gym
import gym_super_mario_bros
# next was to import Joypad wrapper
from nes_py.wrappers import JoypadSpace
# Followed by SIMPLIFIED controls
from gym_super_mario_bros.actions import SIMPLE_MOVEMENT
# Importing os for management of file path
import os 
# Import PPO, DQN, Gail as RL learning agents
from stable_baselines3 import PPO
from stable_baselines3 import DQN
from stable_baselines3 import A2C
# Import Base Callback to save models
from stable_baselines3.common.callbacks import BaseCallback

### Setup Mario

In [3]:
# Setting up the game
env = gym_super_mario_bros.make('SuperMarioBros-v0')
env = JoypadSpace(env, SIMPLE_MOVEMENT)

### Train the RL Model

In [4]:
class TrainAndLoggingCallback(BaseCallback):

    def __init__(self, freq_check, store_path, verbose=1):
        super(TrainAndLoggingCallback, self).__init__(verbose)
        self.freq_check = freq_check
        self.store_path = store_path

    def _init_callback(self):
        if self.store_path is not None:
            os.makedirs(self.store_path, exist_ok=True)

    def _on_step(self):
        if self.n_calls % self.freq_check == 0:
            model_path = os.path.join(self.store_path, 'best_model_{}'.format(self.n_calls))
            self.model.save(model_path)

        return True

In [5]:
CHECKPOINT_DIR = './train/'
LOG_DIR = './logs/'

In [6]:
# Setup model saving callback
callback = TrainAndLoggingCallback(freq_check=10000, store_path=CHECKPOINT_DIR)

In [7]:
# This is the AI model started
model = PPO('MlpPolicy', env, verbose=1, tensorboard_log=LOG_DIR, learning_rate=0.000001, seed = 20,
             n_steps = 256)

Using cuda device
Wrapping the env with a `Monitor` wrapper
Wrapping the env in a DummyVecEnv.
Wrapping the env in a VecTransposeImage.


In [8]:
# Train the AI model, this is where the AI model starts to learn
model.learn(total_timesteps=2000000, callback=callback)

Logging to ./logs/PPO_2


  return (self.ram[0x86] - self.ram[0x071c]) % 256


----------------------------
| time/              |     |
|    fps             | 106 |
|    iterations      | 1   |
|    time_elapsed    | 2   |
|    total_timesteps | 256 |
----------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 118           |
|    iterations           | 2             |
|    time_elapsed         | 4             |
|    total_timesteps      | 512           |
| train/                  |               |
|    approx_kl            | 1.3248064e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.95         |
|    explained_variance   | 0.00752       |
|    learning_rate        | 1e-06         |
|    loss                 | 189           |
|    n_updates            | 10            |
|    policy_gradient_loss | -2.9e-05      |
|    value_loss           | 446           |
-------------------------------------------
-----

-----------------------------------------
| time/                   |             |
|    fps                  | 132         |
|    iterations           | 13          |
|    time_elapsed         | 25          |
|    total_timesteps      | 3328        |
| train/                  |             |
|    approx_kl            | 9.64175e-06 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -1.95       |
|    explained_variance   | -0.000123   |
|    learning_rate        | 1e-06       |
|    loss                 | 0.2         |
|    n_updates            | 120         |
|    policy_gradient_loss | -0.000408   |
|    value_loss           | 0.44        |
-----------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 132           |
|    iterations           | 14            |
|    time_elapsed         | 26            |
|    total_timesteps    

-------------------------------------------
| time/                   |               |
|    fps                  | 134           |
|    iterations           | 24            |
|    time_elapsed         | 45            |
|    total_timesteps      | 6144          |
| train/                  |               |
|    approx_kl            | 1.5781261e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.95         |
|    explained_variance   | 0.000799      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.128         |
|    n_updates            | 230           |
|    policy_gradient_loss | -0.000103     |
|    value_loss           | 0.185         |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 134          |
|    iterations           | 25           |
|    time_elapsed         | 47      

-------------------------------------------
| time/                   |               |
|    fps                  | 134           |
|    iterations           | 35            |
|    time_elapsed         | 66            |
|    total_timesteps      | 8960          |
| train/                  |               |
|    approx_kl            | 1.9115396e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.95         |
|    explained_variance   | 1.48e-05      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.178         |
|    n_updates            | 340           |
|    policy_gradient_loss | -2.26e-05     |
|    value_loss           | 0.364         |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 134           |
|    iterations           | 36            |
|    time_elapsed         | 68  

------------------------------------------
| time/                   |              |
|    fps                  | 133          |
|    iterations           | 46           |
|    time_elapsed         | 88           |
|    total_timesteps      | 11776        |
| train/                  |              |
|    approx_kl            | 5.818438e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.95        |
|    explained_variance   | 6.34e-05     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.12         |
|    n_updates            | 450          |
|    policy_gradient_loss | -3.98e-05    |
|    value_loss           | 0.269        |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 133           |
|    iterations           | 47            |
|    time_elapsed         | 90            |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 133           |
|    iterations           | 57            |
|    time_elapsed         | 109           |
|    total_timesteps      | 14592         |
| train/                  |               |
|    approx_kl            | 5.2070245e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.95         |
|    explained_variance   | -5.96e-07     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0507        |
|    n_updates            | 560           |
|    policy_gradient_loss | -0.000262     |
|    value_loss           | 0.139         |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 133           |
|    iterations           | 58            |
|    time_elapsed         | 111 

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.62e+04     |
|    ep_rew_mean          | 511          |
| time/                   |              |
|    fps                  | 133          |
|    iterations           | 67           |
|    time_elapsed         | 128          |
|    total_timesteps      | 17152        |
| train/                  |              |
|    approx_kl            | 8.200295e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.95        |
|    explained_variance   | -0.000165    |
|    learning_rate        | 1e-06        |
|    loss                 | 0.152        |
|    n_updates            | 660          |
|    policy_gradient_loss | -8.94e-05    |
|    value_loss           | 0.272        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.62e+04     |
|    ep_rew_mean          | 511          |
| time/                   |              |
|    fps                  | 134          |
|    iterations           | 76           |
|    time_elapsed         | 145          |
|    total_timesteps      | 19456        |
| train/                  |              |
|    approx_kl            | 9.806827e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.95        |
|    explained_variance   | 6.99e-05     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0853       |
|    n_updates            | 750          |
|    policy_gradient_loss | -5.83e-05    |
|    value_loss           | 0.166        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.62e+04      |
|    ep_rew_mean          | 511           |
| time/                   |               |
|    fps                  | 133           |
|    iterations           | 85            |
|    time_elapsed         | 162           |
|    total_timesteps      | 21760         |
| train/                  |               |
|    approx_kl            | 1.4924444e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.94         |
|    explained_variance   | -0.000464     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.107         |
|    n_updates            | 840           |
|    policy_gradient_loss | -0.000113     |
|    value_loss           | 0.197         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.62e+04      |
|    ep_rew_mean          | 511           |
| time/                   |               |
|    fps                  | 133           |
|    iterations           | 94            |
|    time_elapsed         | 179           |
|    total_timesteps      | 24064         |
| train/                  |               |
|    approx_kl            | 1.1001248e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.94         |
|    explained_variance   | -0.0111       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0559        |
|    n_updates            | 930           |
|    policy_gradient_loss | -3.86e-05     |
|    value_loss           | 0.114         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.62e+04      |
|    ep_rew_mean          | 511           |
| time/                   |               |
|    fps                  | 134           |
|    iterations           | 103           |
|    time_elapsed         | 196           |
|    total_timesteps      | 26368         |
| train/                  |               |
|    approx_kl            | 1.0787044e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.94         |
|    explained_variance   | 0.00168       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0848        |
|    n_updates            | 1020          |
|    policy_gradient_loss | -8.29e-05     |
|    value_loss           | 0.248         |
-------------------------------------------
-----------------------------------------
| rollout/                |       

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.62e+04     |
|    ep_rew_mean          | 511          |
| time/                   |              |
|    fps                  | 134          |
|    iterations           | 113          |
|    time_elapsed         | 215          |
|    total_timesteps      | 28928        |
| train/                  |              |
|    approx_kl            | 9.781215e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.94        |
|    explained_variance   | 5.9e-06      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.123        |
|    n_updates            | 1120         |
|    policy_gradient_loss | -3.42e-05    |
|    value_loss           | 0.278        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.62e+04      |
|    ep_rew_mean          | 511           |
| time/                   |               |
|    fps                  | 133           |
|    iterations           | 122           |
|    time_elapsed         | 233           |
|    total_timesteps      | 31232         |
| train/                  |               |
|    approx_kl            | 1.0260846e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.94         |
|    explained_variance   | -0.00342      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.113         |
|    n_updates            | 1210          |
|    policy_gradient_loss | -5.35e-05     |
|    value_loss           | 0.281         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.62e+04      |
|    ep_rew_mean          | 511           |
| time/                   |               |
|    fps                  | 133           |
|    iterations           | 131           |
|    time_elapsed         | 250           |
|    total_timesteps      | 33536         |
| train/                  |               |
|    approx_kl            | 1.0721618e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.94         |
|    explained_variance   | -6.96e-05     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.123         |
|    n_updates            | 1300          |
|    policy_gradient_loss | -0.000575     |
|    value_loss           | 0.218         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.62e+04      |
|    ep_rew_mean          | 511           |
| time/                   |               |
|    fps                  | 134           |
|    iterations           | 140           |
|    time_elapsed         | 267           |
|    total_timesteps      | 35840         |
| train/                  |               |
|    approx_kl            | 2.4655601e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.94         |
|    explained_variance   | -0.00324      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.101         |
|    n_updates            | 1390          |
|    policy_gradient_loss | -0.000428     |
|    value_loss           | 0.193         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.62e+04      |
|    ep_rew_mean          | 511           |
| time/                   |               |
|    fps                  | 134           |
|    iterations           | 149           |
|    time_elapsed         | 284           |
|    total_timesteps      | 38144         |
| train/                  |               |
|    approx_kl            | 4.5814086e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.94         |
|    explained_variance   | -0.00398      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0904        |
|    n_updates            | 1480          |
|    policy_gradient_loss | -0.000251     |
|    value_loss           | 0.171         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 2.01e+04     |
|    ep_rew_mean          | 512          |
| time/                   |              |
|    fps                  | 133          |
|    iterations           | 158          |
|    time_elapsed         | 302          |
|    total_timesteps      | 40448        |
| train/                  |              |
|    approx_kl            | 8.074567e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.94        |
|    explained_variance   | -0.00013     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.106        |
|    n_updates            | 1570         |
|    policy_gradient_loss | -3.54e-05    |
|    value_loss           | 0.189        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 2.01e+04      |
|    ep_rew_mean          | 512           |
| time/                   |               |
|    fps                  | 133           |
|    iterations           | 167           |
|    time_elapsed         | 319           |
|    total_timesteps      | 42752         |
| train/                  |               |
|    approx_kl            | 4.3120235e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.94         |
|    explained_variance   | -0.00919      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0585        |
|    n_updates            | 1660          |
|    policy_gradient_loss | -4e-05        |
|    value_loss           | 0.149         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 2.01e+04      |
|    ep_rew_mean          | 512           |
| time/                   |               |
|    fps                  | 133           |
|    iterations           | 176           |
|    time_elapsed         | 336           |
|    total_timesteps      | 45056         |
| train/                  |               |
|    approx_kl            | 6.4540654e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.94         |
|    explained_variance   | 0.00341       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0702        |
|    n_updates            | 1750          |
|    policy_gradient_loss | -6.56e-05     |
|    value_loss           | 0.152         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 2.01e+04   |
|    ep_rew_mean          | 512        |
| time/                   |            |
|    fps                  | 133        |
|    iterations           | 185        |
|    time_elapsed         | 353        |
|    total_timesteps      | 47360      |
| train/                  |            |
|    approx_kl            | 1.5995e-05 |
|    clip_fraction        | 0          |
|    clip_range           | 0.2        |
|    entropy_loss         | -1.94      |
|    explained_variance   | 0.00132    |
|    learning_rate        | 1e-06      |
|    loss                 | 0.13       |
|    n_updates            | 1840       |
|    policy_gradient_loss | -0.000624  |
|    value_loss           | 0.226      |
----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 2.01e+04    |
|    ep_rew_m

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 2.01e+04      |
|    ep_rew_mean          | 512           |
| time/                   |               |
|    fps                  | 133           |
|    iterations           | 195           |
|    time_elapsed         | 373           |
|    total_timesteps      | 49920         |
| train/                  |               |
|    approx_kl            | 1.1612428e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.94         |
|    explained_variance   | 0.0018        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.115         |
|    n_updates            | 1940          |
|    policy_gradient_loss | -0.000301     |
|    value_loss           | 0.257         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 2.01e+04    |
|    ep_rew_mean          | 512         |
| time/                   |             |
|    fps                  | 133         |
|    iterations           | 204         |
|    time_elapsed         | 390         |
|    total_timesteps      | 52224       |
| train/                  |             |
|    approx_kl            | 2.20933e-06 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -1.94       |
|    explained_variance   | 0.000247    |
|    learning_rate        | 1e-06       |
|    loss                 | 0.0974      |
|    n_updates            | 2030        |
|    policy_gradient_loss | -5.2e-05    |
|    value_loss           | 0.191       |
-----------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 2.

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 2.01e+04     |
|    ep_rew_mean          | 512          |
| time/                   |              |
|    fps                  | 133          |
|    iterations           | 214          |
|    time_elapsed         | 408          |
|    total_timesteps      | 54784        |
| train/                  |              |
|    approx_kl            | 4.554633e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.94        |
|    explained_variance   | 0.00432      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0671       |
|    n_updates            | 2130         |
|    policy_gradient_loss | -0.000226    |
|    value_loss           | 0.156        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 2.01e+04      |
|    ep_rew_mean          | 512           |
| time/                   |               |
|    fps                  | 134           |
|    iterations           | 224           |
|    time_elapsed         | 426           |
|    total_timesteps      | 57344         |
| train/                  |               |
|    approx_kl            | 1.7969869e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.94         |
|    explained_variance   | 0.000433      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0582        |
|    n_updates            | 2230          |
|    policy_gradient_loss | -0.000121     |
|    value_loss           | 0.163         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 2.01e+04      |
|    ep_rew_mean          | 512           |
| time/                   |               |
|    fps                  | 134           |
|    iterations           | 233           |
|    time_elapsed         | 442           |
|    total_timesteps      | 59648         |
| train/                  |               |
|    approx_kl            | 2.4042092e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.94         |
|    explained_variance   | -0.0197       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.084         |
|    n_updates            | 2320          |
|    policy_gradient_loss | -8.15e-05     |
|    value_loss           | 0.148         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 2.01e+04     |
|    ep_rew_mean          | 512          |
| time/                   |              |
|    fps                  | 135          |
|    iterations           | 242          |
|    time_elapsed         | 457          |
|    total_timesteps      | 61952        |
| train/                  |              |
|    approx_kl            | 3.006775e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.94        |
|    explained_variance   | 0.0053       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0918       |
|    n_updates            | 2410         |
|    policy_gradient_loss | -0.000128    |
|    value_loss           | 0.166        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 2.01e+04     |
|    ep_rew_mean          | 512          |
| time/                   |              |
|    fps                  | 135          |
|    iterations           | 251          |
|    time_elapsed         | 473          |
|    total_timesteps      | 64256        |
| train/                  |              |
|    approx_kl            | 5.501788e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.94        |
|    explained_variance   | -0.0132      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.058        |
|    n_updates            | 2500         |
|    policy_gradient_loss | -4.71e-05    |
|    value_loss           | 0.108        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 2.14e+04      |
|    ep_rew_mean          | 471           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 260           |
|    time_elapsed         | 488           |
|    total_timesteps      | 66560         |
| train/                  |               |
|    approx_kl            | 1.4211982e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.94         |
|    explained_variance   | 0.00405       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0584        |
|    n_updates            | 2590          |
|    policy_gradient_loss | -0.00011      |
|    value_loss           | 0.107         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 2.14e+04      |
|    ep_rew_mean          | 471           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 269           |
|    time_elapsed         | 503           |
|    total_timesteps      | 68864         |
| train/                  |               |
|    approx_kl            | 1.2556557e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.94         |
|    explained_variance   | -0.0102       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0725        |
|    n_updates            | 2680          |
|    policy_gradient_loss | -9.71e-05     |
|    value_loss           | 0.167         |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 2.14e+04     |
|    ep_rew_mean          | 471          |
| time/                   |              |
|    fps                  | 136          |
|    iterations           | 278          |
|    time_elapsed         | 519          |
|    total_timesteps      | 71168        |
| train/                  |              |
|    approx_kl            | 5.597947e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.94        |
|    explained_variance   | -0.00186     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0524       |
|    n_updates            | 2770         |
|    policy_gradient_loss | -0.000177    |
|    value_loss           | 0.12         |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 2.14e+04      |
|    ep_rew_mean          | 471           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 288           |
|    time_elapsed         | 536           |
|    total_timesteps      | 73728         |
| train/                  |               |
|    approx_kl            | 1.8244609e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.94         |
|    explained_variance   | -3.34e-06     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.106         |
|    n_updates            | 2870          |
|    policy_gradient_loss | -0.000137     |
|    value_loss           | 0.314         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 2.14e+04      |
|    ep_rew_mean          | 471           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 297           |
|    time_elapsed         | 552           |
|    total_timesteps      | 76032         |
| train/                  |               |
|    approx_kl            | 7.6182187e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.94         |
|    explained_variance   | 0.000208      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.119         |
|    n_updates            | 2960          |
|    policy_gradient_loss | -0.000145     |
|    value_loss           | 0.238         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 2.14e+04      |
|    ep_rew_mean          | 471           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 306           |
|    time_elapsed         | 567           |
|    total_timesteps      | 78336         |
| train/                  |               |
|    approx_kl            | 1.1180528e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.94         |
|    explained_variance   | 0.0191        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.182         |
|    n_updates            | 3050          |
|    policy_gradient_loss | -4.23e-05     |
|    value_loss           | 0.284         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 2.14e+04     |
|    ep_rew_mean          | 471          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 315          |
|    time_elapsed         | 583          |
|    total_timesteps      | 80640        |
| train/                  |              |
|    approx_kl            | 4.355097e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.94        |
|    explained_variance   | 0.11         |
|    learning_rate        | 1e-06        |
|    loss                 | 2.05         |
|    n_updates            | 3140         |
|    policy_gradient_loss | -9.14e-05    |
|    value_loss           | 5.71         |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 2.07e+04      |
|    ep_rew_mean          | 542           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 324           |
|    time_elapsed         | 599           |
|    total_timesteps      | 82944         |
| train/                  |               |
|    approx_kl            | 8.4750354e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.94         |
|    explained_variance   | 0.00597       |
|    learning_rate        | 1e-06         |
|    loss                 | 232           |
|    n_updates            | 3230          |
|    policy_gradient_loss | -1.23e-05     |
|    value_loss           | 349           |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 2.07e+04      |
|    ep_rew_mean          | 542           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 333           |
|    time_elapsed         | 614           |
|    total_timesteps      | 85248         |
| train/                  |               |
|    approx_kl            | 1.3371464e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.94         |
|    explained_variance   | -0.018        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.122         |
|    n_updates            | 3320          |
|    policy_gradient_loss | -0.000141     |
|    value_loss           | 0.23          |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 2.07e+04     |
|    ep_rew_mean          | 542          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 342          |
|    time_elapsed         | 629          |
|    total_timesteps      | 87552        |
| train/                  |              |
|    approx_kl            | 6.179791e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.94        |
|    explained_variance   | 0.000644     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.285        |
|    n_updates            | 3410         |
|    policy_gradient_loss | -0.00019     |
|    value_loss           | 0.433        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 2.07e+04     |
|    ep_rew_mean          | 542          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 351          |
|    time_elapsed         | 644          |
|    total_timesteps      | 89856        |
| train/                  |              |
|    approx_kl            | 7.470604e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.94        |
|    explained_variance   | 0.000121     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.161        |
|    n_updates            | 3500         |
|    policy_gradient_loss | -0.000183    |
|    value_loss           | 0.313        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.82e+04     |
|    ep_rew_mean          | 570          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 360          |
|    time_elapsed         | 662          |
|    total_timesteps      | 92160        |
| train/                  |              |
|    approx_kl            | 1.094304e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.94        |
|    explained_variance   | 4.77e-06     |
|    learning_rate        | 1e-06        |
|    loss                 | 150          |
|    n_updates            | 3590         |
|    policy_gradient_loss | -1.76e-06    |
|    value_loss           | 262          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.82e+04      |
|    ep_rew_mean          | 570           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 370           |
|    time_elapsed         | 681           |
|    total_timesteps      | 94720         |
| train/                  |               |
|    approx_kl            | 1.3702083e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.94         |
|    explained_variance   | 0.000397      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0596        |
|    n_updates            | 3690          |
|    policy_gradient_loss | -5.09e-05     |
|    value_loss           | 0.169         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.82e+04      |
|    ep_rew_mean          | 570           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 379           |
|    time_elapsed         | 697           |
|    total_timesteps      | 97024         |
| train/                  |               |
|    approx_kl            | 1.1143275e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.94         |
|    explained_variance   | 0.00171       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0962        |
|    n_updates            | 3780          |
|    policy_gradient_loss | -8.33e-05     |
|    value_loss           | 0.183         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 596           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 388           |
|    time_elapsed         | 714           |
|    total_timesteps      | 99328         |
| train/                  |               |
|    approx_kl            | 2.4689361e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.94         |
|    explained_variance   | 0.00388       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0795        |
|    n_updates            | 3870          |
|    policy_gradient_loss | -0.000193     |
|    value_loss           | 0.151         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 596           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 397           |
|    time_elapsed         | 731           |
|    total_timesteps      | 101632        |
| train/                  |               |
|    approx_kl            | 3.9956067e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.94         |
|    explained_variance   | 0.00226       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.073         |
|    n_updates            | 3960          |
|    policy_gradient_loss | -0.000206     |
|    value_loss           | 0.184         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 596           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 406           |
|    time_elapsed         | 748           |
|    total_timesteps      | 103936        |
| train/                  |               |
|    approx_kl            | 1.7608982e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.94         |
|    explained_variance   | -0.00167      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0704        |
|    n_updates            | 4050          |
|    policy_gradient_loss | -0.00013      |
|    value_loss           | 0.129         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 596           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 415           |
|    time_elapsed         | 764           |
|    total_timesteps      | 106240        |
| train/                  |               |
|    approx_kl            | 4.4410117e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.94         |
|    explained_variance   | 0.00122       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0929        |
|    n_updates            | 4140          |
|    policy_gradient_loss | -0.000262     |
|    value_loss           | 0.149         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 596           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 424           |
|    time_elapsed         | 780           |
|    total_timesteps      | 108544        |
| train/                  |               |
|    approx_kl            | 6.5143686e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.94         |
|    explained_variance   | 4.4e-05       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.233         |
|    n_updates            | 4230          |
|    policy_gradient_loss | -0.000191     |
|    value_loss           | 0.295         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.65e+04     |
|    ep_rew_mean          | 596          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 433          |
|    time_elapsed         | 797          |
|    total_timesteps      | 110848       |
| train/                  |              |
|    approx_kl            | 4.216563e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.94        |
|    explained_variance   | 0.0217       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0941       |
|    n_updates            | 4320         |
|    policy_gradient_loss | -4.03e-05    |
|    value_loss           | 0.21         |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.65e+04     |
|    ep_rew_mean          | 596          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 442          |
|    time_elapsed         | 812          |
|    total_timesteps      | 113152       |
| train/                  |              |
|    approx_kl            | 7.289462e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.93        |
|    explained_variance   | -0.000995    |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0849       |
|    n_updates            | 4410         |
|    policy_gradient_loss | -0.00041     |
|    value_loss           | 0.139        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 596           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 452           |
|    time_elapsed         | 829           |
|    total_timesteps      | 115712        |
| train/                  |               |
|    approx_kl            | 1.8370338e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.93         |
|    explained_variance   | 0.0474        |
|    learning_rate        | 1e-06         |
|    loss                 | 125           |
|    n_updates            | 4510          |
|    policy_gradient_loss | 1.41e-05      |
|    value_loss           | 271           |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 596           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 462           |
|    time_elapsed         | 846           |
|    total_timesteps      | 118272        |
| train/                  |               |
|    approx_kl            | 1.4756806e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.93         |
|    explained_variance   | 0.00123       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.071         |
|    n_updates            | 4610          |
|    policy_gradient_loss | -8.13e-05     |
|    value_loss           | 0.161         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 596           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 471           |
|    time_elapsed         | 862           |
|    total_timesteps      | 120576        |
| train/                  |               |
|    approx_kl            | 2.1099113e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.93         |
|    explained_variance   | -0.0173       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0657        |
|    n_updates            | 4700          |
|    policy_gradient_loss | -9.33e-05     |
|    value_loss           | 0.236         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.65e+04     |
|    ep_rew_mean          | 596          |
| time/                   |              |
|    fps                  | 140          |
|    iterations           | 480          |
|    time_elapsed         | 877          |
|    total_timesteps      | 122880       |
| train/                  |              |
|    approx_kl            | 8.479459e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.93        |
|    explained_variance   | -0.00173     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0673       |
|    n_updates            | 4790         |
|    policy_gradient_loss | -0.000323    |
|    value_loss           | 0.14         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.76e+04      |
|    ep_rew_mean          | 569           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 489           |
|    time_elapsed         | 892           |
|    total_timesteps      | 125184        |
| train/                  |               |
|    approx_kl            | 1.1660159e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.93         |
|    explained_variance   | -0.00319      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0714        |
|    n_updates            | 4880          |
|    policy_gradient_loss | -0.000104     |
|    value_loss           | 0.184         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.76e+04      |
|    ep_rew_mean          | 569           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 498           |
|    time_elapsed         | 907           |
|    total_timesteps      | 127488        |
| train/                  |               |
|    approx_kl            | 3.7348364e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.93         |
|    explained_variance   | 0.0397        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0882        |
|    n_updates            | 4970          |
|    policy_gradient_loss | -0.000186     |
|    value_loss           | 0.147         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.76e+04      |
|    ep_rew_mean          | 569           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 507           |
|    time_elapsed         | 922           |
|    total_timesteps      | 129792        |
| train/                  |               |
|    approx_kl            | 8.8568777e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.93         |
|    explained_variance   | 0.0434        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0406        |
|    n_updates            | 5060          |
|    policy_gradient_loss | -7.26e-05     |
|    value_loss           | 0.126         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.76e+04     |
|    ep_rew_mean          | 569          |
| time/                   |              |
|    fps                  | 140          |
|    iterations           | 517          |
|    time_elapsed         | 940          |
|    total_timesteps      | 132352       |
| train/                  |              |
|    approx_kl            | 7.899944e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.93        |
|    explained_variance   | 8.11e-06     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.151        |
|    n_updates            | 5160         |
|    policy_gradient_loss | -9.83e-05    |
|    value_loss           | 0.292        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.76e+04      |
|    ep_rew_mean          | 569           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 526           |
|    time_elapsed         | 955           |
|    total_timesteps      | 134656        |
| train/                  |               |
|    approx_kl            | 2.5711488e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.93         |
|    explained_variance   | 0.00322       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0764        |
|    n_updates            | 5250          |
|    policy_gradient_loss | -9.88e-05     |
|    value_loss           | 0.22          |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.76e+04      |
|    ep_rew_mean          | 569           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 535           |
|    time_elapsed         | 971           |
|    total_timesteps      | 136960        |
| train/                  |               |
|    approx_kl            | 2.5286572e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.93         |
|    explained_variance   | 0.000174      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.125         |
|    n_updates            | 5340          |
|    policy_gradient_loss | -0.000201     |
|    value_loss           | 0.279         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.76e+04     |
|    ep_rew_mean          | 569          |
| time/                   |              |
|    fps                  | 141          |
|    iterations           | 544          |
|    time_elapsed         | 986          |
|    total_timesteps      | 139264       |
| train/                  |              |
|    approx_kl            | 1.601642e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.93        |
|    explained_variance   | -0.000668    |
|    learning_rate        | 1e-06        |
|    loss                 | 0.112        |
|    n_updates            | 5430         |
|    policy_gradient_loss | -0.000106    |
|    value_loss           | 0.191        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.74e+04      |
|    ep_rew_mean          | 572           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 553           |
|    time_elapsed         | 1003          |
|    total_timesteps      | 141568        |
| train/                  |               |
|    approx_kl            | 2.0542648e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.93         |
|    explained_variance   | 0.0248        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0694        |
|    n_updates            | 5520          |
|    policy_gradient_loss | -5.44e-05     |
|    value_loss           | 0.142         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.74e+04     |
|    ep_rew_mean          | 572          |
| time/                   |              |
|    fps                  | 141          |
|    iterations           | 562          |
|    time_elapsed         | 1018         |
|    total_timesteps      | 143872       |
| train/                  |              |
|    approx_kl            | 2.776971e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.93        |
|    explained_variance   | 0.000318     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0641       |
|    n_updates            | 5610         |
|    policy_gradient_loss | -3.78e-05    |
|    value_loss           | 0.164        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.74e+04      |
|    ep_rew_mean          | 572           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 572           |
|    time_elapsed         | 1035          |
|    total_timesteps      | 146432        |
| train/                  |               |
|    approx_kl            | 4.6018977e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.93         |
|    explained_variance   | 6.99e-05      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0845        |
|    n_updates            | 5710          |
|    policy_gradient_loss | -0.000236     |
|    value_loss           | 0.149         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.74e+04      |
|    ep_rew_mean          | 572           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 581           |
|    time_elapsed         | 1051          |
|    total_timesteps      | 148736        |
| train/                  |               |
|    approx_kl            | 2.1208543e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.93         |
|    explained_variance   | 0.00012       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.193         |
|    n_updates            | 5800          |
|    policy_gradient_loss | -0.000187     |
|    value_loss           | 0.383         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.74e+04      |
|    ep_rew_mean          | 572           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 590           |
|    time_elapsed         | 1067          |
|    total_timesteps      | 151040        |
| train/                  |               |
|    approx_kl            | 1.6549602e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.93         |
|    explained_variance   | 0.000194      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.142         |
|    n_updates            | 5890          |
|    policy_gradient_loss | -0.000114     |
|    value_loss           | 0.352         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.74e+04      |
|    ep_rew_mean          | 572           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 599           |
|    time_elapsed         | 1082          |
|    total_timesteps      | 153344        |
| train/                  |               |
|    approx_kl            | 3.4391414e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.93         |
|    explained_variance   | 0.00109       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0946        |
|    n_updates            | 5980          |
|    policy_gradient_loss | -0.000124     |
|    value_loss           | 0.154         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.74e+04     |
|    ep_rew_mean          | 572          |
| time/                   |              |
|    fps                  | 141          |
|    iterations           | 608          |
|    time_elapsed         | 1098         |
|    total_timesteps      | 155648       |
| train/                  |              |
|    approx_kl            | 3.217021e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.93        |
|    explained_variance   | 0.000417     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0822       |
|    n_updates            | 6070         |
|    policy_gradient_loss | -0.000134    |
|    value_loss           | 0.182        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.73e+04      |
|    ep_rew_mean          | 567           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 617           |
|    time_elapsed         | 1113          |
|    total_timesteps      | 157952        |
| train/                  |               |
|    approx_kl            | 1.4873222e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.93         |
|    explained_variance   | 0.0205        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.039         |
|    n_updates            | 6160          |
|    policy_gradient_loss | -7.08e-05     |
|    value_loss           | 0.0955        |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.73e+04     |
|    ep_rew_mean          | 567          |
| time/                   |              |
|    fps                  | 141          |
|    iterations           | 626          |
|    time_elapsed         | 1130         |
|    total_timesteps      | 160256       |
| train/                  |              |
|    approx_kl            | 9.017531e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.93        |
|    explained_variance   | 0.00809      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0531       |
|    n_updates            | 6250         |
|    policy_gradient_loss | -1.86e-05    |
|    value_loss           | 0.108        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.73e+04      |
|    ep_rew_mean          | 567           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 636           |
|    time_elapsed         | 1147          |
|    total_timesteps      | 162816        |
| train/                  |               |
|    approx_kl            | 1.8100254e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.93         |
|    explained_variance   | -0.00566      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0667        |
|    n_updates            | 6350          |
|    policy_gradient_loss | -0.000187     |
|    value_loss           | 0.112         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.64e+04     |
|    ep_rew_mean          | 569          |
| time/                   |              |
|    fps                  | 141          |
|    iterations           | 645          |
|    time_elapsed         | 1163         |
|    total_timesteps      | 165120       |
| train/                  |              |
|    approx_kl            | 7.352792e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.93        |
|    explained_variance   | 0.000269     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.046        |
|    n_updates            | 6440         |
|    policy_gradient_loss | -1.51e-05    |
|    value_loss           | 0.135        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.64e+04      |
|    ep_rew_mean          | 569           |
| time/                   |               |
|    fps                  | 142           |
|    iterations           | 654           |
|    time_elapsed         | 1178          |
|    total_timesteps      | 167424        |
| train/                  |               |
|    approx_kl            | 1.5057158e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.93         |
|    explained_variance   | -0.000328     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0781        |
|    n_updates            | 6530          |
|    policy_gradient_loss | -0.000153     |
|    value_loss           | 0.299         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.64e+04     |
|    ep_rew_mean          | 569          |
| time/                   |              |
|    fps                  | 142          |
|    iterations           | 663          |
|    time_elapsed         | 1194         |
|    total_timesteps      | 169728       |
| train/                  |              |
|    approx_kl            | 7.867347e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.93        |
|    explained_variance   | 1.14e-05     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0861       |
|    n_updates            | 6620         |
|    policy_gradient_loss | -0.000151    |
|    value_loss           | 0.165        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.64e+04      |
|    ep_rew_mean          | 569           |
| time/                   |               |
|    fps                  | 142           |
|    iterations           | 672           |
|    time_elapsed         | 1210          |
|    total_timesteps      | 172032        |
| train/                  |               |
|    approx_kl            | 1.3890676e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.93         |
|    explained_variance   | -0.00315      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0572        |
|    n_updates            | 6710          |
|    policy_gradient_loss | -0.000119     |
|    value_loss           | 0.139         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.64e+04      |
|    ep_rew_mean          | 569           |
| time/                   |               |
|    fps                  | 142           |
|    iterations           | 681           |
|    time_elapsed         | 1226          |
|    total_timesteps      | 174336        |
| train/                  |               |
|    approx_kl            | 8.0256723e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.93         |
|    explained_variance   | 9.52e-05      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0961        |
|    n_updates            | 6800          |
|    policy_gradient_loss | -7.26e-05     |
|    value_loss           | 0.21          |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.64e+04      |
|    ep_rew_mean          | 569           |
| time/                   |               |
|    fps                  | 142           |
|    iterations           | 690           |
|    time_elapsed         | 1241          |
|    total_timesteps      | 176640        |
| train/                  |               |
|    approx_kl            | 4.2608008e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.93         |
|    explained_variance   | 0.00222       |
|    learning_rate        | 1e-06         |
|    loss                 | 85.9          |
|    n_updates            | 6890          |
|    policy_gradient_loss | -4.31e-06     |
|    value_loss           | 178           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.61e+04      |
|    ep_rew_mean          | 600           |
| time/                   |               |
|    fps                  | 142           |
|    iterations           | 699           |
|    time_elapsed         | 1257          |
|    total_timesteps      | 178944        |
| train/                  |               |
|    approx_kl            | 3.3224933e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.93         |
|    explained_variance   | 6.74e-05      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0841        |
|    n_updates            | 6980          |
|    policy_gradient_loss | -4.07e-05     |
|    value_loss           | 0.181         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.61e+04      |
|    ep_rew_mean          | 600           |
| time/                   |               |
|    fps                  | 142           |
|    iterations           | 708           |
|    time_elapsed         | 1273          |
|    total_timesteps      | 181248        |
| train/                  |               |
|    approx_kl            | 3.3755787e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.93         |
|    explained_variance   | 2.75e-05      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0928        |
|    n_updates            | 7070          |
|    policy_gradient_loss | -0.000321     |
|    value_loss           | 0.167         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.61e+04      |
|    ep_rew_mean          | 600           |
| time/                   |               |
|    fps                  | 142           |
|    iterations           | 717           |
|    time_elapsed         | 1288          |
|    total_timesteps      | 183552        |
| train/                  |               |
|    approx_kl            | 5.6810677e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.93         |
|    explained_variance   | 0.0114        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.145         |
|    n_updates            | 7160          |
|    policy_gradient_loss | -8.4e-05      |
|    value_loss           | 0.311         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.61e+04      |
|    ep_rew_mean          | 600           |
| time/                   |               |
|    fps                  | 142           |
|    iterations           | 726           |
|    time_elapsed         | 1303          |
|    total_timesteps      | 185856        |
| train/                  |               |
|    approx_kl            | 1.8964056e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.92         |
|    explained_variance   | 6.54e-05      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0868        |
|    n_updates            | 7250          |
|    policy_gradient_loss | -0.000172     |
|    value_loss           | 0.274         |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.61e+04     |
|    ep_rew_mean          | 600          |
| time/                   |              |
|    fps                  | 142          |
|    iterations           | 735          |
|    time_elapsed         | 1319         |
|    total_timesteps      | 188160       |
| train/                  |              |
|    approx_kl            | 6.139744e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.92        |
|    explained_variance   | 0.0114       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.135        |
|    n_updates            | 7340         |
|    policy_gradient_loss | -7.93e-05    |
|    value_loss           | 0.244        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.61e+04      |
|    ep_rew_mean          | 600           |
| time/                   |               |
|    fps                  | 142           |
|    iterations           | 744           |
|    time_elapsed         | 1336          |
|    total_timesteps      | 190464        |
| train/                  |               |
|    approx_kl            | 0.00014157011 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.93         |
|    explained_variance   | 0.00226       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0429        |
|    n_updates            | 7430          |
|    policy_gradient_loss | -0.000433     |
|    value_loss           | 0.117         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.61e+04     |
|    ep_rew_mean          | 600          |
| time/                   |              |
|    fps                  | 142          |
|    iterations           | 753          |
|    time_elapsed         | 1351         |
|    total_timesteps      | 192768       |
| train/                  |              |
|    approx_kl            | 4.954124e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.93        |
|    explained_variance   | 0.00335      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0538       |
|    n_updates            | 7520         |
|    policy_gradient_loss | -0.000386    |
|    value_loss           | 0.0927       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.61e+04      |
|    ep_rew_mean          | 587           |
| time/                   |               |
|    fps                  | 142           |
|    iterations           | 762           |
|    time_elapsed         | 1367          |
|    total_timesteps      | 195072        |
| train/                  |               |
|    approx_kl            | 2.5797635e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.93         |
|    explained_variance   | -0.00631      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0838        |
|    n_updates            | 7610          |
|    policy_gradient_loss | -2.39e-05     |
|    value_loss           | 0.162         |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.61e+04     |
|    ep_rew_mean          | 587          |
| time/                   |              |
|    fps                  | 142          |
|    iterations           | 771          |
|    time_elapsed         | 1382         |
|    total_timesteps      | 197376       |
| train/                  |              |
|    approx_kl            | 6.041955e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.92        |
|    explained_variance   | -0.000139    |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0375       |
|    n_updates            | 7700         |
|    policy_gradient_loss | -0.000135    |
|    value_loss           | 0.0883       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.61e+04      |
|    ep_rew_mean          | 587           |
| time/                   |               |
|    fps                  | 142           |
|    iterations           | 780           |
|    time_elapsed         | 1397          |
|    total_timesteps      | 199680        |
| train/                  |               |
|    approx_kl            | 1.5357509e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.92         |
|    explained_variance   | -0.0154       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0523        |
|    n_updates            | 7790          |
|    policy_gradient_loss | -8.37e-05     |
|    value_loss           | 0.129         |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.61e+04     |
|    ep_rew_mean          | 587          |
| time/                   |              |
|    fps                  | 142          |
|    iterations           | 790          |
|    time_elapsed         | 1415         |
|    total_timesteps      | 202240       |
| train/                  |              |
|    approx_kl            | 1.629442e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.92        |
|    explained_variance   | 0.00648      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0931       |
|    n_updates            | 7890         |
|    policy_gradient_loss | -0.000234    |
|    value_loss           | 0.206        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.61e+04    |
|    ep_rew_mean          | 587         |
| time/                   |             |
|    fps                  | 142         |
|    iterations           | 799         |
|    time_elapsed         | 1430        |
|    total_timesteps      | 204544      |
| train/                  |             |
|    approx_kl            | 2.58605e-06 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -1.92       |
|    explained_variance   | 1.19e-05    |
|    learning_rate        | 1e-06       |
|    loss                 | 0.135       |
|    n_updates            | 7980        |
|    policy_gradient_loss | -0.00026    |
|    value_loss           | 0.296       |
-----------------------------------------
----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.61e+04

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.61e+04      |
|    ep_rew_mean          | 587           |
| time/                   |               |
|    fps                  | 143           |
|    iterations           | 808           |
|    time_elapsed         | 1446          |
|    total_timesteps      | 206848        |
| train/                  |               |
|    approx_kl            | 9.1502443e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.92         |
|    explained_variance   | 0.0239        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0619        |
|    n_updates            | 8070          |
|    policy_gradient_loss | -6.5e-05      |
|    value_loss           | 0.161         |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.61e+04     |
|    ep_rew_mean          | 587          |
| time/                   |              |
|    fps                  | 143          |
|    iterations           | 817          |
|    time_elapsed         | 1461         |
|    total_timesteps      | 209152       |
| train/                  |              |
|    approx_kl            | 3.608875e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.93        |
|    explained_variance   | 0.00021      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0594       |
|    n_updates            | 8160         |
|    policy_gradient_loss | -5.17e-05    |
|    value_loss           | 0.117        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.61e+04      |
|    ep_rew_mean          | 587           |
| time/                   |               |
|    fps                  | 143           |
|    iterations           | 826           |
|    time_elapsed         | 1477          |
|    total_timesteps      | 211456        |
| train/                  |               |
|    approx_kl            | 8.4447674e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.92         |
|    explained_variance   | 0.0187        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0952        |
|    n_updates            | 8250          |
|    policy_gradient_loss | -0.000105     |
|    value_loss           | 0.135         |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.64e+04     |
|    ep_rew_mean          | 604          |
| time/                   |              |
|    fps                  | 143          |
|    iterations           | 835          |
|    time_elapsed         | 1491         |
|    total_timesteps      | 213760       |
| train/                  |              |
|    approx_kl            | 4.004687e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.92        |
|    explained_variance   | -0.00169     |
|    learning_rate        | 1e-06        |
|    loss                 | 53.4         |
|    n_updates            | 8340         |
|    policy_gradient_loss | 7.83e-06     |
|    value_loss           | 171          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.64e+04     |
|    ep_rew_mean          | 604          |
| time/                   |              |
|    fps                  | 143          |
|    iterations           | 845          |
|    time_elapsed         | 1508         |
|    total_timesteps      | 216320       |
| train/                  |              |
|    approx_kl            | 8.707866e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.92        |
|    explained_variance   | 0.0104       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0478       |
|    n_updates            | 8440         |
|    policy_gradient_loss | -6.28e-05    |
|    value_loss           | 0.092        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.64e+04     |
|    ep_rew_mean          | 604          |
| time/                   |              |
|    fps                  | 143          |
|    iterations           | 854          |
|    time_elapsed         | 1523         |
|    total_timesteps      | 218624       |
| train/                  |              |
|    approx_kl            | 3.966503e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.92        |
|    explained_variance   | 0.000325     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0602       |
|    n_updates            | 8530         |
|    policy_gradient_loss | -0.000179    |
|    value_loss           | 0.144        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.64e+04      |
|    ep_rew_mean          | 604           |
| time/                   |               |
|    fps                  | 143           |
|    iterations           | 863           |
|    time_elapsed         | 1540          |
|    total_timesteps      | 220928        |
| train/                  |               |
|    approx_kl            | 7.2154216e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.92         |
|    explained_variance   | 0.000414      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0448        |
|    n_updates            | 8620          |
|    policy_gradient_loss | -0.000348     |
|    value_loss           | 0.0914        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.64e+04      |
|    ep_rew_mean          | 604           |
| time/                   |               |
|    fps                  | 143           |
|    iterations           | 872           |
|    time_elapsed         | 1557          |
|    total_timesteps      | 223232        |
| train/                  |               |
|    approx_kl            | 8.1257895e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.92         |
|    explained_variance   | -0.00127      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.104         |
|    n_updates            | 8710          |
|    policy_gradient_loss | -1.18e-05     |
|    value_loss           | 0.238         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.64e+04     |
|    ep_rew_mean          | 604          |
| time/                   |              |
|    fps                  | 143          |
|    iterations           | 881          |
|    time_elapsed         | 1574         |
|    total_timesteps      | 225536       |
| train/                  |              |
|    approx_kl            | 2.104626e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.92        |
|    explained_variance   | 0.00705      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0976       |
|    n_updates            | 8800         |
|    policy_gradient_loss | -0.000449    |
|    value_loss           | 0.225        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.64e+04      |
|    ep_rew_mean          | 604           |
| time/                   |               |
|    fps                  | 143           |
|    iterations           | 890           |
|    time_elapsed         | 1590          |
|    total_timesteps      | 227840        |
| train/                  |               |
|    approx_kl            | 1.0910444e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.92         |
|    explained_variance   | 0.00226       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0449        |
|    n_updates            | 8890          |
|    policy_gradient_loss | -5.95e-05     |
|    value_loss           | 0.118         |
-------------------------------------------
----------------------------------------
| rollout/                |        

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.64e+04      |
|    ep_rew_mean          | 604           |
| time/                   |               |
|    fps                  | 143           |
|    iterations           | 899           |
|    time_elapsed         | 1608          |
|    total_timesteps      | 230144        |
| train/                  |               |
|    approx_kl            | 3.4226105e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.92         |
|    explained_variance   | 0.0124        |
|    learning_rate        | 1e-06         |
|    loss                 | 22.4          |
|    n_updates            | 8980          |
|    policy_gradient_loss | 3.66e-07      |
|    value_loss           | 52.6          |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.64e+04      |
|    ep_rew_mean          | 604           |
| time/                   |               |
|    fps                  | 142           |
|    iterations           | 908           |
|    time_elapsed         | 1625          |
|    total_timesteps      | 232448        |
| train/                  |               |
|    approx_kl            | 7.6158904e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.92         |
|    explained_variance   | 5.26e-05      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0705        |
|    n_updates            | 9070          |
|    policy_gradient_loss | -2.75e-05     |
|    value_loss           | 0.145         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.64e+04      |
|    ep_rew_mean          | 604           |
| time/                   |               |
|    fps                  | 142           |
|    iterations           | 917           |
|    time_elapsed         | 1642          |
|    total_timesteps      | 234752        |
| train/                  |               |
|    approx_kl            | 2.3492612e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.92         |
|    explained_variance   | -3.6e-05      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0742        |
|    n_updates            | 9160          |
|    policy_gradient_loss | -3.58e-05     |
|    value_loss           | 0.161         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.64e+04      |
|    ep_rew_mean          | 604           |
| time/                   |               |
|    fps                  | 142           |
|    iterations           | 926           |
|    time_elapsed         | 1659          |
|    total_timesteps      | 237056        |
| train/                  |               |
|    approx_kl            | 1.6563572e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.92         |
|    explained_variance   | -0.000172     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0837        |
|    n_updates            | 9250          |
|    policy_gradient_loss | -5.49e-05     |
|    value_loss           | 0.173         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.64e+04      |
|    ep_rew_mean          | 604           |
| time/                   |               |
|    fps                  | 142           |
|    iterations           | 935           |
|    time_elapsed         | 1676          |
|    total_timesteps      | 239360        |
| train/                  |               |
|    approx_kl            | 1.5553553e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.92         |
|    explained_variance   | 0.00337       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.151         |
|    n_updates            | 9340          |
|    policy_gradient_loss | -0.000333     |
|    value_loss           | 0.258         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.64e+04      |
|    ep_rew_mean          | 604           |
| time/                   |               |
|    fps                  | 142           |
|    iterations           | 944           |
|    time_elapsed         | 1693          |
|    total_timesteps      | 241664        |
| train/                  |               |
|    approx_kl            | 5.0845556e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.92         |
|    explained_variance   | -0.000661     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.226         |
|    n_updates            | 9430          |
|    policy_gradient_loss | -0.000205     |
|    value_loss           | 0.396         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.64e+04    |
|    ep_rew_mean          | 604         |
| time/                   |             |
|    fps                  | 142         |
|    iterations           | 953         |
|    time_elapsed         | 1710        |
|    total_timesteps      | 243968      |
| train/                  |             |
|    approx_kl            | 8.84796e-05 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -1.92       |
|    explained_variance   | -0.000118   |
|    learning_rate        | 1e-06       |
|    loss                 | 0.045       |
|    n_updates            | 9520        |
|    policy_gradient_loss | -0.00041    |
|    value_loss           | 0.104       |
-----------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.64e+04      |
|    ep_rew_mean          | 604           |
| time/                   |               |
|    fps                  | 142           |
|    iterations           | 963           |
|    time_elapsed         | 1729          |
|    total_timesteps      | 246528        |
| train/                  |               |
|    approx_kl            | 1.0158401e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.92         |
|    explained_variance   | 0.00347       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0396        |
|    n_updates            | 9620          |
|    policy_gradient_loss | -8.53e-05     |
|    value_loss           | 0.107         |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.66e+04     |
|    ep_rew_mean          | 621          |
| time/                   |              |
|    fps                  | 142          |
|    iterations           | 972          |
|    time_elapsed         | 1746         |
|    total_timesteps      | 248832       |
| train/                  |              |
|    approx_kl            | 8.144416e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.92        |
|    explained_variance   | -0.000218    |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0568       |
|    n_updates            | 9710         |
|    policy_gradient_loss | -9.25e-05    |
|    value_loss           | 0.117        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.66e+04    |
|    ep_rew_mean          | 621         |
| time/                   |             |
|    fps                  | 142         |
|    iterations           | 981         |
|    time_elapsed         | 1763        |
|    total_timesteps      | 251136      |
| train/                  |             |
|    approx_kl            | 6.56303e-06 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -1.92       |
|    explained_variance   | -0.000462   |
|    learning_rate        | 1e-06       |
|    loss                 | 0.0663      |
|    n_updates            | 9800        |
|    policy_gradient_loss | -0.000165   |
|    value_loss           | 0.138       |
-----------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.66e+04      |
|    ep_rew_mean          | 621           |
| time/                   |               |
|    fps                  | 142           |
|    iterations           | 990           |
|    time_elapsed         | 1780          |
|    total_timesteps      | 253440        |
| train/                  |               |
|    approx_kl            | 1.1620577e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.92         |
|    explained_variance   | -0.0257       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.057         |
|    n_updates            | 9890          |
|    policy_gradient_loss | -7.13e-05     |
|    value_loss           | 0.103         |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.66e+04     |
|    ep_rew_mean          | 621          |
| time/                   |              |
|    fps                  | 142          |
|    iterations           | 1000         |
|    time_elapsed         | 1799         |
|    total_timesteps      | 256000       |
| train/                  |              |
|    approx_kl            | 5.518086e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.92        |
|    explained_variance   | -5.56e-05    |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0654       |
|    n_updates            | 9990         |
|    policy_gradient_loss | -5.16e-05    |
|    value_loss           | 0.108        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.66e+04      |
|    ep_rew_mean          | 621           |
| time/                   |               |
|    fps                  | 142           |
|    iterations           | 1009          |
|    time_elapsed         | 1815          |
|    total_timesteps      | 258304        |
| train/                  |               |
|    approx_kl            | 1.0244548e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.92         |
|    explained_variance   | -2.79e-05     |
|    learning_rate        | 1e-06         |
|    loss                 | 31.7          |
|    n_updates            | 10080         |
|    policy_gradient_loss | -3.35e-06     |
|    value_loss           | 98.9          |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.66e+04      |
|    ep_rew_mean          | 621           |
| time/                   |               |
|    fps                  | 142           |
|    iterations           | 1018          |
|    time_elapsed         | 1833          |
|    total_timesteps      | 260608        |
| train/                  |               |
|    approx_kl            | 3.7166756e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.92         |
|    explained_variance   | 6.37e-05      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.143         |
|    n_updates            | 10170         |
|    policy_gradient_loss | -0.000175     |
|    value_loss           | 0.231         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.66e+04     |
|    ep_rew_mean          | 621          |
| time/                   |              |
|    fps                  | 142          |
|    iterations           | 1027         |
|    time_elapsed         | 1850         |
|    total_timesteps      | 262912       |
| train/                  |              |
|    approx_kl            | 9.918585e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.91        |
|    explained_variance   | -3.46e-05    |
|    learning_rate        | 1e-06        |
|    loss                 | 0.116        |
|    n_updates            | 10260        |
|    policy_gradient_loss | -6.13e-05    |
|    value_loss           | 0.204        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.66e+04     |
|    ep_rew_mean          | 621          |
| time/                   |              |
|    fps                  | 142          |
|    iterations           | 1036         |
|    time_elapsed         | 1867         |
|    total_timesteps      | 265216       |
| train/                  |              |
|    approx_kl            | 7.084105e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.92        |
|    explained_variance   | 0.00446      |
|    learning_rate        | 1e-06        |
|    loss                 | 234          |
|    n_updates            | 10350        |
|    policy_gradient_loss | -9.23e-05    |
|    value_loss           | 508          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.66e+04      |
|    ep_rew_mean          | 621           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 1045          |
|    time_elapsed         | 1884          |
|    total_timesteps      | 267520        |
| train/                  |               |
|    approx_kl            | 1.0081567e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.91         |
|    explained_variance   | 0.00165       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.212         |
|    n_updates            | 10440         |
|    policy_gradient_loss | -0.000159     |
|    value_loss           | 0.281         |
-------------------------------------------
-----------------------------------------
| rollout/                |       

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.66e+04     |
|    ep_rew_mean          | 621          |
| time/                   |              |
|    fps                  | 141          |
|    iterations           | 1054         |
|    time_elapsed         | 1901         |
|    total_timesteps      | 269824       |
| train/                  |              |
|    approx_kl            | 9.567244e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.91        |
|    explained_variance   | 0.00559      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0423       |
|    n_updates            | 10530        |
|    policy_gradient_loss | -0.000404    |
|    value_loss           | 0.143        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.66e+04     |
|    ep_rew_mean          | 621          |
| time/                   |              |
|    fps                  | 141          |
|    iterations           | 1063         |
|    time_elapsed         | 1918         |
|    total_timesteps      | 272128       |
| train/                  |              |
|    approx_kl            | 5.553011e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.91        |
|    explained_variance   | 8.92e-05     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0777       |
|    n_updates            | 10620        |
|    policy_gradient_loss | -7.27e-05    |
|    value_loss           | 0.129        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.7e+04       |
|    ep_rew_mean          | 614           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 1072          |
|    time_elapsed         | 1935          |
|    total_timesteps      | 274432        |
| train/                  |               |
|    approx_kl            | 1.4482066e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.91         |
|    explained_variance   | 0.00827       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0465        |
|    n_updates            | 10710         |
|    policy_gradient_loss | -2.49e-05     |
|    value_loss           | 0.099         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.7e+04      |
|    ep_rew_mean          | 614          |
| time/                   |              |
|    fps                  | 141          |
|    iterations           | 1081         |
|    time_elapsed         | 1952         |
|    total_timesteps      | 276736       |
| train/                  |              |
|    approx_kl            | 8.640345e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.91        |
|    explained_variance   | 0.00541      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.049        |
|    n_updates            | 10800        |
|    policy_gradient_loss | -8.22e-05    |
|    value_loss           | 0.125        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.7e+04      |
|    ep_rew_mean          | 614          |
| time/                   |              |
|    fps                  | 141          |
|    iterations           | 1090         |
|    time_elapsed         | 1969         |
|    total_timesteps      | 279040       |
| train/                  |              |
|    approx_kl            | 3.622612e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.91        |
|    explained_variance   | 0.000735     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0834       |
|    n_updates            | 10890        |
|    policy_gradient_loss | -0.000187    |
|    value_loss           | 0.138        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.7e+04       |
|    ep_rew_mean          | 614           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 1099          |
|    time_elapsed         | 1987          |
|    total_timesteps      | 281344        |
| train/                  |               |
|    approx_kl            | 1.7229468e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.91         |
|    explained_variance   | -0.0202       |
|    learning_rate        | 1e-06         |
|    loss                 | 499           |
|    n_updates            | 10980         |
|    policy_gradient_loss | -3.34e-06     |
|    value_loss           | 938           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.7e+04       |
|    ep_rew_mean          | 614           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 1108          |
|    time_elapsed         | 2004          |
|    total_timesteps      | 283648        |
| train/                  |               |
|    approx_kl            | 5.7239085e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.91         |
|    explained_variance   | -0.0105       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.102         |
|    n_updates            | 11070         |
|    policy_gradient_loss | -0.000184     |
|    value_loss           | 0.24          |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.7e+04      |
|    ep_rew_mean          | 614          |
| time/                   |              |
|    fps                  | 141          |
|    iterations           | 1117         |
|    time_elapsed         | 2021         |
|    total_timesteps      | 285952       |
| train/                  |              |
|    approx_kl            | 4.924601e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.91        |
|    explained_variance   | 0.00212      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.11         |
|    n_updates            | 11160        |
|    policy_gradient_loss | -0.000129    |
|    value_loss           | 0.22         |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.7e+04      |
|    ep_rew_mean          | 614          |
| time/                   |              |
|    fps                  | 141          |
|    iterations           | 1126         |
|    time_elapsed         | 2038         |
|    total_timesteps      | 288256       |
| train/                  |              |
|    approx_kl            | 5.753245e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.91        |
|    explained_variance   | 0.00317      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0603       |
|    n_updates            | 11250        |
|    policy_gradient_loss | -7.68e-05    |
|    value_loss           | 0.154        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.7e+04      |
|    ep_rew_mean          | 614          |
| time/                   |              |
|    fps                  | 141          |
|    iterations           | 1136         |
|    time_elapsed         | 2057         |
|    total_timesteps      | 290816       |
| train/                  |              |
|    approx_kl            | 3.608875e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.91        |
|    explained_variance   | 0.00387      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0459       |
|    n_updates            | 11350        |
|    policy_gradient_loss | -3.08e-06    |
|    value_loss           | 0.0878       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.7e+04       |
|    ep_rew_mean          | 614           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 1145          |
|    time_elapsed         | 2074          |
|    total_timesteps      | 293120        |
| train/                  |               |
|    approx_kl            | 5.5946875e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.91         |
|    explained_variance   | 0.031         |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0942        |
|    n_updates            | 11440         |
|    policy_gradient_loss | -8.98e-05     |
|    value_loss           | 0.161         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.7e+04       |
|    ep_rew_mean          | 614           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 1154          |
|    time_elapsed         | 2091          |
|    total_timesteps      | 295424        |
| train/                  |               |
|    approx_kl            | 2.0596199e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.91         |
|    explained_variance   | 0.00105       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.09          |
|    n_updates            | 11530         |
|    policy_gradient_loss | -0.000111     |
|    value_loss           | 0.157         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.65e+04     |
|    ep_rew_mean          | 613          |
| time/                   |              |
|    fps                  | 141          |
|    iterations           | 1163         |
|    time_elapsed         | 2108         |
|    total_timesteps      | 297728       |
| train/                  |              |
|    approx_kl            | 8.614734e-09 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.91        |
|    explained_variance   | 0.0052       |
|    learning_rate        | 1e-06        |
|    loss                 | 319          |
|    n_updates            | 11620        |
|    policy_gradient_loss | 1.12e-07     |
|    value_loss           | 752          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 613           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 1172          |
|    time_elapsed         | 2126          |
|    total_timesteps      | 300032        |
| train/                  |               |
|    approx_kl            | 1.2367964e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.91         |
|    explained_variance   | 0.0031        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0412        |
|    n_updates            | 11710         |
|    policy_gradient_loss | -5.84e-05     |
|    value_loss           | 0.0946        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 613           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 1181          |
|    time_elapsed         | 2143          |
|    total_timesteps      | 302336        |
| train/                  |               |
|    approx_kl            | 2.0489097e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.91         |
|    explained_variance   | 0.00353       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0796        |
|    n_updates            | 11800         |
|    policy_gradient_loss | -2.09e-05     |
|    value_loss           | 0.144         |
-------------------------------------------
--------------------------------------------
| rollout/                |    

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 613           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 1190          |
|    time_elapsed         | 2160          |
|    total_timesteps      | 304640        |
| train/                  |               |
|    approx_kl            | 3.9227307e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.91         |
|    explained_variance   | -0.00569      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0462        |
|    n_updates            | 11890         |
|    policy_gradient_loss | -3.15e-05     |
|    value_loss           | 0.103         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 613           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 1199          |
|    time_elapsed         | 2177          |
|    total_timesteps      | 306944        |
| train/                  |               |
|    approx_kl            | 1.7723069e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.91         |
|    explained_variance   | -0.00196      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.14          |
|    n_updates            | 11980         |
|    policy_gradient_loss | -7.12e-05     |
|    value_loss           | 0.35          |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 613           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 1208          |
|    time_elapsed         | 2194          |
|    total_timesteps      | 309248        |
| train/                  |               |
|    approx_kl            | 1.0157237e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.91         |
|    explained_variance   | 0.0047        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.135         |
|    n_updates            | 12070         |
|    policy_gradient_loss | -9.58e-05     |
|    value_loss           | 0.317         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.65e+04     |
|    ep_rew_mean          | 613          |
| time/                   |              |
|    fps                  | 140          |
|    iterations           | 1217         |
|    time_elapsed         | 2211         |
|    total_timesteps      | 311552       |
| train/                  |              |
|    approx_kl            | 8.333009e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.91        |
|    explained_variance   | -0.0122      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0521       |
|    n_updates            | 12160        |
|    policy_gradient_loss | -6.78e-05    |
|    value_loss           | 0.113        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.65e+04     |
|    ep_rew_mean          | 607          |
| time/                   |              |
|    fps                  | 140          |
|    iterations           | 1226         |
|    time_elapsed         | 2227         |
|    total_timesteps      | 313856       |
| train/                  |              |
|    approx_kl            | 3.098976e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.91        |
|    explained_variance   | 0.0154       |
|    learning_rate        | 1e-06        |
|    loss                 | 294          |
|    n_updates            | 12250        |
|    policy_gradient_loss | 1.82e-05     |
|    value_loss           | 642          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 607           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 1235          |
|    time_elapsed         | 2242          |
|    total_timesteps      | 316160        |
| train/                  |               |
|    approx_kl            | 3.3841934e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.91         |
|    explained_variance   | 0.012         |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0416        |
|    n_updates            | 12340         |
|    policy_gradient_loss | -0.000311     |
|    value_loss           | 0.0945        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.65e+04     |
|    ep_rew_mean          | 607          |
| time/                   |              |
|    fps                  | 141          |
|    iterations           | 1244         |
|    time_elapsed         | 2258         |
|    total_timesteps      | 318464       |
| train/                  |              |
|    approx_kl            | 9.284122e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.91        |
|    explained_variance   | 0.000211     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0561       |
|    n_updates            | 12430        |
|    policy_gradient_loss | -0.000143    |
|    value_loss           | 0.143        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 607           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 1253          |
|    time_elapsed         | 2275          |
|    total_timesteps      | 320768        |
| train/                  |               |
|    approx_kl            | 5.9744343e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.91         |
|    explained_variance   | -5.13e-06     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0433        |
|    n_updates            | 12520         |
|    policy_gradient_loss | -7.11e-05     |
|    value_loss           | 0.0963        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.65e+04     |
|    ep_rew_mean          | 607          |
| time/                   |              |
|    fps                  | 141          |
|    iterations           | 1262         |
|    time_elapsed         | 2291         |
|    total_timesteps      | 323072       |
| train/                  |              |
|    approx_kl            | 5.064765e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.91        |
|    explained_variance   | -0.00452     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.137        |
|    n_updates            | 12610        |
|    policy_gradient_loss | -5.82e-05    |
|    value_loss           | 0.289        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 607           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 1271          |
|    time_elapsed         | 2306          |
|    total_timesteps      | 325376        |
| train/                  |               |
|    approx_kl            | 1.7241109e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.91         |
|    explained_variance   | 0.00226       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.119         |
|    n_updates            | 12700         |
|    policy_gradient_loss | -0.000133     |
|    value_loss           | 0.309         |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.65e+04     |
|    ep_rew_mean          | 607          |
| time/                   |              |
|    fps                  | 141          |
|    iterations           | 1280         |
|    time_elapsed         | 2322         |
|    total_timesteps      | 327680       |
| train/                  |              |
|    approx_kl            | 4.852889e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.91        |
|    explained_variance   | 0.0151       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0832       |
|    n_updates            | 12790        |
|    policy_gradient_loss | -2.79e-05    |
|    value_loss           | 0.143        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.65e+04     |
|    ep_rew_mean          | 612          |
| time/                   |              |
|    fps                  | 141          |
|    iterations           | 1290         |
|    time_elapsed         | 2341         |
|    total_timesteps      | 330240       |
| train/                  |              |
|    approx_kl            | 5.355105e-09 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.91        |
|    explained_variance   | -0.00478     |
|    learning_rate        | 1e-06        |
|    loss                 | 469          |
|    n_updates            | 12890        |
|    policy_gradient_loss | 1.88e-06     |
|    value_loss           | 908          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.65e+04     |
|    ep_rew_mean          | 612          |
| time/                   |              |
|    fps                  | 141          |
|    iterations           | 1299         |
|    time_elapsed         | 2357         |
|    total_timesteps      | 332544       |
| train/                  |              |
|    approx_kl            | 4.239846e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.91        |
|    explained_variance   | -0.0284      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0855       |
|    n_updates            | 12980        |
|    policy_gradient_loss | -3.45e-05    |
|    value_loss           | 0.155        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 612           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 1308          |
|    time_elapsed         | 2374          |
|    total_timesteps      | 334848        |
| train/                  |               |
|    approx_kl            | 1.1352822e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.91         |
|    explained_variance   | 0.00374       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0556        |
|    n_updates            | 13070         |
|    policy_gradient_loss | -8.09e-05     |
|    value_loss           | 0.119         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 612           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 1317          |
|    time_elapsed         | 2391          |
|    total_timesteps      | 337152        |
| train/                  |               |
|    approx_kl            | 3.1499658e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.91         |
|    explained_variance   | 0.00417       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.039         |
|    n_updates            | 13160         |
|    policy_gradient_loss | -4.51e-05     |
|    value_loss           | 0.0993        |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 612           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 1326          |
|    time_elapsed         | 2407          |
|    total_timesteps      | 339456        |
| train/                  |               |
|    approx_kl            | 6.5667555e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.9          |
|    explained_variance   | -0.00041      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.103         |
|    n_updates            | 13250         |
|    policy_gradient_loss | -0.000364     |
|    value_loss           | 0.242         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 612           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 1335          |
|    time_elapsed         | 2425          |
|    total_timesteps      | 341760        |
| train/                  |               |
|    approx_kl            | 2.0270701e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.9          |
|    explained_variance   | 0.000423      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.11          |
|    n_updates            | 13340         |
|    policy_gradient_loss | -0.000199     |
|    value_loss           | 0.24          |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.65e+04     |
|    ep_rew_mean          | 612          |
| time/                   |              |
|    fps                  | 140          |
|    iterations           | 1345         |
|    time_elapsed         | 2444         |
|    total_timesteps      | 344320       |
| train/                  |              |
|    approx_kl            | 2.229819e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.9         |
|    explained_variance   | 0.00033      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0476       |
|    n_updates            | 13440        |
|    policy_gradient_loss | -0.000204    |
|    value_loss           | 0.107        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 606           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 1354          |
|    time_elapsed         | 2461          |
|    total_timesteps      | 346624        |
| train/                  |               |
|    approx_kl            | 1.1594966e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.9          |
|    explained_variance   | 0.00656       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0627        |
|    n_updates            | 13530         |
|    policy_gradient_loss | -3.42e-05     |
|    value_loss           | 0.126         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 606           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 1363          |
|    time_elapsed         | 2477          |
|    total_timesteps      | 348928        |
| train/                  |               |
|    approx_kl            | 1.9441359e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.9          |
|    explained_variance   | -0.0116       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0861        |
|    n_updates            | 13620         |
|    policy_gradient_loss | -1.57e-05     |
|    value_loss           | 0.125         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 606           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 1373          |
|    time_elapsed         | 2496          |
|    total_timesteps      | 351488        |
| train/                  |               |
|    approx_kl            | 2.4493784e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.9          |
|    explained_variance   | 0.0385        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.056         |
|    n_updates            | 13720         |
|    policy_gradient_loss | -4.79e-05     |
|    value_loss           | 0.0952        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 606           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 1382          |
|    time_elapsed         | 2512          |
|    total_timesteps      | 353792        |
| train/                  |               |
|    approx_kl            | 2.0279549e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.9          |
|    explained_variance   | -0.0696       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0431        |
|    n_updates            | 13810         |
|    policy_gradient_loss | -2.31e-05     |
|    value_loss           | 0.0926        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.54e+04      |
|    ep_rew_mean          | 610           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 1391          |
|    time_elapsed         | 2527          |
|    total_timesteps      | 356096        |
| train/                  |               |
|    approx_kl            | 3.4226105e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.9          |
|    explained_variance   | 0.0394        |
|    learning_rate        | 1e-06         |
|    loss                 | 55            |
|    n_updates            | 13900         |
|    policy_gradient_loss | 1.45e-05      |
|    value_loss           | 174           |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.54e+04      |
|    ep_rew_mean          | 610           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 1400          |
|    time_elapsed         | 2543          |
|    total_timesteps      | 358400        |
| train/                  |               |
|    approx_kl            | 3.1739473e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.9          |
|    explained_variance   | -0.000365     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0791        |
|    n_updates            | 13990         |
|    policy_gradient_loss | -8.58e-05     |
|    value_loss           | 0.165         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.54e+04      |
|    ep_rew_mean          | 610           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 1409          |
|    time_elapsed         | 2559          |
|    total_timesteps      | 360704        |
| train/                  |               |
|    approx_kl            | 3.1890813e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.9          |
|    explained_variance   | 1.2e-05       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0781        |
|    n_updates            | 14080         |
|    policy_gradient_loss | -0.00011      |
|    value_loss           | 0.129         |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.54e+04     |
|    ep_rew_mean          | 610          |
| time/                   |              |
|    fps                  | 140          |
|    iterations           | 1418         |
|    time_elapsed         | 2575         |
|    total_timesteps      | 363008       |
| train/                  |              |
|    approx_kl            | 8.614734e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.9         |
|    explained_variance   | 0.013        |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0693       |
|    n_updates            | 14170        |
|    policy_gradient_loss | -2.39e-05    |
|    value_loss           | 0.0965       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.52e+04     |
|    ep_rew_mean          | 625          |
| time/                   |              |
|    fps                  | 140          |
|    iterations           | 1427         |
|    time_elapsed         | 2592         |
|    total_timesteps      | 365312       |
| train/                  |              |
|    approx_kl            | 7.683411e-09 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.9         |
|    explained_variance   | 1.13e-06     |
|    learning_rate        | 1e-06        |
|    loss                 | 420          |
|    n_updates            | 14260        |
|    policy_gradient_loss | 6.98e-07     |
|    value_loss           | 953          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.52e+04      |
|    ep_rew_mean          | 625           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 1437          |
|    time_elapsed         | 2610          |
|    total_timesteps      | 367872        |
| train/                  |               |
|    approx_kl            | 4.7089998e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.9          |
|    explained_variance   | -1.78e-05     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0757        |
|    n_updates            | 14360         |
|    policy_gradient_loss | -0.000117     |
|    value_loss           | 0.116         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.52e+04      |
|    ep_rew_mean          | 625           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 1446          |
|    time_elapsed         | 2627          |
|    total_timesteps      | 370176        |
| train/                  |               |
|    approx_kl            | 2.0246953e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.9          |
|    explained_variance   | -0.000213     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.044         |
|    n_updates            | 14450         |
|    policy_gradient_loss | -0.000128     |
|    value_loss           | 0.0897        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.52e+04     |
|    ep_rew_mean          | 625          |
| time/                   |              |
|    fps                  | 140          |
|    iterations           | 1455         |
|    time_elapsed         | 2644         |
|    total_timesteps      | 372480       |
| train/                  |              |
|    approx_kl            | 7.073395e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.9         |
|    explained_variance   | -0.012       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0643       |
|    n_updates            | 14540        |
|    policy_gradient_loss | -8.27e-05    |
|    value_loss           | 0.149        |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.52e+04      |
|    ep_rew_mean          | 625           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 1465          |
|    time_elapsed         | 2663          |
|    total_timesteps      | 375040        |
| train/                  |               |
|    approx_kl            | 6.5518543e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.9          |
|    explained_variance   | -0.000101     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.138         |
|    n_updates            | 14640         |
|    policy_gradient_loss | -5.46e-05     |
|    value_loss           | 0.306         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.52e+04     |
|    ep_rew_mean          | 625          |
| time/                   |              |
|    fps                  | 140          |
|    iterations           | 1474         |
|    time_elapsed         | 2680         |
|    total_timesteps      | 377344       |
| train/                  |              |
|    approx_kl            | 8.277362e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.9         |
|    explained_variance   | -4.94e-05    |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0923       |
|    n_updates            | 14730        |
|    policy_gradient_loss | -0.000229    |
|    value_loss           | 0.217        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.52e+04     |
|    ep_rew_mean          | 625          |
| time/                   |              |
|    fps                  | 140          |
|    iterations           | 1483         |
|    time_elapsed         | 2697         |
|    total_timesteps      | 379648       |
| train/                  |              |
|    approx_kl            | 3.027264e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.9         |
|    explained_variance   | 8.88e-05     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0749       |
|    n_updates            | 14820        |
|    policy_gradient_loss | -0.000105    |
|    value_loss           | 0.146        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.52e+04      |
|    ep_rew_mean          | 645           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 1492          |
|    time_elapsed         | 2714          |
|    total_timesteps      | 381952        |
| train/                  |               |
|    approx_kl            | 6.0184393e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.9          |
|    explained_variance   | 0.000431      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0493        |
|    n_updates            | 14910         |
|    policy_gradient_loss | -5.07e-05     |
|    value_loss           | 0.116         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.52e+04     |
|    ep_rew_mean          | 645          |
| time/                   |              |
|    fps                  | 140          |
|    iterations           | 1501         |
|    time_elapsed         | 2730         |
|    total_timesteps      | 384256       |
| train/                  |              |
|    approx_kl            | 7.248018e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.9         |
|    explained_variance   | -5.01e-05    |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0453       |
|    n_updates            | 15000        |
|    policy_gradient_loss | -6.72e-05    |
|    value_loss           | 0.1          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.52e+04      |
|    ep_rew_mean          | 645           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 1510          |
|    time_elapsed         | 2745          |
|    total_timesteps      | 386560        |
| train/                  |               |
|    approx_kl            | 5.7695433e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.9          |
|    explained_variance   | 8.36e-05      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0416        |
|    n_updates            | 15090         |
|    policy_gradient_loss | -5.33e-05     |
|    value_loss           | 0.141         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.52e+04     |
|    ep_rew_mean          | 645          |
| time/                   |              |
|    fps                  | 140          |
|    iterations           | 1519         |
|    time_elapsed         | 2761         |
|    total_timesteps      | 388864       |
| train/                  |              |
|    approx_kl            | 4.172325e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.9         |
|    explained_variance   | -9.52e-05    |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0572       |
|    n_updates            | 15180        |
|    policy_gradient_loss | -6.54e-05    |
|    value_loss           | 0.107        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.52e+04      |
|    ep_rew_mean          | 645           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 1528          |
|    time_elapsed         | 2777          |
|    total_timesteps      | 391168        |
| train/                  |               |
|    approx_kl            | 5.2223913e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.9          |
|    explained_variance   | 0.000449      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.101         |
|    n_updates            | 15270         |
|    policy_gradient_loss | -3.51e-05     |
|    value_loss           | 0.22          |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.52e+04      |
|    ep_rew_mean          | 645           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 1537          |
|    time_elapsed         | 2793          |
|    total_timesteps      | 393472        |
| train/                  |               |
|    approx_kl            | 4.1443855e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.9          |
|    explained_variance   | -0.00701      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.204         |
|    n_updates            | 15360         |
|    policy_gradient_loss | -6.25e-06     |
|    value_loss           | 0.359         |
-------------------------------------------
-----------------------------------------
| rollout/                |       

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.52e+04     |
|    ep_rew_mean          | 645          |
| time/                   |              |
|    fps                  | 140          |
|    iterations           | 1546         |
|    time_elapsed         | 2808         |
|    total_timesteps      | 395776       |
| train/                  |              |
|    approx_kl            | 9.941868e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.9         |
|    explained_variance   | 0.0411       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0463       |
|    n_updates            | 15450        |
|    policy_gradient_loss | -3.15e-05    |
|    value_loss           | 0.0963       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.52e+04      |
|    ep_rew_mean          | 645           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 1555          |
|    time_elapsed         | 2824          |
|    total_timesteps      | 398080        |
| train/                  |               |
|    approx_kl            | 1.6032718e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.9          |
|    explained_variance   | -0.00518      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0686        |
|    n_updates            | 15540         |
|    policy_gradient_loss | -0.000165     |
|    value_loss           | 0.13          |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.52e+04      |
|    ep_rew_mean          | 645           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 1564          |
|    time_elapsed         | 2840          |
|    total_timesteps      | 400384        |
| train/                  |               |
|    approx_kl            | 1.2770761e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.9          |
|    explained_variance   | -0.000275     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0434        |
|    n_updates            | 15630         |
|    policy_gradient_loss | -0.000144     |
|    value_loss           | 0.0946        |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.52e+04      |
|    ep_rew_mean          | 645           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 1573          |
|    time_elapsed         | 2855          |
|    total_timesteps      | 402688        |
| train/                  |               |
|    approx_kl            | 4.1513704e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.9          |
|    explained_variance   | 7.12e-05      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0522        |
|    n_updates            | 15720         |
|    policy_gradient_loss | -3.43e-05     |
|    value_loss           | 0.0961        |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.56e+04      |
|    ep_rew_mean          | 640           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 1582          |
|    time_elapsed         | 2871          |
|    total_timesteps      | 404992        |
| train/                  |               |
|    approx_kl            | 4.3725595e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.9          |
|    explained_variance   | -1.96e-05     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0496        |
|    n_updates            | 15810         |
|    policy_gradient_loss | -4.8e-05      |
|    value_loss           | 0.108         |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.56e+04     |
|    ep_rew_mean          | 640          |
| time/                   |              |
|    fps                  | 141          |
|    iterations           | 1591         |
|    time_elapsed         | 2886         |
|    total_timesteps      | 407296       |
| train/                  |              |
|    approx_kl            | 7.362105e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.9         |
|    explained_variance   | -0.0108      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0565       |
|    n_updates            | 15900        |
|    policy_gradient_loss | -8.01e-05    |
|    value_loss           | 0.0886       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.56e+04      |
|    ep_rew_mean          | 640           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 1600          |
|    time_elapsed         | 2902          |
|    total_timesteps      | 409600        |
| train/                  |               |
|    approx_kl            | 8.8475645e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.9          |
|    explained_variance   | 0.0375        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0445        |
|    n_updates            | 15990         |
|    policy_gradient_loss | -8.77e-05     |
|    value_loss           | 0.103         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.56e+04     |
|    ep_rew_mean          | 640          |
| time/                   |              |
|    fps                  | 141          |
|    iterations           | 1609         |
|    time_elapsed         | 2918         |
|    total_timesteps      | 411904       |
| train/                  |              |
|    approx_kl            | 6.509945e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.9         |
|    explained_variance   | 0.00802      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0475       |
|    n_updates            | 16080        |
|    policy_gradient_loss | -5.82e-05    |
|    value_loss           | 0.112        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.56e+04      |
|    ep_rew_mean          | 640           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 1618          |
|    time_elapsed         | 2933          |
|    total_timesteps      | 414208        |
| train/                  |               |
|    approx_kl            | 7.7323057e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.9          |
|    explained_variance   | -0.00767      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.1           |
|    n_updates            | 16170         |
|    policy_gradient_loss | -3.69e-05     |
|    value_loss           | 0.227         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.56e+04      |
|    ep_rew_mean          | 640           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 1627          |
|    time_elapsed         | 2948          |
|    total_timesteps      | 416512        |
| train/                  |               |
|    approx_kl            | 1.4412217e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.9          |
|    explained_variance   | -0.00757      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.145         |
|    n_updates            | 16260         |
|    policy_gradient_loss | -2.26e-05     |
|    value_loss           | 0.25          |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.56e+04      |
|    ep_rew_mean          | 640           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 1636          |
|    time_elapsed         | 2964          |
|    total_timesteps      | 418816        |
| train/                  |               |
|    approx_kl            | 4.1956082e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | 0.00599       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0481        |
|    n_updates            | 16350         |
|    policy_gradient_loss | -5.1e-05      |
|    value_loss           | 0.098         |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.56e+04     |
|    ep_rew_mean          | 640          |
| time/                   |              |
|    fps                  | 141          |
|    iterations           | 1645         |
|    time_elapsed         | 2980         |
|    total_timesteps      | 421120       |
| train/                  |              |
|    approx_kl            | 5.532056e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.9         |
|    explained_variance   | -0.0107      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0524       |
|    n_updates            | 16440        |
|    policy_gradient_loss | -4.9e-05     |
|    value_loss           | 0.109        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.56e+04      |
|    ep_rew_mean          | 640           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 1654          |
|    time_elapsed         | 2995          |
|    total_timesteps      | 423424        |
| train/                  |               |
|    approx_kl            | 1.2051081e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | -0.0197       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0383        |
|    n_updates            | 16530         |
|    policy_gradient_loss | -0.000428     |
|    value_loss           | 0.0923        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.57e+04     |
|    ep_rew_mean          | 651          |
| time/                   |              |
|    fps                  | 141          |
|    iterations           | 1663         |
|    time_elapsed         | 3010         |
|    total_timesteps      | 425728       |
| train/                  |              |
|    approx_kl            | 3.387686e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.89        |
|    explained_variance   | -0.0116      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0389       |
|    n_updates            | 16620        |
|    policy_gradient_loss | -6.22e-05    |
|    value_loss           | 0.0919       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.57e+04      |
|    ep_rew_mean          | 651           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 1673          |
|    time_elapsed         | 3027          |
|    total_timesteps      | 428288        |
| train/                  |               |
|    approx_kl            | 2.4425332e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | -0.0614       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0426        |
|    n_updates            | 16720         |
|    policy_gradient_loss | -0.000129     |
|    value_loss           | 0.0945        |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.57e+04      |
|    ep_rew_mean          | 651           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 1682          |
|    time_elapsed         | 3044          |
|    total_timesteps      | 430592        |
| train/                  |               |
|    approx_kl            | 1.7508864e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | -0.000172     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0503        |
|    n_updates            | 16810         |
|    policy_gradient_loss | -1.54e-07     |
|    value_loss           | 0.0896        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.57e+04      |
|    ep_rew_mean          | 651           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 1691          |
|    time_elapsed         | 3059          |
|    total_timesteps      | 432896        |
| train/                  |               |
|    approx_kl            | 1.4591496e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | 0.000143      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0454        |
|    n_updates            | 16900         |
|    policy_gradient_loss | -0.000145     |
|    value_loss           | 0.115         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.57e+04     |
|    ep_rew_mean          | 651          |
| time/                   |              |
|    fps                  | 141          |
|    iterations           | 1700         |
|    time_elapsed         | 3075         |
|    total_timesteps      | 435200       |
| train/                  |              |
|    approx_kl            | 6.670598e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.89        |
|    explained_variance   | 0.000335     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.149        |
|    n_updates            | 16990        |
|    policy_gradient_loss | -9.36e-05    |
|    value_loss           | 0.282        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.57e+04      |
|    ep_rew_mean          | 651           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 1709          |
|    time_elapsed         | 3090          |
|    total_timesteps      | 437504        |
| train/                  |               |
|    approx_kl            | 1.3755634e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | -0.00587      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.106         |
|    n_updates            | 17080         |
|    policy_gradient_loss | -6.19e-05     |
|    value_loss           | 0.257         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.57e+04      |
|    ep_rew_mean          | 651           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 1718          |
|    time_elapsed         | 3105          |
|    total_timesteps      | 439808        |
| train/                  |               |
|    approx_kl            | 2.6798807e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | 0.011         |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0554        |
|    n_updates            | 17170         |
|    policy_gradient_loss | -2.26e-05     |
|    value_loss           | 0.117         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.57e+04      |
|    ep_rew_mean          | 651           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 1727          |
|    time_elapsed         | 3121          |
|    total_timesteps      | 442112        |
| train/                  |               |
|    approx_kl            | 4.4796616e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | 0.00168       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0453        |
|    n_updates            | 17260         |
|    policy_gradient_loss | -8.49e-05     |
|    value_loss           | 0.107         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.57e+04     |
|    ep_rew_mean          | 651          |
| time/                   |              |
|    fps                  | 141          |
|    iterations           | 1736         |
|    time_elapsed         | 3137         |
|    total_timesteps      | 444416       |
| train/                  |              |
|    approx_kl            | 9.140931e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.89        |
|    explained_variance   | 5.26e-05     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.041        |
|    n_updates            | 17350        |
|    policy_gradient_loss | -8.13e-05    |
|    value_loss           | 0.0885       |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.57e+04      |
|    ep_rew_mean          | 651           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 1745          |
|    time_elapsed         | 3152          |
|    total_timesteps      | 446720        |
| train/                  |               |
|    approx_kl            | 1.0691583e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.9          |
|    explained_variance   | -9.66e-06     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.064         |
|    n_updates            | 17440         |
|    policy_gradient_loss | -0.000111     |
|    value_loss           | 0.123         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.57e+04      |
|    ep_rew_mean          | 651           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 1754          |
|    time_elapsed         | 3168          |
|    total_timesteps      | 449024        |
| train/                  |               |
|    approx_kl            | 6.0047023e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.9          |
|    explained_variance   | -0.000232     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0564        |
|    n_updates            | 17530         |
|    policy_gradient_loss | -8.85e-05     |
|    value_loss           | 0.124         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 651           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 1764          |
|    time_elapsed         | 3185          |
|    total_timesteps      | 451584        |
| train/                  |               |
|    approx_kl            | 3.7455233e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.9          |
|    explained_variance   | -0.00528      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.112         |
|    n_updates            | 17630         |
|    policy_gradient_loss | -0.000599     |
|    value_loss           | 0.257         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.6e+04      |
|    ep_rew_mean          | 651          |
| time/                   |              |
|    fps                  | 141          |
|    iterations           | 1773         |
|    time_elapsed         | 3201         |
|    total_timesteps      | 453888       |
| train/                  |              |
|    approx_kl            | 5.662441e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.9         |
|    explained_variance   | -0.00519     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0425       |
|    n_updates            | 17720        |
|    policy_gradient_loss | -6.18e-05    |
|    value_loss           | 0.0907       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.6e+04      |
|    ep_rew_mean          | 651          |
| time/                   |              |
|    fps                  | 141          |
|    iterations           | 1782         |
|    time_elapsed         | 3216         |
|    total_timesteps      | 456192       |
| train/                  |              |
|    approx_kl            | 6.374903e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.89        |
|    explained_variance   | 0.00231      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0601       |
|    n_updates            | 17810        |
|    policy_gradient_loss | -6.84e-05    |
|    value_loss           | 0.107        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 651           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 1791          |
|    time_elapsed         | 3231          |
|    total_timesteps      | 458496        |
| train/                  |               |
|    approx_kl            | 2.0272564e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | 0.0061        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.104         |
|    n_updates            | 17900         |
|    policy_gradient_loss | -6.17e-05     |
|    value_loss           | 0.213         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 651           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 1800          |
|    time_elapsed         | 3247          |
|    total_timesteps      | 460800        |
| train/                  |               |
|    approx_kl            | 2.6151538e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | -0.0442       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.182         |
|    n_updates            | 17990         |
|    policy_gradient_loss | -0.000155     |
|    value_loss           | 0.372         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 651           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 1809          |
|    time_elapsed         | 3263          |
|    total_timesteps      | 463104        |
| train/                  |               |
|    approx_kl            | 6.0210004e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | 0.000968      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0464        |
|    n_updates            | 18080         |
|    policy_gradient_loss | -5.87e-05     |
|    value_loss           | 0.0929        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 657           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 1818          |
|    time_elapsed         | 3278          |
|    total_timesteps      | 465408        |
| train/                  |               |
|    approx_kl            | 1.1618249e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | 0.00239       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0488        |
|    n_updates            | 18170         |
|    policy_gradient_loss | -7.48e-06     |
|    value_loss           | 0.0956        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 657           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 1827          |
|    time_elapsed         | 3294          |
|    total_timesteps      | 467712        |
| train/                  |               |
|    approx_kl            | 2.2538006e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | 0.0893        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0529        |
|    n_updates            | 18260         |
|    policy_gradient_loss | -9.87e-05     |
|    value_loss           | 0.0989        |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 657           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 1836          |
|    time_elapsed         | 3310          |
|    total_timesteps      | 470016        |
| train/                  |               |
|    approx_kl            | 2.4656765e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | 0.0205        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0474        |
|    n_updates            | 18350         |
|    policy_gradient_loss | -0.000116     |
|    value_loss           | 0.09          |
-------------------------------------------
--------------------------------------------
| rollout/                |    

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 657           |
| time/                   |               |
|    fps                  | 142           |
|    iterations           | 1845          |
|    time_elapsed         | 3325          |
|    total_timesteps      | 472320        |
| train/                  |               |
|    approx_kl            | 3.1176023e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | 0.000141      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0626        |
|    n_updates            | 18440         |
|    policy_gradient_loss | -3.68e-05     |
|    value_loss           | 0.11          |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 657           |
| time/                   |               |
|    fps                  | 142           |
|    iterations           | 1854          |
|    time_elapsed         | 3341          |
|    total_timesteps      | 474624        |
| train/                  |               |
|    approx_kl            | 1.2968667e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | 0.00872       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0999        |
|    n_updates            | 18530         |
|    policy_gradient_loss | -2.03e-05     |
|    value_loss           | 0.215         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.6e+04      |
|    ep_rew_mean          | 657          |
| time/                   |              |
|    fps                  | 142          |
|    iterations           | 1863         |
|    time_elapsed         | 3356         |
|    total_timesteps      | 476928       |
| train/                  |              |
|    approx_kl            | 7.718336e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.89        |
|    explained_variance   | 0.00131      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0889       |
|    n_updates            | 18620        |
|    policy_gradient_loss | -3.36e-05    |
|    value_loss           | 0.229        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.6e+04      |
|    ep_rew_mean          | 657          |
| time/                   |              |
|    fps                  | 142          |
|    iterations           | 1872         |
|    time_elapsed         | 3371         |
|    total_timesteps      | 479232       |
| train/                  |              |
|    approx_kl            | 5.175825e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.89        |
|    explained_variance   | 0.0166       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0521       |
|    n_updates            | 18710        |
|    policy_gradient_loss | -5.98e-05    |
|    value_loss           | 0.0866       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 659           |
| time/                   |               |
|    fps                  | 142           |
|    iterations           | 1881          |
|    time_elapsed         | 3388          |
|    total_timesteps      | 481536        |
| train/                  |               |
|    approx_kl            | 3.8160942e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | 0.0311        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0745        |
|    n_updates            | 18800         |
|    policy_gradient_loss | -2.81e-05     |
|    value_loss           | 0.157         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 659           |
| time/                   |               |
|    fps                  | 142           |
|    iterations           | 1891          |
|    time_elapsed         | 3404          |
|    total_timesteps      | 484096        |
| train/                  |               |
|    approx_kl            | 6.1653554e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | -0.0392       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0465        |
|    n_updates            | 18900         |
|    policy_gradient_loss | -7.59e-05     |
|    value_loss           | 0.0936        |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.6e+04      |
|    ep_rew_mean          | 659          |
| time/                   |              |
|    fps                  | 142          |
|    iterations           | 1900         |
|    time_elapsed         | 3420         |
|    total_timesteps      | 486400       |
| train/                  |              |
|    approx_kl            | 2.165325e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.89        |
|    explained_variance   | 0.0235       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0392       |
|    n_updates            | 18990        |
|    policy_gradient_loss | -3.21e-05    |
|    value_loss           | 0.0866       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.6e+04      |
|    ep_rew_mean          | 659          |
| time/                   |              |
|    fps                  | 142          |
|    iterations           | 1910         |
|    time_elapsed         | 3437         |
|    total_timesteps      | 488960       |
| train/                  |              |
|    approx_kl            | 7.450581e-09 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.89        |
|    explained_variance   | -0.000297    |
|    learning_rate        | 1e-06        |
|    loss                 | 453          |
|    n_updates            | 19090        |
|    policy_gradient_loss | -1.92e-06    |
|    value_loss           | 965          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 659           |
| time/                   |               |
|    fps                  | 142           |
|    iterations           | 1919          |
|    time_elapsed         | 3454          |
|    total_timesteps      | 491264        |
| train/                  |               |
|    approx_kl            | 1.5478581e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | -0.0129       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0906        |
|    n_updates            | 19180         |
|    policy_gradient_loss | -0.000181     |
|    value_loss           | 0.206         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.6e+04      |
|    ep_rew_mean          | 659          |
| time/                   |              |
|    fps                  | 142          |
|    iterations           | 1928         |
|    time_elapsed         | 3470         |
|    total_timesteps      | 493568       |
| train/                  |              |
|    approx_kl            | 5.539041e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.89        |
|    explained_variance   | 0.00145      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.1          |
|    n_updates            | 19270        |
|    policy_gradient_loss | -8.01e-05    |
|    value_loss           | 0.228        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 659           |
| time/                   |               |
|    fps                  | 142           |
|    iterations           | 1937          |
|    time_elapsed         | 3487          |
|    total_timesteps      | 495872        |
| train/                  |               |
|    approx_kl            | 4.7450885e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | 0.0301        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0351        |
|    n_updates            | 19360         |
|    policy_gradient_loss | -4.63e-05     |
|    value_loss           | 0.0844        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 656           |
| time/                   |               |
|    fps                  | 142           |
|    iterations           | 1946          |
|    time_elapsed         | 3503          |
|    total_timesteps      | 498176        |
| train/                  |               |
|    approx_kl            | 2.7078204e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | 0.0124        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0494        |
|    n_updates            | 19450         |
|    policy_gradient_loss | -3.15e-05     |
|    value_loss           | 0.094         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.6e+04      |
|    ep_rew_mean          | 656          |
| time/                   |              |
|    fps                  | 142          |
|    iterations           | 1955         |
|    time_elapsed         | 3521         |
|    total_timesteps      | 500480       |
| train/                  |              |
|    approx_kl            | 2.621673e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.89        |
|    explained_variance   | -0.0184      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0722       |
|    n_updates            | 19540        |
|    policy_gradient_loss | -4.17e-05    |
|    value_loss           | 0.126        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.6e+04      |
|    ep_rew_mean          | 656          |
| time/                   |              |
|    fps                  | 142          |
|    iterations           | 1964         |
|    time_elapsed         | 3538         |
|    total_timesteps      | 502784       |
| train/                  |              |
|    approx_kl            | 8.030329e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.89        |
|    explained_variance   | -0.000939    |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0398       |
|    n_updates            | 19630        |
|    policy_gradient_loss | -7.04e-05    |
|    value_loss           | 0.0874       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.6e+04      |
|    ep_rew_mean          | 656          |
| time/                   |              |
|    fps                  | 142          |
|    iterations           | 1973         |
|    time_elapsed         | 3555         |
|    total_timesteps      | 505088       |
| train/                  |              |
|    approx_kl            | 6.030314e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.89        |
|    explained_variance   | 0.0427       |
|    learning_rate        | 1e-06        |
|    loss                 | 354          |
|    n_updates            | 19720        |
|    policy_gradient_loss | 1.8e-05      |
|    value_loss           | 733          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 656           |
| time/                   |               |
|    fps                  | 142           |
|    iterations           | 1982          |
|    time_elapsed         | 3572          |
|    total_timesteps      | 507392        |
| train/                  |               |
|    approx_kl            | 2.1220418e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | -0.000123     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0865        |
|    n_updates            | 19810         |
|    policy_gradient_loss | -0.000359     |
|    value_loss           | 0.247         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 656           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 1991          |
|    time_elapsed         | 3589          |
|    total_timesteps      | 509696        |
| train/                  |               |
|    approx_kl            | 1.5841797e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | -0.000175     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.112         |
|    n_updates            | 19900         |
|    policy_gradient_loss | -8.96e-05     |
|    value_loss           | 0.257         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.6e+04     |
|    ep_rew_mean          | 656         |
| time/                   |             |
|    fps                  | 141         |
|    iterations           | 2000        |
|    time_elapsed         | 3607        |
|    total_timesteps      | 512000      |
| train/                  |             |
|    approx_kl            | 8.73371e-06 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -1.89       |
|    explained_variance   | -0.000355   |
|    learning_rate        | 1e-06       |
|    loss                 | 0.0478      |
|    n_updates            | 19990       |
|    policy_gradient_loss | -0.00016    |
|    value_loss           | 0.0951      |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.6e

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 655           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 2009          |
|    time_elapsed         | 3624          |
|    total_timesteps      | 514304        |
| train/                  |               |
|    approx_kl            | 3.1734817e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | 0.0165        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0531        |
|    n_updates            | 20080         |
|    policy_gradient_loss | -4.08e-05     |
|    value_loss           | 0.0912        |
-------------------------------------------
-----------------------------------------
| rollout/                |       

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.6e+04      |
|    ep_rew_mean          | 655          |
| time/                   |              |
|    fps                  | 141          |
|    iterations           | 2018         |
|    time_elapsed         | 3641         |
|    total_timesteps      | 516608       |
| train/                  |              |
|    approx_kl            | 4.940666e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.89        |
|    explained_variance   | 0.0174       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0544       |
|    n_updates            | 20170        |
|    policy_gradient_loss | -8.93e-05    |
|    value_loss           | 0.114        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 655           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 2028          |
|    time_elapsed         | 3660          |
|    total_timesteps      | 519168        |
| train/                  |               |
|    approx_kl            | 1.2060627e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | 0.0117        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0527        |
|    n_updates            | 20270         |
|    policy_gradient_loss | -1.48e-05     |
|    value_loss           | 0.0935        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.6e+04      |
|    ep_rew_mean          | 655          |
| time/                   |              |
|    fps                  | 141          |
|    iterations           | 2037         |
|    time_elapsed         | 3677         |
|    total_timesteps      | 521472       |
| train/                  |              |
|    approx_kl            | 7.683411e-09 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.89        |
|    explained_variance   | -2.62e-06    |
|    learning_rate        | 1e-06        |
|    loss                 | 331          |
|    n_updates            | 20360        |
|    policy_gradient_loss | 1.86e-07     |
|    value_loss           | 589          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.59e+04      |
|    ep_rew_mean          | 683           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 2046          |
|    time_elapsed         | 3694          |
|    total_timesteps      | 523776        |
| train/                  |               |
|    approx_kl            | 8.1490725e-09 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | -1.19e-07     |
|    learning_rate        | 1e-06         |
|    loss                 | 674           |
|    n_updates            | 20450         |
|    policy_gradient_loss | -7.86e-07     |
|    value_loss           | 1.29e+03      |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.59e+04      |
|    ep_rew_mean          | 683           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 2055          |
|    time_elapsed         | 3711          |
|    total_timesteps      | 526080        |
| train/                  |               |
|    approx_kl            | 1.2682285e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | -0.00575      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.065         |
|    n_updates            | 20540         |
|    policy_gradient_loss | -1.77e-05     |
|    value_loss           | 0.122         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.59e+04      |
|    ep_rew_mean          | 683           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 2064          |
|    time_elapsed         | 3729          |
|    total_timesteps      | 528384        |
| train/                  |               |
|    approx_kl            | 1.1948869e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | -2.07e-05     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0703        |
|    n_updates            | 20630         |
|    policy_gradient_loss | -4.33e-05     |
|    value_loss           | 0.123         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.59e+04      |
|    ep_rew_mean          | 683           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 2073          |
|    time_elapsed         | 3746          |
|    total_timesteps      | 530688        |
| train/                  |               |
|    approx_kl            | 7.3737465e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | 0.00104       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0531        |
|    n_updates            | 20720         |
|    policy_gradient_loss | -6.23e-05     |
|    value_loss           | 0.0919        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.59e+04      |
|    ep_rew_mean          | 683           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 2082          |
|    time_elapsed         | 3763          |
|    total_timesteps      | 532992        |
| train/                  |               |
|    approx_kl            | 2.1024607e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | -0.0386       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0892        |
|    n_updates            | 20810         |
|    policy_gradient_loss | -4.57e-05     |
|    value_loss           | 0.256         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.59e+04     |
|    ep_rew_mean          | 683          |
| time/                   |              |
|    fps                  | 141          |
|    iterations           | 2091         |
|    time_elapsed         | 3780         |
|    total_timesteps      | 535296       |
| train/                  |              |
|    approx_kl            | 4.307367e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.89        |
|    explained_variance   | 0.025        |
|    learning_rate        | 1e-06        |
|    loss                 | 87.2         |
|    n_updates            | 20900        |
|    policy_gradient_loss | -8.83e-07    |
|    value_loss           | 176          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.59e+04     |
|    ep_rew_mean          | 683          |
| time/                   |              |
|    fps                  | 141          |
|    iterations           | 2100         |
|    time_elapsed         | 3798         |
|    total_timesteps      | 537600       |
| train/                  |              |
|    approx_kl            | 9.848736e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.89        |
|    explained_variance   | 0.00538      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0815       |
|    n_updates            | 20990        |
|    policy_gradient_loss | -7.86e-05    |
|    value_loss           | 0.131        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.59e+04      |
|    ep_rew_mean          | 684           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 2109          |
|    time_elapsed         | 3815          |
|    total_timesteps      | 539904        |
| train/                  |               |
|    approx_kl            | 5.9371814e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | 0.0109        |
|    learning_rate        | 1e-06         |
|    loss                 | 8.29          |
|    n_updates            | 21080         |
|    policy_gradient_loss | 3.94e-06      |
|    value_loss           | 20.2          |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.59e+04      |
|    ep_rew_mean          | 684           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 2118          |
|    time_elapsed         | 3833          |
|    total_timesteps      | 542208        |
| train/                  |               |
|    approx_kl            | 2.9755756e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | 0.0173        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.052         |
|    n_updates            | 21170         |
|    policy_gradient_loss | -5.02e-05     |
|    value_loss           | 0.0911        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.59e+04      |
|    ep_rew_mean          | 684           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 2127          |
|    time_elapsed         | 3851          |
|    total_timesteps      | 544512        |
| train/                  |               |
|    approx_kl            | 5.1436946e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | -0.000119     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0629        |
|    n_updates            | 21260         |
|    policy_gradient_loss | -0.000543     |
|    value_loss           | 0.103         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.59e+04      |
|    ep_rew_mean          | 684           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 2136          |
|    time_elapsed         | 3868          |
|    total_timesteps      | 546816        |
| train/                  |               |
|    approx_kl            | 8.1723556e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | 0.000264      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0478        |
|    n_updates            | 21350         |
|    policy_gradient_loss | -7.94e-05     |
|    value_loss           | 0.0877        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.57e+04      |
|    ep_rew_mean          | 685           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 2145          |
|    time_elapsed         | 3885          |
|    total_timesteps      | 549120        |
| train/                  |               |
|    approx_kl            | 9.2433766e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | -0.00202      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0645        |
|    n_updates            | 21440         |
|    policy_gradient_loss | -2.34e-05     |
|    value_loss           | 0.103         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.57e+04      |
|    ep_rew_mean          | 685           |
| time/                   |               |
|    fps                  | 141           |
|    iterations           | 2154          |
|    time_elapsed         | 3903          |
|    total_timesteps      | 551424        |
| train/                  |               |
|    approx_kl            | 1.3888348e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | 0.000836      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0528        |
|    n_updates            | 21530         |
|    policy_gradient_loss | -7.16e-05     |
|    value_loss           | 0.106         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.57e+04     |
|    ep_rew_mean          | 685          |
| time/                   |              |
|    fps                  | 141          |
|    iterations           | 2163         |
|    time_elapsed         | 3921         |
|    total_timesteps      | 553728       |
| train/                  |              |
|    approx_kl            | 1.855637e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.88        |
|    explained_variance   | 0.0278       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0439       |
|    n_updates            | 21620        |
|    policy_gradient_loss | -0.000176    |
|    value_loss           | 0.0947       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.57e+04     |
|    ep_rew_mean          | 685          |
| time/                   |              |
|    fps                  | 141          |
|    iterations           | 2172         |
|    time_elapsed         | 3938         |
|    total_timesteps      | 556032       |
| train/                  |              |
|    approx_kl            | 2.658926e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.89        |
|    explained_variance   | -0.0136      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0489       |
|    n_updates            | 21710        |
|    policy_gradient_loss | -4.46e-05    |
|    value_loss           | 0.11         |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.57e+04     |
|    ep_rew_mean          | 685          |
| time/                   |              |
|    fps                  | 141          |
|    iterations           | 2182         |
|    time_elapsed         | 3957         |
|    total_timesteps      | 558592       |
| train/                  |              |
|    approx_kl            | 5.518086e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.88        |
|    explained_variance   | 0.121        |
|    learning_rate        | 1e-06        |
|    loss                 | 0.151        |
|    n_updates            | 21810        |
|    policy_gradient_loss | -6.64e-05    |
|    value_loss           | 0.386        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.56e+04     |
|    ep_rew_mean          | 687          |
| time/                   |              |
|    fps                  | 141          |
|    iterations           | 2191         |
|    time_elapsed         | 3975         |
|    total_timesteps      | 560896       |
| train/                  |              |
|    approx_kl            | 1.010485e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.89        |
|    explained_variance   | 0.0156       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0705       |
|    n_updates            | 21900        |
|    policy_gradient_loss | -1.96e-05    |
|    value_loss           | 0.206        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.56e+04      |
|    ep_rew_mean          | 687           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 2200          |
|    time_elapsed         | 3994          |
|    total_timesteps      | 563200        |
| train/                  |               |
|    approx_kl            | 1.0470394e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | -0.000252     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0686        |
|    n_updates            | 21990         |
|    policy_gradient_loss | -9.49e-05     |
|    value_loss           | 0.126         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.56e+04      |
|    ep_rew_mean          | 687           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 2209          |
|    time_elapsed         | 4012          |
|    total_timesteps      | 565504        |
| train/                  |               |
|    approx_kl            | 4.1583553e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | -0.0243       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.047         |
|    n_updates            | 22080         |
|    policy_gradient_loss | -4.8e-05      |
|    value_loss           | 0.094         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.56e+04      |
|    ep_rew_mean          | 687           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 2218          |
|    time_elapsed         | 4029          |
|    total_timesteps      | 567808        |
| train/                  |               |
|    approx_kl            | 3.9695296e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | -5.26e-05     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0476        |
|    n_updates            | 22170         |
|    policy_gradient_loss | -7.99e-05     |
|    value_loss           | 0.0883        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

--------------------------------------------
| rollout/                |                |
|    ep_len_mean          | 1.56e+04       |
|    ep_rew_mean          | 687            |
| time/                   |                |
|    fps                  | 140            |
|    iterations           | 2227           |
|    time_elapsed         | 4047           |
|    total_timesteps      | 570112         |
| train/                  |                |
|    approx_kl            | 1.10827386e-07 |
|    clip_fraction        | 0              |
|    clip_range           | 0.2            |
|    entropy_loss         | -1.89          |
|    explained_variance   | -0.0415        |
|    learning_rate        | 1e-06          |
|    loss                 | 0.0969         |
|    n_updates            | 22260          |
|    policy_gradient_loss | -1.21e-05      |
|    value_loss           | 0.223          |
--------------------------------------------
------------------------------------------
| rollout/  

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.56e+04     |
|    ep_rew_mean          | 687          |
| time/                   |              |
|    fps                  | 140          |
|    iterations           | 2236         |
|    time_elapsed         | 4064         |
|    total_timesteps      | 572416       |
| train/                  |              |
|    approx_kl            | 5.958136e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.89        |
|    explained_variance   | -0.00303     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.127        |
|    n_updates            | 22350        |
|    policy_gradient_loss | -6.73e-05    |
|    value_loss           | 0.257        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.56e+04      |
|    ep_rew_mean          | 687           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 2245          |
|    time_elapsed         | 4081          |
|    total_timesteps      | 574720        |
| train/                  |               |
|    approx_kl            | 1.1194497e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | -0.000229     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0398        |
|    n_updates            | 22440         |
|    policy_gradient_loss | -7.27e-05     |
|    value_loss           | 0.0982        |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.56e+04      |
|    ep_rew_mean          | 687           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 2254          |
|    time_elapsed         | 4098          |
|    total_timesteps      | 577024        |
| train/                  |               |
|    approx_kl            | 2.4680048e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | -0.0222       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0546        |
|    n_updates            | 22530         |
|    policy_gradient_loss | -3.8e-05      |
|    value_loss           | 0.101         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.56e+04     |
|    ep_rew_mean          | 687          |
| time/                   |              |
|    fps                  | 140          |
|    iterations           | 2263         |
|    time_elapsed         | 4115         |
|    total_timesteps      | 579328       |
| train/                  |              |
|    approx_kl            | 5.271286e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.88        |
|    explained_variance   | 0.0115       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0452       |
|    n_updates            | 22620        |
|    policy_gradient_loss | -2.39e-05    |
|    value_loss           | 0.101        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.56e+04      |
|    ep_rew_mean          | 687           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 2272          |
|    time_elapsed         | 4133          |
|    total_timesteps      | 581632        |
| train/                  |               |
|    approx_kl            | 1.6577542e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | -0.0104       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0712        |
|    n_updates            | 22710         |
|    policy_gradient_loss | -2.78e-05     |
|    value_loss           | 0.16          |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.56e+04     |
|    ep_rew_mean          | 687          |
| time/                   |              |
|    fps                  | 140          |
|    iterations           | 2281         |
|    time_elapsed         | 4150         |
|    total_timesteps      | 583936       |
| train/                  |              |
|    approx_kl            | 7.136259e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.89        |
|    explained_variance   | -0.00488     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0362       |
|    n_updates            | 22800        |
|    policy_gradient_loss | -6.71e-05    |
|    value_loss           | 0.0885       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.58e+04      |
|    ep_rew_mean          | 683           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 2290          |
|    time_elapsed         | 4167          |
|    total_timesteps      | 586240        |
| train/                  |               |
|    approx_kl            | 5.2577816e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | 0.0129        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0356        |
|    n_updates            | 22890         |
|    policy_gradient_loss | -8.99e-05     |
|    value_loss           | 0.0985        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.58e+04      |
|    ep_rew_mean          | 683           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 2299          |
|    time_elapsed         | 4184          |
|    total_timesteps      | 588544        |
| train/                  |               |
|    approx_kl            | 2.0721927e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | 0.0154        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0487        |
|    n_updates            | 22980         |
|    policy_gradient_loss | -2.34e-05     |
|    value_loss           | 0.0868        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.58e+04     |
|    ep_rew_mean          | 683          |
| time/                   |              |
|    fps                  | 140          |
|    iterations           | 2308         |
|    time_elapsed         | 4201         |
|    total_timesteps      | 590848       |
| train/                  |              |
|    approx_kl            | 2.614688e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.89        |
|    explained_variance   | -0.000817    |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0504       |
|    n_updates            | 23070        |
|    policy_gradient_loss | -3.13e-05    |
|    value_loss           | 0.117        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.58e+04      |
|    ep_rew_mean          | 683           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 2317          |
|    time_elapsed         | 4218          |
|    total_timesteps      | 593152        |
| train/                  |               |
|    approx_kl            | 6.0535967e-09 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | 0.0567        |
|    learning_rate        | 1e-06         |
|    loss                 | 22.2          |
|    n_updates            | 23160         |
|    policy_gradient_loss | -4.01e-06     |
|    value_loss           | 38.2          |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.58e+04      |
|    ep_rew_mean          | 683           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 2326          |
|    time_elapsed         | 4235          |
|    total_timesteps      | 595456        |
| train/                  |               |
|    approx_kl            | 1.5483238e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | 0.00241       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.115         |
|    n_updates            | 23250         |
|    policy_gradient_loss | -3.92e-05     |
|    value_loss           | 0.239         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.58e+04      |
|    ep_rew_mean          | 683           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 2336          |
|    time_elapsed         | 4254          |
|    total_timesteps      | 598016        |
| train/                  |               |
|    approx_kl            | 1.0966323e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | -0.0312       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.107         |
|    n_updates            | 23350         |
|    policy_gradient_loss | -1.85e-05     |
|    value_loss           | 0.21          |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.58e+04     |
|    ep_rew_mean          | 683          |
| time/                   |              |
|    fps                  | 140          |
|    iterations           | 2345         |
|    time_elapsed         | 4272         |
|    total_timesteps      | 600320       |
| train/                  |              |
|    approx_kl            | 3.729947e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.89        |
|    explained_variance   | 0.00163      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0488       |
|    n_updates            | 23440        |
|    policy_gradient_loss | -3.46e-05    |
|    value_loss           | 0.0943       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.58e+04      |
|    ep_rew_mean          | 694           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 2354          |
|    time_elapsed         | 4289          |
|    total_timesteps      | 602624        |
| train/                  |               |
|    approx_kl            | 1.5925616e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | -0.0187       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0438        |
|    n_updates            | 23530         |
|    policy_gradient_loss | -2.53e-05     |
|    value_loss           | 0.0939        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.58e+04      |
|    ep_rew_mean          | 694           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 2363          |
|    time_elapsed         | 4306          |
|    total_timesteps      | 604928        |
| train/                  |               |
|    approx_kl            | 1.9860454e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | -0.00018      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0651        |
|    n_updates            | 23620         |
|    policy_gradient_loss | -1.95e-05     |
|    value_loss           | 0.127         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.58e+04      |
|    ep_rew_mean          | 694           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 2372          |
|    time_elapsed         | 4323          |
|    total_timesteps      | 607232        |
| train/                  |               |
|    approx_kl            | 1.0246877e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | -0.013        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0545        |
|    n_updates            | 23710         |
|    policy_gradient_loss | -5.71e-05     |
|    value_loss           | 0.0893        |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.58e+04      |
|    ep_rew_mean          | 694           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 2382          |
|    time_elapsed         | 4342          |
|    total_timesteps      | 609792        |
| train/                  |               |
|    approx_kl            | 6.3260086e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | 0.0357        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.045         |
|    n_updates            | 23810         |
|    policy_gradient_loss | -8.21e-05     |
|    value_loss           | 0.0941        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.58e+04     |
|    ep_rew_mean          | 694          |
| time/                   |              |
|    fps                  | 140          |
|    iterations           | 2391         |
|    time_elapsed         | 4360         |
|    total_timesteps      | 612096       |
| train/                  |              |
|    approx_kl            | 8.381903e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.88        |
|    explained_variance   | -0.0145      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0752       |
|    n_updates            | 23900        |
|    policy_gradient_loss | -1.41e-05    |
|    value_loss           | 0.229        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.58e+04      |
|    ep_rew_mean          | 694           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 2400          |
|    time_elapsed         | 4377          |
|    total_timesteps      | 614400        |
| train/                  |               |
|    approx_kl            | 3.7252903e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | 0.0593        |
|    learning_rate        | 1e-06         |
|    loss                 | 7.62          |
|    n_updates            | 23990         |
|    policy_gradient_loss | -1.49e-05     |
|    value_loss           | 50.8          |
-------------------------------------------
-----------------------------------------
| rollout/                |       

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.58e+04     |
|    ep_rew_mean          | 694          |
| time/                   |              |
|    fps                  | 140          |
|    iterations           | 2409         |
|    time_elapsed         | 4394         |
|    total_timesteps      | 616704       |
| train/                  |              |
|    approx_kl            | 7.748604e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.88        |
|    explained_variance   | -0.000229    |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0373       |
|    n_updates            | 24080        |
|    policy_gradient_loss | -6.14e-05    |
|    value_loss           | 0.0909       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.58e+04      |
|    ep_rew_mean          | 694           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 2418          |
|    time_elapsed         | 4411          |
|    total_timesteps      | 619008        |
| train/                  |               |
|    approx_kl            | 2.6961789e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | 0.127         |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0526        |
|    n_updates            | 24170         |
|    policy_gradient_loss | -4.61e-05     |
|    value_loss           | 0.0955        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.58e+04      |
|    ep_rew_mean          | 694           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 2427          |
|    time_elapsed         | 4429          |
|    total_timesteps      | 621312        |
| train/                  |               |
|    approx_kl            | 1.0170043e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | -0.00315      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0629        |
|    n_updates            | 24260         |
|    policy_gradient_loss | -7.82e-05     |
|    value_loss           | 0.127         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.58e+04      |
|    ep_rew_mean          | 694           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 2436          |
|    time_elapsed         | 4446          |
|    total_timesteps      | 623616        |
| train/                  |               |
|    approx_kl            | 1.5764963e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | 0.0747        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0387        |
|    n_updates            | 24350         |
|    policy_gradient_loss | -0.00018      |
|    value_loss           | 0.105         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 690           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 2445          |
|    time_elapsed         | 4463          |
|    total_timesteps      | 625920        |
| train/                  |               |
|    approx_kl            | 2.6077032e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | 0.114         |
|    learning_rate        | 1e-06         |
|    loss                 | 34.4          |
|    n_updates            | 24440         |
|    policy_gradient_loss | -4.11e-06     |
|    value_loss           | 83.8          |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.6e+04      |
|    ep_rew_mean          | 690          |
| time/                   |              |
|    fps                  | 140          |
|    iterations           | 2454         |
|    time_elapsed         | 4480         |
|    total_timesteps      | 628224       |
| train/                  |              |
|    approx_kl            | 8.146744e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.88        |
|    explained_variance   | -0.00196     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0673       |
|    n_updates            | 24530        |
|    policy_gradient_loss | -0.000104    |
|    value_loss           | 0.13         |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 690           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 2463          |
|    time_elapsed         | 4498          |
|    total_timesteps      | 630528        |
| train/                  |               |
|    approx_kl            | 1.7267419e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | 0.0023        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.059         |
|    n_updates            | 24620         |
|    policy_gradient_loss | -0.000242     |
|    value_loss           | 0.122         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.6e+04      |
|    ep_rew_mean          | 690          |
| time/                   |              |
|    fps                  | 140          |
|    iterations           | 2472         |
|    time_elapsed         | 4515         |
|    total_timesteps      | 632832       |
| train/                  |              |
|    approx_kl            | 9.271316e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.88        |
|    explained_variance   | 0.00023      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0589       |
|    n_updates            | 24710        |
|    policy_gradient_loss | -0.000112    |
|    value_loss           | 0.115        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 690           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 2481          |
|    time_elapsed         | 4532          |
|    total_timesteps      | 635136        |
| train/                  |               |
|    approx_kl            | 2.9965304e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | 0.0288        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.166         |
|    n_updates            | 24800         |
|    policy_gradient_loss | -3.26e-05     |
|    value_loss           | 0.307         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 690           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 2490          |
|    time_elapsed         | 4549          |
|    total_timesteps      | 637440        |
| train/                  |               |
|    approx_kl            | 3.8295984e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | 0.000413      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.103         |
|    n_updates            | 24890         |
|    policy_gradient_loss | -6.08e-05     |
|    value_loss           | 0.216         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 690           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 2499          |
|    time_elapsed         | 4566          |
|    total_timesteps      | 639744        |
| train/                  |               |
|    approx_kl            | 2.4749897e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | 0.0352        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0423        |
|    n_updates            | 24980         |
|    policy_gradient_loss | -2.18e-05     |
|    value_loss           | 0.086         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 689           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 2508          |
|    time_elapsed         | 4584          |
|    total_timesteps      | 642048        |
| train/                  |               |
|    approx_kl            | 5.2154064e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | 0.0562        |
|    learning_rate        | 1e-06         |
|    loss                 | 209           |
|    n_updates            | 25070         |
|    policy_gradient_loss | -1.15e-05     |
|    value_loss           | 558           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 689           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 2517          |
|    time_elapsed         | 4601          |
|    total_timesteps      | 644352        |
| train/                  |               |
|    approx_kl            | 1.0654796e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | 0.00265       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0395        |
|    n_updates            | 25160         |
|    policy_gradient_loss | -0.000215     |
|    value_loss           | 0.0887        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.6e+04      |
|    ep_rew_mean          | 689          |
| time/                   |              |
|    fps                  | 140          |
|    iterations           | 2526         |
|    time_elapsed         | 4618         |
|    total_timesteps      | 646656       |
| train/                  |              |
|    approx_kl            | 8.101342e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.88        |
|    explained_variance   | 0.024        |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0594       |
|    n_updates            | 25250        |
|    policy_gradient_loss | -0.000132    |
|    value_loss           | 0.1          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 689           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 2536          |
|    time_elapsed         | 4637          |
|    total_timesteps      | 649216        |
| train/                  |               |
|    approx_kl            | 1.0244548e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | 0.00441       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0429        |
|    n_updates            | 25350         |
|    policy_gradient_loss | -0.00011      |
|    value_loss           | 0.0926        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.6e+04      |
|    ep_rew_mean          | 689          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 2545         |
|    time_elapsed         | 4654         |
|    total_timesteps      | 651520       |
| train/                  |              |
|    approx_kl            | 3.017485e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.88        |
|    explained_variance   | 0.00499      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.12         |
|    n_updates            | 25440        |
|    policy_gradient_loss | -4.12e-05    |
|    value_loss           | 0.244        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 689           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 2554          |
|    time_elapsed         | 4671          |
|    total_timesteps      | 653824        |
| train/                  |               |
|    approx_kl            | 2.9127114e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | 0.00264       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.104         |
|    n_updates            | 25530         |
|    policy_gradient_loss | -4.84e-05     |
|    value_loss           | 0.209         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.6e+04      |
|    ep_rew_mean          | 689          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 2563         |
|    time_elapsed         | 4688         |
|    total_timesteps      | 656128       |
| train/                  |              |
|    approx_kl            | 7.539056e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.88        |
|    explained_variance   | 0.0232       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0518       |
|    n_updates            | 25620        |
|    policy_gradient_loss | -6.75e-05    |
|    value_loss           | 0.0867       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 689           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 2573          |
|    time_elapsed         | 4706          |
|    total_timesteps      | 658688        |
| train/                  |               |
|    approx_kl            | 4.0745363e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | 0.0185        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0406        |
|    n_updates            | 25720         |
|    policy_gradient_loss | -8.64e-06     |
|    value_loss           | 0.108         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.6e+04      |
|    ep_rew_mean          | 689          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 2582         |
|    time_elapsed         | 4724         |
|    total_timesteps      | 660992       |
| train/                  |              |
|    approx_kl            | 4.954636e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.88        |
|    explained_variance   | 0.000174     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.069        |
|    n_updates            | 25810        |
|    policy_gradient_loss | -8.17e-05    |
|    value_loss           | 0.162        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.6e+04      |
|    ep_rew_mean          | 689          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 2592         |
|    time_elapsed         | 4743         |
|    total_timesteps      | 663552       |
| train/                  |              |
|    approx_kl            | 7.892959e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.88        |
|    explained_variance   | 0.000111     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.06         |
|    n_updates            | 25910        |
|    policy_gradient_loss | -2.37e-06    |
|    value_loss           | 0.114        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.62e+04     |
|    ep_rew_mean          | 687          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 2601         |
|    time_elapsed         | 4759         |
|    total_timesteps      | 665856       |
| train/                  |              |
|    approx_kl            | 6.167684e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.88        |
|    explained_variance   | 6.87e-05     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0687       |
|    n_updates            | 26000        |
|    policy_gradient_loss | -7.39e-05    |
|    value_loss           | 0.115        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.62e+04      |
|    ep_rew_mean          | 687           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 2610          |
|    time_elapsed         | 4776          |
|    total_timesteps      | 668160        |
| train/                  |               |
|    approx_kl            | 5.7695433e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | -0.0698       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0674        |
|    n_updates            | 26090         |
|    policy_gradient_loss | -6.91e-05     |
|    value_loss           | 0.105         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.62e+04     |
|    ep_rew_mean          | 687          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 2619         |
|    time_elapsed         | 4794         |
|    total_timesteps      | 670464       |
| train/                  |              |
|    approx_kl            | 9.429641e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.88        |
|    explained_variance   | -0.0485      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0509       |
|    n_updates            | 26180        |
|    policy_gradient_loss | -5.55e-06    |
|    value_loss           | 0.0948       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.62e+04      |
|    ep_rew_mean          | 687           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 2628          |
|    time_elapsed         | 4810          |
|    total_timesteps      | 672768        |
| train/                  |               |
|    approx_kl            | 7.9674646e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | -0.102        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0428        |
|    n_updates            | 26270         |
|    policy_gradient_loss | -3.52e-05     |
|    value_loss           | 0.111         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.62e+04     |
|    ep_rew_mean          | 687          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 2637         |
|    time_elapsed         | 4827         |
|    total_timesteps      | 675072       |
| train/                  |              |
|    approx_kl            | 6.805407e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.88        |
|    explained_variance   | 0.00302      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0971       |
|    n_updates            | 26360        |
|    policy_gradient_loss | -6.53e-05    |
|    value_loss           | 0.228        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.62e+04     |
|    ep_rew_mean          | 687          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 2646         |
|    time_elapsed         | 4844         |
|    total_timesteps      | 677376       |
| train/                  |              |
|    approx_kl            | 9.776559e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.88        |
|    explained_variance   | -0.000118    |
|    learning_rate        | 1e-06        |
|    loss                 | 0.123        |
|    n_updates            | 26450        |
|    policy_gradient_loss | -7.18e-05    |
|    value_loss           | 0.249        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.62e+04      |
|    ep_rew_mean          | 688           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 2655          |
|    time_elapsed         | 4861          |
|    total_timesteps      | 679680        |
| train/                  |               |
|    approx_kl            | 4.2747706e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | 0.000107      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0848        |
|    n_updates            | 26540         |
|    policy_gradient_loss | -5.51e-05     |
|    value_loss           | 0.138         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.62e+04      |
|    ep_rew_mean          | 688           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 2664          |
|    time_elapsed         | 4878          |
|    total_timesteps      | 681984        |
| train/                  |               |
|    approx_kl            | 4.3283217e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | 0.00062       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0739        |
|    n_updates            | 26630         |
|    policy_gradient_loss | -4.56e-05     |
|    value_loss           | 0.149         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.62e+04      |
|    ep_rew_mean          | 688           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 2673          |
|    time_elapsed         | 4895          |
|    total_timesteps      | 684288        |
| train/                  |               |
|    approx_kl            | 4.3120235e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | 0.000306      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0442        |
|    n_updates            | 26720         |
|    policy_gradient_loss | -8.88e-05     |
|    value_loss           | 0.0888        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.62e+04     |
|    ep_rew_mean          | 688          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 2683         |
|    time_elapsed         | 4913         |
|    total_timesteps      | 686848       |
| train/                  |              |
|    approx_kl            | 8.956995e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.88        |
|    explained_variance   | -0.000348    |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0531       |
|    n_updates            | 26820        |
|    policy_gradient_loss | -0.000106    |
|    value_loss           | 0.0904       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.62e+04      |
|    ep_rew_mean          | 688           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 2692          |
|    time_elapsed         | 4930          |
|    total_timesteps      | 689152        |
| train/                  |               |
|    approx_kl            | 2.7450733e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | 0.000143      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0955        |
|    n_updates            | 26910         |
|    policy_gradient_loss | -3.26e-05     |
|    value_loss           | 0.213         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.62e+04     |
|    ep_rew_mean          | 688          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 2701         |
|    time_elapsed         | 4947         |
|    total_timesteps      | 691456       |
| train/                  |              |
|    approx_kl            | 4.346948e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.88        |
|    explained_variance   | -3.35e-05    |
|    learning_rate        | 1e-06        |
|    loss                 | 0.164        |
|    n_updates            | 27000        |
|    policy_gradient_loss | -3.74e-05    |
|    value_loss           | 0.226        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.62e+04      |
|    ep_rew_mean          | 688           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 2710          |
|    time_elapsed         | 4964          |
|    total_timesteps      | 693760        |
| train/                  |               |
|    approx_kl            | 2.0023435e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | 0.0946        |
|    learning_rate        | 1e-06         |
|    loss                 | 47.6          |
|    n_updates            | 27090         |
|    policy_gradient_loss | 5.28e-06      |
|    value_loss           | 168           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.62e+04    |
|    ep_rew_mean          | 687         |
| time/                   |             |
|    fps                  | 139         |
|    iterations           | 2719        |
|    time_elapsed         | 4981        |
|    total_timesteps      | 696064      |
| train/                  |             |
|    approx_kl            | 7.21775e-09 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -1.88       |
|    explained_variance   | -3.14e-05   |
|    learning_rate        | 1e-06       |
|    loss                 | 442         |
|    n_updates            | 27180       |
|    policy_gradient_loss | -4.37e-07   |
|    value_loss           | 944         |
-----------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.62e+04      |
|    ep_rew_mean          | 687           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 2728          |
|    time_elapsed         | 4998          |
|    total_timesteps      | 698368        |
| train/                  |               |
|    approx_kl            | 8.1490725e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | 0.0392        |
|    learning_rate        | 1e-06         |
|    loss                 | 38.5          |
|    n_updates            | 27270         |
|    policy_gradient_loss | -3.38e-05     |
|    value_loss           | 77.6          |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.62e+04     |
|    ep_rew_mean          | 687          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 2737         |
|    time_elapsed         | 5015         |
|    total_timesteps      | 700672       |
| train/                  |              |
|    approx_kl            | 9.040814e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.88        |
|    explained_variance   | -1.55e-06    |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0721       |
|    n_updates            | 27360        |
|    policy_gradient_loss | -0.000123    |
|    value_loss           | 0.15         |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.62e+04      |
|    ep_rew_mean          | 687           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 2746          |
|    time_elapsed         | 5032          |
|    total_timesteps      | 702976        |
| train/                  |               |
|    approx_kl            | 5.3667463e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | -2.85e-05     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.069         |
|    n_updates            | 27450         |
|    policy_gradient_loss | -0.000165     |
|    value_loss           | 0.16          |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 701           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 2755          |
|    time_elapsed         | 5049          |
|    total_timesteps      | 705280        |
| train/                  |               |
|    approx_kl            | 5.5879354e-09 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | -3.58e-07     |
|    learning_rate        | 1e-06         |
|    loss                 | 472           |
|    n_updates            | 27540         |
|    policy_gradient_loss | -1.13e-06     |
|    value_loss           | 917           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 701           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 2765          |
|    time_elapsed         | 5067          |
|    total_timesteps      | 707840        |
| train/                  |               |
|    approx_kl            | 5.8929436e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | 0.00542       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0478        |
|    n_updates            | 27640         |
|    policy_gradient_loss | -1.7e-05      |
|    value_loss           | 0.121         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 701           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 2774          |
|    time_elapsed         | 5085          |
|    total_timesteps      | 710144        |
| train/                  |               |
|    approx_kl            | 2.7164351e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | -2.21e-05     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0512        |
|    n_updates            | 27730         |
|    policy_gradient_loss | -0.000124     |
|    value_loss           | 0.116         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.6e+04      |
|    ep_rew_mean          | 701          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 2784         |
|    time_elapsed         | 5103         |
|    total_timesteps      | 712704       |
| train/                  |              |
|    approx_kl            | 4.300382e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.87        |
|    explained_variance   | 0.0137       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0496       |
|    n_updates            | 27830        |
|    policy_gradient_loss | -6.15e-05    |
|    value_loss           | 0.107        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.58e+04     |
|    ep_rew_mean          | 698          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 2794         |
|    time_elapsed         | 5122         |
|    total_timesteps      | 715264       |
| train/                  |              |
|    approx_kl            | 8.891802e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.88        |
|    explained_variance   | 0.00022      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0513       |
|    n_updates            | 27930        |
|    policy_gradient_loss | -9.81e-05    |
|    value_loss           | 0.102        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.58e+04      |
|    ep_rew_mean          | 698           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 2803          |
|    time_elapsed         | 5139          |
|    total_timesteps      | 717568        |
| train/                  |               |
|    approx_kl            | 2.1979213e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | -0.073        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0672        |
|    n_updates            | 28020         |
|    policy_gradient_loss | -1.72e-05     |
|    value_loss           | 0.125         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.58e+04      |
|    ep_rew_mean          | 698           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 2812          |
|    time_elapsed         | 5155          |
|    total_timesteps      | 719872        |
| train/                  |               |
|    approx_kl            | 2.3352914e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | -0.0654       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0391        |
|    n_updates            | 28110         |
|    policy_gradient_loss | -3.07e-05     |
|    value_loss           | 0.103         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.58e+04      |
|    ep_rew_mean          | 698           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 2821          |
|    time_elapsed         | 5173          |
|    total_timesteps      | 722176        |
| train/                  |               |
|    approx_kl            | 2.3888424e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | -0.0184       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.128         |
|    n_updates            | 28200         |
|    policy_gradient_loss | -3.62e-05     |
|    value_loss           | 0.231         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.58e+04      |
|    ep_rew_mean          | 698           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 2830          |
|    time_elapsed         | 5188          |
|    total_timesteps      | 724480        |
| train/                  |               |
|    approx_kl            | 5.1339157e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.88         |
|    explained_variance   | -0.0309       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.121         |
|    n_updates            | 28290         |
|    policy_gradient_loss | -5.96e-05     |
|    value_loss           | 0.204         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.58e+04      |
|    ep_rew_mean          | 698           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 2839          |
|    time_elapsed         | 5204          |
|    total_timesteps      | 726784        |
| train/                  |               |
|    approx_kl            | 1.4430843e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | -3.31e-05     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0643        |
|    n_updates            | 28380         |
|    policy_gradient_loss | -0.000138     |
|    value_loss           | 0.187         |
-------------------------------------------
-----------------------------------------
| rollout/                |       

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.58e+04     |
|    ep_rew_mean          | 698          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 2848         |
|    time_elapsed         | 5219         |
|    total_timesteps      | 729088       |
| train/                  |              |
|    approx_kl            | 3.683148e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.87        |
|    explained_variance   | -0.00602     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0519       |
|    n_updates            | 28470        |
|    policy_gradient_loss | -5.23e-05    |
|    value_loss           | 0.105        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.58e+04      |
|    ep_rew_mean          | 698           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 2857          |
|    time_elapsed         | 5236          |
|    total_timesteps      | 731392        |
| train/                  |               |
|    approx_kl            | 1.8114224e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | 0.0234        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0473        |
|    n_updates            | 28560         |
|    policy_gradient_loss | -1.03e-05     |
|    value_loss           | 0.0973        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

--------------------------------------------
| rollout/                |                |
|    ep_len_mean          | 1.58e+04       |
|    ep_rew_mean          | 698            |
| time/                   |                |
|    fps                  | 139            |
|    iterations           | 2866           |
|    time_elapsed         | 5251           |
|    total_timesteps      | 733696         |
| train/                  |                |
|    approx_kl            | 1.04492065e-05 |
|    clip_fraction        | 0              |
|    clip_range           | 0.2            |
|    entropy_loss         | -1.87          |
|    explained_variance   | 0.000135       |
|    learning_rate        | 1e-06          |
|    loss                 | 0.0584         |
|    n_updates            | 28650          |
|    policy_gradient_loss | -0.000154      |
|    value_loss           | 0.131          |
--------------------------------------------
-------------------------------------------
| rollout/ 

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.58e+04      |
|    ep_rew_mean          | 698           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 2875          |
|    time_elapsed         | 5267          |
|    total_timesteps      | 736000        |
| train/                  |               |
|    approx_kl            | 3.4552068e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | -1.67e-05     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0413        |
|    n_updates            | 28740         |
|    policy_gradient_loss | -3.58e-05     |
|    value_loss           | 0.0927        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 694           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 2884          |
|    time_elapsed         | 5283          |
|    total_timesteps      | 738304        |
| train/                  |               |
|    approx_kl            | 2.5383197e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | -0.0275       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.046         |
|    n_updates            | 28830         |
|    policy_gradient_loss | -0.000166     |
|    value_loss           | 0.105         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 694           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 2893          |
|    time_elapsed         | 5299          |
|    total_timesteps      | 740608        |
| train/                  |               |
|    approx_kl            | 1.0336051e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | -0.00711      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0435        |
|    n_updates            | 28920         |
|    policy_gradient_loss | -0.000181     |
|    value_loss           | 0.0881        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 694           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 2903          |
|    time_elapsed         | 5316          |
|    total_timesteps      | 743168        |
| train/                  |               |
|    approx_kl            | 4.2049214e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | -0.0604       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0384        |
|    n_updates            | 29020         |
|    policy_gradient_loss | -5.95e-05     |
|    value_loss           | 0.0922        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 694           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 2912          |
|    time_elapsed         | 5332          |
|    total_timesteps      | 745472        |
| train/                  |               |
|    approx_kl            | 1.0221265e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | 0.0634        |
|    learning_rate        | 1e-06         |
|    loss                 | 230           |
|    n_updates            | 29110         |
|    policy_gradient_loss | 2.37e-05      |
|    value_loss           | 495           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 694           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 2921          |
|    time_elapsed         | 5348          |
|    total_timesteps      | 747776        |
| train/                  |               |
|    approx_kl            | 7.3364936e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | 0.00184       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.133         |
|    n_updates            | 29200         |
|    policy_gradient_loss | -7.63e-05     |
|    value_loss           | 0.217         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.6e+04      |
|    ep_rew_mean          | 694          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 2930         |
|    time_elapsed         | 5364         |
|    total_timesteps      | 750080       |
| train/                  |              |
|    approx_kl            | 3.996771e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.87        |
|    explained_variance   | 0.0213       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.167        |
|    n_updates            | 29290        |
|    policy_gradient_loss | -4.3e-05     |
|    value_loss           | 0.259        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 694           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 2939          |
|    time_elapsed         | 5379          |
|    total_timesteps      | 752384        |
| train/                  |               |
|    approx_kl            | 4.6379864e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | -0.0911       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0531        |
|    n_updates            | 29380         |
|    policy_gradient_loss | -5.11e-05     |
|    value_loss           | 0.122         |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.6e+04      |
|    ep_rew_mean          | 693          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 2948         |
|    time_elapsed         | 5395         |
|    total_timesteps      | 754688       |
| train/                  |              |
|    approx_kl            | 9.399373e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.87        |
|    explained_variance   | 0.0576       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0489       |
|    n_updates            | 29470        |
|    policy_gradient_loss | -0.000127    |
|    value_loss           | 0.107        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 693           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 2958          |
|    time_elapsed         | 5412          |
|    total_timesteps      | 757248        |
| train/                  |               |
|    approx_kl            | 2.1979213e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | 0.111         |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0548        |
|    n_updates            | 29570         |
|    policy_gradient_loss | -3.12e-05     |
|    value_loss           | 0.104         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 693           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 2967          |
|    time_elapsed         | 5428          |
|    total_timesteps      | 759552        |
| train/                  |               |
|    approx_kl            | 2.2421591e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | 0.00486       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0433        |
|    n_updates            | 29660         |
|    policy_gradient_loss | -2.57e-05     |
|    value_loss           | 0.0895        |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 693           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 2976          |
|    time_elapsed         | 5444          |
|    total_timesteps      | 761856        |
| train/                  |               |
|    approx_kl            | 6.2864274e-09 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | 0.0101        |
|    learning_rate        | 1e-06         |
|    loss                 | 461           |
|    n_updates            | 29750         |
|    policy_gradient_loss | -1.68e-06     |
|    value_loss           | 911           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 693           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 2985          |
|    time_elapsed         | 5459          |
|    total_timesteps      | 764160        |
| train/                  |               |
|    approx_kl            | 1.7462298e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | -0.0199       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.122         |
|    n_updates            | 29840         |
|    policy_gradient_loss | -2.07e-05     |
|    value_loss           | 0.261         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 693           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 2994          |
|    time_elapsed         | 5475          |
|    total_timesteps      | 766464        |
| train/                  |               |
|    approx_kl            | 3.2479875e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | -0.00126      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0875        |
|    n_updates            | 29930         |
|    policy_gradient_loss | -6.36e-05     |
|    value_loss           | 0.297         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 693           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 3003          |
|    time_elapsed         | 5490          |
|    total_timesteps      | 768768        |
| train/                  |               |
|    approx_kl            | 3.5623088e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | -0.00833      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0593        |
|    n_updates            | 30020         |
|    policy_gradient_loss | -4.8e-05      |
|    value_loss           | 0.101         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 697           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 3012          |
|    time_elapsed         | 5506          |
|    total_timesteps      | 771072        |
| train/                  |               |
|    approx_kl            | 2.2845343e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | 0.0154        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0471        |
|    n_updates            | 30110         |
|    policy_gradient_loss | -0.000196     |
|    value_loss           | 0.0908        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 697           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 3021          |
|    time_elapsed         | 5522          |
|    total_timesteps      | 773376        |
| train/                  |               |
|    approx_kl            | 5.9837475e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | 0.0464        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0399        |
|    n_updates            | 30200         |
|    policy_gradient_loss | -6.85e-05     |
|    value_loss           | 0.0839        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.6e+04      |
|    ep_rew_mean          | 697          |
| time/                   |              |
|    fps                  | 140          |
|    iterations           | 3030         |
|    time_elapsed         | 5537         |
|    total_timesteps      | 775680       |
| train/                  |              |
|    approx_kl            | 7.187482e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.87        |
|    explained_variance   | 0.000171     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0463       |
|    n_updates            | 30290        |
|    policy_gradient_loss | -6.28e-05    |
|    value_loss           | 0.099        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.6e+04      |
|    ep_rew_mean          | 697          |
| time/                   |              |
|    fps                  | 140          |
|    iterations           | 3040         |
|    time_elapsed         | 5555         |
|    total_timesteps      | 778240       |
| train/                  |              |
|    approx_kl            | 8.312054e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.87        |
|    explained_variance   | 0.0913       |
|    learning_rate        | 1e-06        |
|    loss                 | 325          |
|    n_updates            | 30390        |
|    policy_gradient_loss | -1.65e-05    |
|    value_loss           | 632          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 697           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 3049          |
|    time_elapsed         | 5571          |
|    total_timesteps      | 780544        |
| train/                  |               |
|    approx_kl            | 7.2130933e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | -0.0199       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0932        |
|    n_updates            | 30480         |
|    policy_gradient_loss | -8.29e-05     |
|    value_loss           | 0.2           |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.6e+04      |
|    ep_rew_mean          | 697          |
| time/                   |              |
|    fps                  | 140          |
|    iterations           | 3058         |
|    time_elapsed         | 5586         |
|    total_timesteps      | 782848       |
| train/                  |              |
|    approx_kl            | 1.389999e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.87        |
|    explained_variance   | -0.00475     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0816       |
|    n_updates            | 30570        |
|    policy_gradient_loss | -2.61e-05    |
|    value_loss           | 0.189        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 697           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 3068          |
|    time_elapsed         | 5604          |
|    total_timesteps      | 785408        |
| train/                  |               |
|    approx_kl            | 2.9616058e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | -0.121        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0615        |
|    n_updates            | 30670         |
|    policy_gradient_loss | -3.22e-05     |
|    value_loss           | 0.103         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 693           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 3077          |
|    time_elapsed         | 5619          |
|    total_timesteps      | 787712        |
| train/                  |               |
|    approx_kl            | 2.5890768e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | -0.0206       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.059         |
|    n_updates            | 30760         |
|    policy_gradient_loss | -6.2e-05      |
|    value_loss           | 0.105         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.6e+04     |
|    ep_rew_mean          | 693         |
| time/                   |             |
|    fps                  | 140         |
|    iterations           | 3086        |
|    time_elapsed         | 5636        |
|    total_timesteps      | 790016      |
| train/                  |             |
|    approx_kl            | 4.60539e-07 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -1.87       |
|    explained_variance   | -0.000929   |
|    learning_rate        | 1e-06       |
|    loss                 | 0.0517      |
|    n_updates            | 30850       |
|    policy_gradient_loss | -4.24e-05   |
|    value_loss           | 0.0981      |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.6e

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 693           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 3095          |
|    time_elapsed         | 5652          |
|    total_timesteps      | 792320        |
| train/                  |               |
|    approx_kl            | 1.3047829e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | 0.000474      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0602        |
|    n_updates            | 30940         |
|    policy_gradient_loss | -8.82e-05     |
|    value_loss           | 0.11          |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.6e+04      |
|    ep_rew_mean          | 693          |
| time/                   |              |
|    fps                  | 140          |
|    iterations           | 3104         |
|    time_elapsed         | 5667         |
|    total_timesteps      | 794624       |
| train/                  |              |
|    approx_kl            | 5.772803e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.87        |
|    explained_variance   | 0.00409      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0884       |
|    n_updates            | 31030        |
|    policy_gradient_loss | -0.000272    |
|    value_loss           | 0.172        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.6e+04      |
|    ep_rew_mean          | 693          |
| time/                   |              |
|    fps                  | 140          |
|    iterations           | 3114         |
|    time_elapsed         | 5685         |
|    total_timesteps      | 797184       |
| train/                  |              |
|    approx_kl            | 4.945323e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.87        |
|    explained_variance   | -0.000326    |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0866       |
|    n_updates            | 31130        |
|    policy_gradient_loss | -4.55e-05    |
|    value_loss           | 0.215        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 693           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 3123          |
|    time_elapsed         | 5700          |
|    total_timesteps      | 799488        |
| train/                  |               |
|    approx_kl            | 2.1536835e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | 0.0075        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0504        |
|    n_updates            | 31220         |
|    policy_gradient_loss | -2.83e-05     |
|    value_loss           | 0.122         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 692           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 3133          |
|    time_elapsed         | 5718          |
|    total_timesteps      | 802048        |
| train/                  |               |
|    approx_kl            | 4.6519563e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | 0.000315      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0419        |
|    n_updates            | 31320         |
|    policy_gradient_loss | -6.47e-05     |
|    value_loss           | 0.0923        |
-------------------------------------------
-----------------------------------------
| rollout/                |       

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 692           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 3143          |
|    time_elapsed         | 5736          |
|    total_timesteps      | 804608        |
| train/                  |               |
|    approx_kl            | 4.4726767e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | 0.0262        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0503        |
|    n_updates            | 31420         |
|    policy_gradient_loss | -6.56e-05     |
|    value_loss           | 0.11          |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 692           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 3152          |
|    time_elapsed         | 5751          |
|    total_timesteps      | 806912        |
| train/                  |               |
|    approx_kl            | 2.7008355e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | 0.0181        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0384        |
|    n_updates            | 31510         |
|    policy_gradient_loss | -4.99e-05     |
|    value_loss           | 0.095         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 692           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 3161          |
|    time_elapsed         | 5767          |
|    total_timesteps      | 809216        |
| train/                  |               |
|    approx_kl            | 3.1664968e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | 0.045         |
|    learning_rate        | 1e-06         |
|    loss                 | 155           |
|    n_updates            | 31600         |
|    policy_gradient_loss | 7.13e-06      |
|    value_loss           | 225           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 692           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 3170          |
|    time_elapsed         | 5785          |
|    total_timesteps      | 811520        |
| train/                  |               |
|    approx_kl            | 1.8137507e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | -0.000108     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.106         |
|    n_updates            | 31690         |
|    policy_gradient_loss | -2.07e-05     |
|    value_loss           | 0.253         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

--------------------------------------------
| rollout/                |                |
|    ep_len_mean          | 1.6e+04        |
|    ep_rew_mean          | 692            |
| time/                   |                |
|    fps                  | 140            |
|    iterations           | 3179           |
|    time_elapsed         | 5801           |
|    total_timesteps      | 813824         |
| train/                  |                |
|    approx_kl            | 1.02911144e-07 |
|    clip_fraction        | 0              |
|    clip_range           | 0.2            |
|    entropy_loss         | -1.87          |
|    explained_variance   | -0.0125        |
|    learning_rate        | 1e-06          |
|    loss                 | 0.117          |
|    n_updates            | 31780          |
|    policy_gradient_loss | -8.52e-06      |
|    value_loss           | 0.26           |
--------------------------------------------
-------------------------------------------
| rollout/ 

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 692           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 3188          |
|    time_elapsed         | 5819          |
|    total_timesteps      | 816128        |
| train/                  |               |
|    approx_kl            | 3.5809353e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | 0.00122       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.041         |
|    n_updates            | 31870         |
|    policy_gradient_loss | -3.57e-05     |
|    value_loss           | 0.0877        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 692           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 3197          |
|    time_elapsed         | 5836          |
|    total_timesteps      | 818432        |
| train/                  |               |
|    approx_kl            | 6.2864274e-09 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | 0.0483        |
|    learning_rate        | 1e-06         |
|    loss                 | 576           |
|    n_updates            | 31960         |
|    policy_gradient_loss | 1.6e-07       |
|    value_loss           | 1.08e+03      |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 692           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 3206          |
|    time_elapsed         | 5854          |
|    total_timesteps      | 820736        |
| train/                  |               |
|    approx_kl            | 2.7939677e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | 0.0846        |
|    learning_rate        | 1e-06         |
|    loss                 | 24.1          |
|    n_updates            | 32050         |
|    policy_gradient_loss | 1.44e-06      |
|    value_loss           | 51.5          |
-------------------------------------------
-----------------------------------------
| rollout/                |       

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 692           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 3216          |
|    time_elapsed         | 5872          |
|    total_timesteps      | 823296        |
| train/                  |               |
|    approx_kl            | 1.0764459e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | 0.0147        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0446        |
|    n_updates            | 32150         |
|    policy_gradient_loss | -0.000104     |
|    value_loss           | 0.0918        |
-------------------------------------------
--------------------------------------------
| rollout/                |    

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.6e+04       |
|    ep_rew_mean          | 692           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 3225          |
|    time_elapsed         | 5890          |
|    total_timesteps      | 825600        |
| train/                  |               |
|    approx_kl            | 5.2852556e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | 0.0208        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0512        |
|    n_updates            | 32240         |
|    policy_gradient_loss | -6.68e-05     |
|    value_loss           | 0.113         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.62e+04      |
|    ep_rew_mean          | 693           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 3234          |
|    time_elapsed         | 5907          |
|    total_timesteps      | 827904        |
| train/                  |               |
|    approx_kl            | 5.3364784e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | 0.00399       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0406        |
|    n_updates            | 32330         |
|    policy_gradient_loss | -5.11e-05     |
|    value_loss           | 0.089         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.62e+04      |
|    ep_rew_mean          | 693           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 3244          |
|    time_elapsed         | 5926          |
|    total_timesteps      | 830464        |
| train/                  |               |
|    approx_kl            | 4.0233135e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | -0.0539       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0405        |
|    n_updates            | 32430         |
|    policy_gradient_loss | -6.59e-05     |
|    value_loss           | 0.0885        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.62e+04     |
|    ep_rew_mean          | 693          |
| time/                   |              |
|    fps                  | 140          |
|    iterations           | 3253         |
|    time_elapsed         | 5943         |
|    total_timesteps      | 832768       |
| train/                  |              |
|    approx_kl            | 7.893052e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.87        |
|    explained_variance   | -0.00679     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0616       |
|    n_updates            | 32520        |
|    policy_gradient_loss | -0.000723    |
|    value_loss           | 0.0938       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.62e+04     |
|    ep_rew_mean          | 693          |
| time/                   |              |
|    fps                  | 140          |
|    iterations           | 3262         |
|    time_elapsed         | 5960         |
|    total_timesteps      | 835072       |
| train/                  |              |
|    approx_kl            | 9.429641e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.87        |
|    explained_variance   | 0.0982       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.1          |
|    n_updates            | 32610        |
|    policy_gradient_loss | -3.37e-05    |
|    value_loss           | 0.261        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.62e+04      |
|    ep_rew_mean          | 693           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 3271          |
|    time_elapsed         | 5977          |
|    total_timesteps      | 837376        |
| train/                  |               |
|    approx_kl            | 2.9057264e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | -0.0006       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.104         |
|    n_updates            | 32700         |
|    policy_gradient_loss | -3.48e-05     |
|    value_loss           | 0.213         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.62e+04     |
|    ep_rew_mean          | 693          |
| time/                   |              |
|    fps                  | 140          |
|    iterations           | 3280         |
|    time_elapsed         | 5995         |
|    total_timesteps      | 839680       |
| train/                  |              |
|    approx_kl            | 4.172325e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.87        |
|    explained_variance   | -0.0329      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0482       |
|    n_updates            | 32790        |
|    policy_gradient_loss | -5.56e-05    |
|    value_loss           | 0.143        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.62e+04      |
|    ep_rew_mean          | 693           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 3290          |
|    time_elapsed         | 6015          |
|    total_timesteps      | 842240        |
| train/                  |               |
|    approx_kl            | 4.0908344e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | 0.0264        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0434        |
|    n_updates            | 32890         |
|    policy_gradient_loss | -4.67e-05     |
|    value_loss           | 0.0848        |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.62e+04      |
|    ep_rew_mean          | 693           |
| time/                   |               |
|    fps                  | 140           |
|    iterations           | 3300          |
|    time_elapsed         | 6033          |
|    total_timesteps      | 844800        |
| train/                  |               |
|    approx_kl            | 3.1641684e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | -0.0504       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0376        |
|    n_updates            | 32990         |
|    policy_gradient_loss | -4.83e-05     |
|    value_loss           | 0.0964        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.62e+04      |
|    ep_rew_mean          | 693           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3309          |
|    time_elapsed         | 6050          |
|    total_timesteps      | 847104        |
| train/                  |               |
|    approx_kl            | 9.3807466e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | 0.0189        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0339        |
|    n_updates            | 33080         |
|    policy_gradient_loss | -9.85e-05     |
|    value_loss           | 0.0926        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.62e+04      |
|    ep_rew_mean          | 693           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3318          |
|    time_elapsed         | 6068          |
|    total_timesteps      | 849408        |
| train/                  |               |
|    approx_kl            | 3.5506673e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | -0.0256       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0448        |
|    n_updates            | 33170         |
|    policy_gradient_loss | -4.71e-05     |
|    value_loss           | 0.0885        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.63e+04      |
|    ep_rew_mean          | 695           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3327          |
|    time_elapsed         | 6085          |
|    total_timesteps      | 851712        |
| train/                  |               |
|    approx_kl            | 3.9720908e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | -0.118        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0377        |
|    n_updates            | 33260         |
|    policy_gradient_loss | -7.09e-05     |
|    value_loss           | 0.0878        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.63e+04      |
|    ep_rew_mean          | 695           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3336          |
|    time_elapsed         | 6103          |
|    total_timesteps      | 854016        |
| train/                  |               |
|    approx_kl            | 6.7055225e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | -0.0678       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0544        |
|    n_updates            | 33350         |
|    policy_gradient_loss | -8.68e-05     |
|    value_loss           | 0.0906        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.63e+04      |
|    ep_rew_mean          | 695           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3345          |
|    time_elapsed         | 6120          |
|    total_timesteps      | 856320        |
| train/                  |               |
|    approx_kl            | 1.8510036e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | -0.00355      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0396        |
|    n_updates            | 33440         |
|    policy_gradient_loss | -1.33e-05     |
|    value_loss           | 0.0878        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.63e+04      |
|    ep_rew_mean          | 695           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3354          |
|    time_elapsed         | 6137          |
|    total_timesteps      | 858624        |
| train/                  |               |
|    approx_kl            | 8.1490725e-09 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | 0.00361       |
|    learning_rate        | 1e-06         |
|    loss                 | 383           |
|    n_updates            | 33530         |
|    policy_gradient_loss | -5.85e-08     |
|    value_loss           | 830           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.63e+04      |
|    ep_rew_mean          | 695           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3363          |
|    time_elapsed         | 6155          |
|    total_timesteps      | 860928        |
| train/                  |               |
|    approx_kl            | 1.4947727e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | 0.00396       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.111         |
|    n_updates            | 33620         |
|    policy_gradient_loss | -0.000528     |
|    value_loss           | 0.232         |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.63e+04     |
|    ep_rew_mean          | 695          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 3373         |
|    time_elapsed         | 6174         |
|    total_timesteps      | 863488       |
| train/                  |              |
|    approx_kl            | 6.684568e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.87        |
|    explained_variance   | -0.00403     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0877       |
|    n_updates            | 33720        |
|    policy_gradient_loss | -9.35e-05    |
|    value_loss           | 0.291        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.63e+04      |
|    ep_rew_mean          | 695           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3382          |
|    time_elapsed         | 6191          |
|    total_timesteps      | 865792        |
| train/                  |               |
|    approx_kl            | 3.4761615e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | 0.0307        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0392        |
|    n_updates            | 33810         |
|    policy_gradient_loss | -3.66e-05     |
|    value_loss           | 0.0978        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.63e+04     |
|    ep_rew_mean          | 696          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 3391         |
|    time_elapsed         | 6207         |
|    total_timesteps      | 868096       |
| train/                  |              |
|    approx_kl            | 5.145557e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.87        |
|    explained_variance   | -9.23e-05    |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0386       |
|    n_updates            | 33900        |
|    policy_gradient_loss | -8.22e-05    |
|    value_loss           | 0.1          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.63e+04      |
|    ep_rew_mean          | 696           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3400          |
|    time_elapsed         | 6225          |
|    total_timesteps      | 870400        |
| train/                  |               |
|    approx_kl            | 3.4831464e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | 0.0231        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.036         |
|    n_updates            | 33990         |
|    policy_gradient_loss | -2.25e-05     |
|    value_loss           | 0.0862        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.63e+04     |
|    ep_rew_mean          | 696          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 3409         |
|    time_elapsed         | 6242         |
|    total_timesteps      | 872704       |
| train/                  |              |
|    approx_kl            | 8.693431e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.87        |
|    explained_variance   | -0.0961      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0468       |
|    n_updates            | 34080        |
|    policy_gradient_loss | -0.00013     |
|    value_loss           | 0.0915       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.63e+04      |
|    ep_rew_mean          | 696           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3418          |
|    time_elapsed         | 6259          |
|    total_timesteps      | 875008        |
| train/                  |               |
|    approx_kl            | 5.5879354e-09 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | 0.0418        |
|    learning_rate        | 1e-06         |
|    loss                 | 143           |
|    n_updates            | 34170         |
|    policy_gradient_loss | -1.11e-06     |
|    value_loss           | 301           |
-------------------------------------------
--------------------------------------------
| rollout/                |    

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.63e+04     |
|    ep_rew_mean          | 696          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 3427         |
|    time_elapsed         | 6276         |
|    total_timesteps      | 877312       |
| train/                  |              |
|    approx_kl            | 7.227063e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.87        |
|    explained_variance   | -0.00762     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.117        |
|    n_updates            | 34260        |
|    policy_gradient_loss | -4.61e-05    |
|    value_loss           | 0.233        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.63e+04      |
|    ep_rew_mean          | 696           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3436          |
|    time_elapsed         | 6293          |
|    total_timesteps      | 879616        |
| train/                  |               |
|    approx_kl            | 5.3155236e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | 0.00182       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.096         |
|    n_updates            | 34350         |
|    policy_gradient_loss | -4.8e-05      |
|    value_loss           | 0.196         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.63e+04      |
|    ep_rew_mean          | 696           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3445          |
|    time_elapsed         | 6311          |
|    total_timesteps      | 881920        |
| train/                  |               |
|    approx_kl            | 7.6787546e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | -0.0376       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0471        |
|    n_updates            | 34440         |
|    policy_gradient_loss | -0.000119     |
|    value_loss           | 0.105         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.63e+04     |
|    ep_rew_mean          | 693          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 3455         |
|    time_elapsed         | 6331         |
|    total_timesteps      | 884480       |
| train/                  |              |
|    approx_kl            | 3.760215e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.87        |
|    explained_variance   | 0.115        |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0471       |
|    n_updates            | 34540        |
|    policy_gradient_loss | -2.9e-05     |
|    value_loss           | 0.0825       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.63e+04      |
|    ep_rew_mean          | 693           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3464          |
|    time_elapsed         | 6347          |
|    total_timesteps      | 886784        |
| train/                  |               |
|    approx_kl            | 5.6880526e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | 0.023         |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0456        |
|    n_updates            | 34630         |
|    policy_gradient_loss | -6.75e-05     |
|    value_loss           | 0.085         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.63e+04      |
|    ep_rew_mean          | 693           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3473          |
|    time_elapsed         | 6365          |
|    total_timesteps      | 889088        |
| train/                  |               |
|    approx_kl            | 1.8486753e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | 0.0344        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0373        |
|    n_updates            | 34720         |
|    policy_gradient_loss | -2.09e-05     |
|    value_loss           | 0.0852        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.63e+04     |
|    ep_rew_mean          | 693          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 3482         |
|    time_elapsed         | 6382         |
|    total_timesteps      | 891392       |
| train/                  |              |
|    approx_kl            | 9.010546e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.87        |
|    explained_variance   | 0.0216       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0696       |
|    n_updates            | 34810        |
|    policy_gradient_loss | -1.51e-05    |
|    value_loss           | 0.183        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.63e+04      |
|    ep_rew_mean          | 693           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3491          |
|    time_elapsed         | 6399          |
|    total_timesteps      | 893696        |
| train/                  |               |
|    approx_kl            | 8.2841143e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | -0.00727      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0815        |
|    n_updates            | 34900         |
|    policy_gradient_loss | -0.000111     |
|    value_loss           | 0.222         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.63e+04      |
|    ep_rew_mean          | 697           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3500          |
|    time_elapsed         | 6416          |
|    total_timesteps      | 896000        |
| train/                  |               |
|    approx_kl            | 8.1025064e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | 0.0397        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0316        |
|    n_updates            | 34990         |
|    policy_gradient_loss | -5.41e-06     |
|    value_loss           | 0.0935        |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.63e+04      |
|    ep_rew_mean          | 697           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3509          |
|    time_elapsed         | 6433          |
|    total_timesteps      | 898304        |
| train/                  |               |
|    approx_kl            | 5.1092356e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | 0.00281       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.054         |
|    n_updates            | 35080         |
|    policy_gradient_loss | -6.29e-05     |
|    value_loss           | 0.106         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.63e+04      |
|    ep_rew_mean          | 697           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3518          |
|    time_elapsed         | 6450          |
|    total_timesteps      | 900608        |
| train/                  |               |
|    approx_kl            | 4.0838495e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | -0.0241       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.039         |
|    n_updates            | 35170         |
|    policy_gradient_loss | -4.11e-05     |
|    value_loss           | 0.0887        |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.63e+04      |
|    ep_rew_mean          | 697           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3527          |
|    time_elapsed         | 6467          |
|    total_timesteps      | 902912        |
| train/                  |               |
|    approx_kl            | 1.3548415e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | -0.00334      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0387        |
|    n_updates            | 35260         |
|    policy_gradient_loss | -0.000162     |
|    value_loss           | 0.0882        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.63e+04      |
|    ep_rew_mean          | 697           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3536          |
|    time_elapsed         | 6484          |
|    total_timesteps      | 905216        |
| train/                  |               |
|    approx_kl            | 1.8673018e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 0.00444       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.082         |
|    n_updates            | 35350         |
|    policy_gradient_loss | -3.72e-05     |
|    value_loss           | 0.22          |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.63e+04      |
|    ep_rew_mean          | 697           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3545          |
|    time_elapsed         | 6501          |
|    total_timesteps      | 907520        |
| train/                  |               |
|    approx_kl            | 3.7720893e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 0.000873      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.133         |
|    n_updates            | 35440         |
|    policy_gradient_loss | -8.69e-05     |
|    value_loss           | 0.248         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.63e+04      |
|    ep_rew_mean          | 697           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3554          |
|    time_elapsed         | 6518          |
|    total_timesteps      | 909824        |
| train/                  |               |
|    approx_kl            | 4.7590584e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | 0.000729      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0456        |
|    n_updates            | 35530         |
|    policy_gradient_loss | -3.67e-05     |
|    value_loss           | 0.0894        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.63e+04      |
|    ep_rew_mean          | 697           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3563          |
|    time_elapsed         | 6536          |
|    total_timesteps      | 912128        |
| train/                  |               |
|    approx_kl            | 1.0496005e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | -0.14         |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0365        |
|    n_updates            | 35620         |
|    policy_gradient_loss | -7.77e-05     |
|    value_loss           | 0.0923        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.63e+04      |
|    ep_rew_mean          | 697           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3572          |
|    time_elapsed         | 6553          |
|    total_timesteps      | 914432        |
| train/                  |               |
|    approx_kl            | 3.9534643e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | -0.0746       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0476        |
|    n_updates            | 35710         |
|    policy_gradient_loss | -2.6e-05      |
|    value_loss           | 0.0965        |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.63e+04     |
|    ep_rew_mean          | 697          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 3581         |
|    time_elapsed         | 6570         |
|    total_timesteps      | 916736       |
| train/                  |              |
|    approx_kl            | 7.543713e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.87        |
|    explained_variance   | -0.00114     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0441       |
|    n_updates            | 35800        |
|    policy_gradient_loss | -4.64e-06    |
|    value_loss           | 0.0861       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.64e+04      |
|    ep_rew_mean          | 696           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3590          |
|    time_elapsed         | 6587          |
|    total_timesteps      | 919040        |
| train/                  |               |
|    approx_kl            | 3.8114376e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | -0.00678      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0676        |
|    n_updates            | 35890         |
|    policy_gradient_loss | -5.19e-05     |
|    value_loss           | 0.107         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.64e+04      |
|    ep_rew_mean          | 696           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3599          |
|    time_elapsed         | 6605          |
|    total_timesteps      | 921344        |
| train/                  |               |
|    approx_kl            | 1.0151416e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | 0.0299        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0525        |
|    n_updates            | 35980         |
|    policy_gradient_loss | -1.12e-05     |
|    value_loss           | 0.0875        |
-------------------------------------------
-----------------------------------------
| rollout/                |       

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.64e+04    |
|    ep_rew_mean          | 696         |
| time/                   |             |
|    fps                  | 139         |
|    iterations           | 3608        |
|    time_elapsed         | 6622        |
|    total_timesteps      | 923648      |
| train/                  |             |
|    approx_kl            | 3.17581e-07 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -1.86       |
|    explained_variance   | 0.0678      |
|    learning_rate        | 1e-06       |
|    loss                 | 0.0404      |
|    n_updates            | 36070       |
|    policy_gradient_loss | -2.32e-05   |
|    value_loss           | 0.0868      |
-----------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.64e+04      |
|    ep_rew_mean          | 696           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3617          |
|    time_elapsed         | 6639          |
|    total_timesteps      | 925952        |
| train/                  |               |
|    approx_kl            | 7.8161247e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | -0.0184       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0413        |
|    n_updates            | 36160         |
|    policy_gradient_loss | -8.05e-05     |
|    value_loss           | 0.0881        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.64e+04      |
|    ep_rew_mean          | 696           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3626          |
|    time_elapsed         | 6656          |
|    total_timesteps      | 928256        |
| train/                  |               |
|    approx_kl            | 1.1944212e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | 0.0526        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0717        |
|    n_updates            | 36250         |
|    policy_gradient_loss | -2.55e-05     |
|    value_loss           | 0.199         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.64e+04      |
|    ep_rew_mean          | 696           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3635          |
|    time_elapsed         | 6674          |
|    total_timesteps      | 930560        |
| train/                  |               |
|    approx_kl            | 2.5634654e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | 0.00933       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.144         |
|    n_updates            | 36340         |
|    policy_gradient_loss | -3.15e-05     |
|    value_loss           | 0.262         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.64e+04      |
|    ep_rew_mean          | 696           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3644          |
|    time_elapsed         | 6692          |
|    total_timesteps      | 932864        |
| train/                  |               |
|    approx_kl            | 1.4156103e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | 0.0233        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.047         |
|    n_updates            | 36430         |
|    policy_gradient_loss | -1.47e-05     |
|    value_loss           | 0.11          |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.64e+04     |
|    ep_rew_mean          | 696          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 3653         |
|    time_elapsed         | 6709         |
|    total_timesteps      | 935168       |
| train/                  |              |
|    approx_kl            | 5.043112e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.87        |
|    explained_variance   | -0.00767     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0577       |
|    n_updates            | 36520        |
|    policy_gradient_loss | -7.1e-05     |
|    value_loss           | 0.107        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.64e+04      |
|    ep_rew_mean          | 696           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3662          |
|    time_elapsed         | 6726          |
|    total_timesteps      | 937472        |
| train/                  |               |
|    approx_kl            | 2.7753413e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 0.113         |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0378        |
|    n_updates            | 36610         |
|    policy_gradient_loss | -3.49e-05     |
|    value_loss           | 0.0773        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.64e+04      |
|    ep_rew_mean          | 696           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3671          |
|    time_elapsed         | 6743          |
|    total_timesteps      | 939776        |
| train/                  |               |
|    approx_kl            | 1.2742821e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | -0.122        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0423        |
|    n_updates            | 36700         |
|    policy_gradient_loss | -3.37e-05     |
|    value_loss           | 0.106         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.64e+04     |
|    ep_rew_mean          | 696          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 3680         |
|    time_elapsed         | 6760         |
|    total_timesteps      | 942080       |
| train/                  |              |
|    approx_kl            | 4.975591e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.87        |
|    explained_variance   | 0.000148     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0428       |
|    n_updates            | 36790        |
|    policy_gradient_loss | -5.02e-05    |
|    value_loss           | 0.0882       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.65e+04     |
|    ep_rew_mean          | 696          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 3689         |
|    time_elapsed         | 6777         |
|    total_timesteps      | 944384       |
| train/                  |              |
|    approx_kl            | 2.847053e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.86        |
|    explained_variance   | -0.397       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0669       |
|    n_updates            | 36880        |
|    policy_gradient_loss | -8.2e-05     |
|    value_loss           | 0.141        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 696           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3698          |
|    time_elapsed         | 6794          |
|    total_timesteps      | 946688        |
| train/                  |               |
|    approx_kl            | 1.3627578e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 0.000292      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0454        |
|    n_updates            | 36970         |
|    policy_gradient_loss | -0.000116     |
|    value_loss           | 0.0972        |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 696           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3707          |
|    time_elapsed         | 6811          |
|    total_timesteps      | 948992        |
| train/                  |               |
|    approx_kl            | 1.3525132e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 0.0192        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0443        |
|    n_updates            | 37060         |
|    policy_gradient_loss | -0.000165     |
|    value_loss           | 0.0893        |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 696           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3717          |
|    time_elapsed         | 6831          |
|    total_timesteps      | 951552        |
| train/                  |               |
|    approx_kl            | 4.4633634e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | -0.024        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0424        |
|    n_updates            | 37160         |
|    policy_gradient_loss | -6.85e-05     |
|    value_loss           | 0.0911        |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 696           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3726          |
|    time_elapsed         | 6848          |
|    total_timesteps      | 953856        |
| train/                  |               |
|    approx_kl            | 1.0866206e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | -0.0472       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0956        |
|    n_updates            | 37250         |
|    policy_gradient_loss | -0.000136     |
|    value_loss           | 0.218         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 696           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3735          |
|    time_elapsed         | 6865          |
|    total_timesteps      | 956160        |
| train/                  |               |
|    approx_kl            | 1.0244548e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 0.104         |
|    learning_rate        | 1e-06         |
|    loss                 | 80.2          |
|    n_updates            | 37340         |
|    policy_gradient_loss | -5.68e-06     |
|    value_loss           | 113           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.65e+04     |
|    ep_rew_mean          | 696          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 3744         |
|    time_elapsed         | 6882         |
|    total_timesteps      | 958464       |
| train/                  |              |
|    approx_kl            | 9.613577e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.86        |
|    explained_variance   | 0.0276       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0532       |
|    n_updates            | 37430        |
|    policy_gradient_loss | -0.000119    |
|    value_loss           | 0.0987       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 701           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3753          |
|    time_elapsed         | 6900          |
|    total_timesteps      | 960768        |
| train/                  |               |
|    approx_kl            | 4.5844354e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 0.0424        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0376        |
|    n_updates            | 37520         |
|    policy_gradient_loss | -5.66e-05     |
|    value_loss           | 0.0961        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 701           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3762          |
|    time_elapsed         | 6917          |
|    total_timesteps      | 963072        |
| train/                  |               |
|    approx_kl            | 3.5879202e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 0.0376        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0503        |
|    n_updates            | 37610         |
|    policy_gradient_loss | -5.93e-05     |
|    value_loss           | 0.095         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 701           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3771          |
|    time_elapsed         | 6934          |
|    total_timesteps      | 965376        |
| train/                  |               |
|    approx_kl            | 1.3788231e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 0.0022        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0397        |
|    n_updates            | 37700         |
|    policy_gradient_loss | -0.000139     |
|    value_loss           | 0.0884        |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 701           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3780          |
|    time_elapsed         | 6950          |
|    total_timesteps      | 967680        |
| train/                  |               |
|    approx_kl            | 1.9883737e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 0.0237        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.115         |
|    n_updates            | 37790         |
|    policy_gradient_loss | -2.84e-05     |
|    value_loss           | 0.2           |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 701           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3789          |
|    time_elapsed         | 6967          |
|    total_timesteps      | 969984        |
| train/                  |               |
|    approx_kl            | 3.7625432e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 0.00676       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.133         |
|    n_updates            | 37880         |
|    policy_gradient_loss | -5e-05        |
|    value_loss           | 0.252         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.65e+04     |
|    ep_rew_mean          | 701          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 3799         |
|    time_elapsed         | 6987         |
|    total_timesteps      | 972544       |
| train/                  |              |
|    approx_kl            | 4.353933e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.86        |
|    explained_variance   | 0.000891     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0982       |
|    n_updates            | 37980        |
|    policy_gradient_loss | -3.72e-05    |
|    value_loss           | 0.205        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 701           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3808          |
|    time_elapsed         | 7004          |
|    total_timesteps      | 974848        |
| train/                  |               |
|    approx_kl            | 2.4959445e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | -0.0251       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.043         |
|    n_updates            | 38070         |
|    policy_gradient_loss | -2.21e-05     |
|    value_loss           | 0.0867        |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.65e+04     |
|    ep_rew_mean          | 698          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 3817         |
|    time_elapsed         | 7021         |
|    total_timesteps      | 977152       |
| train/                  |              |
|    approx_kl            | 1.839362e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.86        |
|    explained_variance   | 0.0855       |
|    learning_rate        | 1e-06        |
|    loss                 | 46.8         |
|    n_updates            | 38160        |
|    policy_gradient_loss | -6.18e-06    |
|    value_loss           | 72           |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 698           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3826          |
|    time_elapsed         | 7038          |
|    total_timesteps      | 979456        |
| train/                  |               |
|    approx_kl            | 5.3225085e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | -0.00721      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0433        |
|    n_updates            | 38250         |
|    policy_gradient_loss | -6.88e-05     |
|    value_loss           | 0.0922        |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 698           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3835          |
|    time_elapsed         | 7056          |
|    total_timesteps      | 981760        |
| train/                  |               |
|    approx_kl            | 6.1774626e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 0.000399      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0437        |
|    n_updates            | 38340         |
|    policy_gradient_loss | -0.000261     |
|    value_loss           | 0.0943        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.65e+04     |
|    ep_rew_mean          | 698          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 3844         |
|    time_elapsed         | 7073         |
|    total_timesteps      | 984064       |
| train/                  |              |
|    approx_kl            | 8.100178e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.86        |
|    explained_variance   | 0.173        |
|    learning_rate        | 1e-06        |
|    loss                 | 98.9         |
|    n_updates            | 38430        |
|    policy_gradient_loss | 4.07e-05     |
|    value_loss           | 190          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.65e+04     |
|    ep_rew_mean          | 698          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 3853         |
|    time_elapsed         | 7090         |
|    total_timesteps      | 986368       |
| train/                  |              |
|    approx_kl            | 8.381903e-09 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.86        |
|    explained_variance   | 0.108        |
|    learning_rate        | 1e-06        |
|    loss                 | 95.4         |
|    n_updates            | 38520        |
|    policy_gradient_loss | -3.01e-06    |
|    value_loss           | 169          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 698           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3862          |
|    time_elapsed         | 7107          |
|    total_timesteps      | 988672        |
| train/                  |               |
|    approx_kl            | 2.9597897e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | -0.00833      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.114         |
|    n_updates            | 38610         |
|    policy_gradient_loss | -0.00016      |
|    value_loss           | 0.215         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 698           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3871          |
|    time_elapsed         | 7124          |
|    total_timesteps      | 990976        |
| train/                  |               |
|    approx_kl            | 7.0780516e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | -0.0355       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0421        |
|    n_updates            | 38700         |
|    policy_gradient_loss | -5.92e-05     |
|    value_loss           | 0.0903        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 698           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3880          |
|    time_elapsed         | 7141          |
|    total_timesteps      | 993280        |
| train/                  |               |
|    approx_kl            | 4.6077184e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | -0.022        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0516        |
|    n_updates            | 38790         |
|    policy_gradient_loss | -4.81e-05     |
|    value_loss           | 0.0961        |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 698           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3889          |
|    time_elapsed         | 7158          |
|    total_timesteps      | 995584        |
| train/                  |               |
|    approx_kl            | 3.5602134e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | -0.187        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0445        |
|    n_updates            | 38880         |
|    policy_gradient_loss | -9.98e-05     |
|    value_loss           | 0.0925        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 698           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3898          |
|    time_elapsed         | 7175          |
|    total_timesteps      | 997888        |
| train/                  |               |
|    approx_kl            | 6.0882885e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 0.000505      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0414        |
|    n_updates            | 38970         |
|    policy_gradient_loss | -0.000209     |
|    value_loss           | 0.0901        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 698           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3907          |
|    time_elapsed         | 7192          |
|    total_timesteps      | 1000192       |
| train/                  |               |
|    approx_kl            | 3.9115548e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 0.0935        |
|    learning_rate        | 1e-06         |
|    loss                 | 347           |
|    n_updates            | 39060         |
|    policy_gradient_loss | -9.34e-06     |
|    value_loss           | 960           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 698           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3916          |
|    time_elapsed         | 7209          |
|    total_timesteps      | 1002496       |
| train/                  |               |
|    approx_kl            | 1.1096708e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 6.74e-05      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0975        |
|    n_updates            | 39150         |
|    policy_gradient_loss | -0.000147     |
|    value_loss           | 0.247         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 698           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3925          |
|    time_elapsed         | 7226          |
|    total_timesteps      | 1004800       |
| train/                  |               |
|    approx_kl            | 5.2317046e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 8.31e-05      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0911        |
|    n_updates            | 39240         |
|    policy_gradient_loss | -7.2e-05      |
|    value_loss           | 0.227         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 698           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3934          |
|    time_elapsed         | 7242          |
|    total_timesteps      | 1007104       |
| train/                  |               |
|    approx_kl            | 3.3993274e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | -5.07e-05     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0765        |
|    n_updates            | 39330         |
|    policy_gradient_loss | 1.5e-06       |
|    value_loss           | 0.159         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 698           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3943          |
|    time_elapsed         | 7259          |
|    total_timesteps      | 1009408       |
| train/                  |               |
|    approx_kl            | 4.6612695e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 0.000335      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.039         |
|    n_updates            | 39420         |
|    policy_gradient_loss | -4.77e-05     |
|    value_loss           | 0.0906        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 698           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3952          |
|    time_elapsed         | 7276          |
|    total_timesteps      | 1011712       |
| train/                  |               |
|    approx_kl            | 2.6565976e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | -0.0806       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0489        |
|    n_updates            | 39510         |
|    policy_gradient_loss | -2.62e-05     |
|    value_loss           | 0.102         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.66e+04      |
|    ep_rew_mean          | 700           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3961          |
|    time_elapsed         | 7293          |
|    total_timesteps      | 1014016       |
| train/                  |               |
|    approx_kl            | 1.2130477e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 0.00373       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0481        |
|    n_updates            | 39600         |
|    policy_gradient_loss | -3.22e-05     |
|    value_loss           | 0.119         |
-------------------------------------------
------------------------------------------
| rollout/                |      

----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.66e+04   |
|    ep_rew_mean          | 700        |
| time/                   |            |
|    fps                  | 139        |
|    iterations           | 3970       |
|    time_elapsed         | 7310       |
|    total_timesteps      | 1016320    |
| train/                  |            |
|    approx_kl            | 2.8871e-07 |
|    clip_fraction        | 0          |
|    clip_range           | 0.2        |
|    entropy_loss         | -1.86      |
|    explained_variance   | -0.0526    |
|    learning_rate        | 1e-06      |
|    loss                 | 0.0473     |
|    n_updates            | 39690      |
|    policy_gradient_loss | -3.31e-05  |
|    value_loss           | 0.0931     |
----------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.66e+04      |
|    ep

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.66e+04      |
|    ep_rew_mean          | 700           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 3980          |
|    time_elapsed         | 7329          |
|    total_timesteps      | 1018880       |
| train/                  |               |
|    approx_kl            | 7.8231096e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 0.146         |
|    learning_rate        | 1e-06         |
|    loss                 | 70.6          |
|    n_updates            | 39790         |
|    policy_gradient_loss | 1.06e-05      |
|    value_loss           | 138           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.66e+04      |
|    ep_rew_mean          | 700           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 3989          |
|    time_elapsed         | 7346          |
|    total_timesteps      | 1021184       |
| train/                  |               |
|    approx_kl            | 5.2480027e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 0.00354       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0417        |
|    n_updates            | 39880         |
|    policy_gradient_loss | -3.92e-05     |
|    value_loss           | 0.0879        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.66e+04     |
|    ep_rew_mean          | 700          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 3998         |
|    time_elapsed         | 7363         |
|    total_timesteps      | 1023488      |
| train/                  |              |
|    approx_kl            | 7.003546e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.86        |
|    explained_variance   | -8.25e-05    |
|    learning_rate        | 1e-06        |
|    loss                 | 0.116        |
|    n_updates            | 39970        |
|    policy_gradient_loss | -0.000125    |
|    value_loss           | 0.245        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.66e+04     |
|    ep_rew_mean          | 700          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 4007         |
|    time_elapsed         | 7380         |
|    total_timesteps      | 1025792      |
| train/                  |              |
|    approx_kl            | 4.172325e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.86        |
|    explained_variance   | -0.00637     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.122        |
|    n_updates            | 40060        |
|    policy_gradient_loss | -3.7e-05     |
|    value_loss           | 0.213        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.66e+04     |
|    ep_rew_mean          | 700          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 4017         |
|    time_elapsed         | 7398         |
|    total_timesteps      | 1028352      |
| train/                  |              |
|    approx_kl            | 5.355105e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.86        |
|    explained_variance   | -0.0233      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0389       |
|    n_updates            | 40160        |
|    policy_gradient_loss | -3.97e-05    |
|    value_loss           | 0.0887       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.66e+04      |
|    ep_rew_mean          | 700           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4026          |
|    time_elapsed         | 7416          |
|    total_timesteps      | 1030656       |
| train/                  |               |
|    approx_kl            | 4.5076013e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | -0.0373       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0438        |
|    n_updates            | 40250         |
|    policy_gradient_loss | -5.06e-05     |
|    value_loss           | 0.0912        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.66e+04      |
|    ep_rew_mean          | 700           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4035          |
|    time_elapsed         | 7432          |
|    total_timesteps      | 1032960       |
| train/                  |               |
|    approx_kl            | 2.8242357e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | -0.00198      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0503        |
|    n_updates            | 40340         |
|    policy_gradient_loss | -3.63e-05     |
|    value_loss           | 0.0907        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.66e+04      |
|    ep_rew_mean          | 700           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4044          |
|    time_elapsed         | 7449          |
|    total_timesteps      | 1035264       |
| train/                  |               |
|    approx_kl            | 4.4563785e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | -0.00375      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0488        |
|    n_updates            | 40430         |
|    policy_gradient_loss | -4.1e-05      |
|    value_loss           | 0.0922        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.67e+04     |
|    ep_rew_mean          | 697          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 4053         |
|    time_elapsed         | 7466         |
|    total_timesteps      | 1037568      |
| train/                  |              |
|    approx_kl            | 8.312054e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.86        |
|    explained_variance   | 0.0774       |
|    learning_rate        | 1e-06        |
|    loss                 | 465          |
|    n_updates            | 40520        |
|    policy_gradient_loss | 1.79e-05     |
|    value_loss           | 856          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.67e+04      |
|    ep_rew_mean          | 697           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4062          |
|    time_elapsed         | 7482          |
|    total_timesteps      | 1039872       |
| train/                  |               |
|    approx_kl            | 7.4054115e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | -0.00287      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0323        |
|    n_updates            | 40610         |
|    policy_gradient_loss | -0.000147     |
|    value_loss           | 0.0884        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.67e+04      |
|    ep_rew_mean          | 697           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4071          |
|    time_elapsed         | 7500          |
|    total_timesteps      | 1042176       |
| train/                  |               |
|    approx_kl            | 1.1133961e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 0.000153      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0445        |
|    n_updates            | 40700         |
|    policy_gradient_loss | -0.000141     |
|    value_loss           | 0.0937        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.67e+04      |
|    ep_rew_mean          | 697           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4080          |
|    time_elapsed         | 7517          |
|    total_timesteps      | 1044480       |
| train/                  |               |
|    approx_kl            | 2.3236498e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 0.000572      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0594        |
|    n_updates            | 40790         |
|    policy_gradient_loss | -4.78e-05     |
|    value_loss           | 0.108         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.67e+04      |
|    ep_rew_mean          | 697           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4089          |
|    time_elapsed         | 7533          |
|    total_timesteps      | 1046784       |
| train/                  |               |
|    approx_kl            | 1.0011718e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 0.151         |
|    learning_rate        | 1e-06         |
|    loss                 | 93.7          |
|    n_updates            | 40880         |
|    policy_gradient_loss | -2.17e-07     |
|    value_loss           | 163           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.67e+04      |
|    ep_rew_mean          | 697           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4098          |
|    time_elapsed         | 7550          |
|    total_timesteps      | 1049088       |
| train/                  |               |
|    approx_kl            | 1.3574027e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 0.00195       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0953        |
|    n_updates            | 40970         |
|    policy_gradient_loss | -1.43e-05     |
|    value_loss           | 0.241         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.67e+04     |
|    ep_rew_mean          | 697          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 4107         |
|    time_elapsed         | 7568         |
|    total_timesteps      | 1051392      |
| train/                  |              |
|    approx_kl            | 6.065238e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.86        |
|    explained_variance   | 0.00269      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0387       |
|    n_updates            | 41060        |
|    policy_gradient_loss | -7e-05       |
|    value_loss           | 0.0863       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

--------------------------------------------
| rollout/                |                |
|    ep_len_mean          | 1.67e+04       |
|    ep_rew_mean          | 697            |
| time/                   |                |
|    fps                  | 138            |
|    iterations           | 4116           |
|    time_elapsed         | 7585           |
|    total_timesteps      | 1053696        |
| train/                  |                |
|    approx_kl            | 1.21071935e-08 |
|    clip_fraction        | 0              |
|    clip_range           | 0.2            |
|    entropy_loss         | -1.86          |
|    explained_variance   | 0.00829        |
|    learning_rate        | 1e-06          |
|    loss                 | 319            |
|    n_updates            | 41150          |
|    policy_gradient_loss | 1.74e-07       |
|    value_loss           | 646            |
--------------------------------------------
-------------------------------------------
| rollout/ 

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.67e+04      |
|    ep_rew_mean          | 697           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4125          |
|    time_elapsed         | 7602          |
|    total_timesteps      | 1056000       |
| train/                  |               |
|    approx_kl            | 3.3085234e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 0.00352       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.05          |
|    n_updates            | 41240         |
|    policy_gradient_loss | -6.54e-05     |
|    value_loss           | 0.0988        |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.67e+04      |
|    ep_rew_mean          | 697           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4134          |
|    time_elapsed         | 7619          |
|    total_timesteps      | 1058304       |
| train/                  |               |
|    approx_kl            | 2.2700988e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 0.0863        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0346        |
|    n_updates            | 41330         |
|    policy_gradient_loss | -4.6e-05      |
|    value_loss           | 0.0892        |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.67e+04      |
|    ep_rew_mean          | 697           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4143          |
|    time_elapsed         | 7637          |
|    total_timesteps      | 1060608       |
| train/                  |               |
|    approx_kl            | 5.3085387e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 0.0575        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0419        |
|    n_updates            | 41420         |
|    policy_gradient_loss | -6.74e-05     |
|    value_loss           | 0.0849        |
-------------------------------------------
-----------------------------------------
| rollout/                |       

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.68e+04      |
|    ep_rew_mean          | 695           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4152          |
|    time_elapsed         | 7652          |
|    total_timesteps      | 1062912       |
| train/                  |               |
|    approx_kl            | 1.9976869e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | -0.132        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0586        |
|    n_updates            | 41510         |
|    policy_gradient_loss | -3e-05        |
|    value_loss           | 0.108         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.68e+04      |
|    ep_rew_mean          | 695           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4161          |
|    time_elapsed         | 7668          |
|    total_timesteps      | 1065216       |
| train/                  |               |
|    approx_kl            | 6.9476664e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | -0.105        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.043         |
|    n_updates            | 41600         |
|    policy_gradient_loss | -7.4e-05      |
|    value_loss           | 0.108         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.68e+04    |
|    ep_rew_mean          | 695         |
| time/                   |             |
|    fps                  | 138         |
|    iterations           | 4170        |
|    time_elapsed         | 7684        |
|    total_timesteps      | 1067520     |
| train/                  |             |
|    approx_kl            | 7.62986e-07 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -1.86       |
|    explained_variance   | -0.0438     |
|    learning_rate        | 1e-06       |
|    loss                 | 0.0431      |
|    n_updates            | 41690       |
|    policy_gradient_loss | -8.89e-05   |
|    value_loss           | 0.0893      |
-----------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.68e+04      |
|    ep_rew_mean          | 695           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4180          |
|    time_elapsed         | 7704          |
|    total_timesteps      | 1070080       |
| train/                  |               |
|    approx_kl            | 1.0477379e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 0.147         |
|    learning_rate        | 1e-06         |
|    loss                 | 27.2          |
|    n_updates            | 41790         |
|    policy_gradient_loss | -2.92e-06     |
|    value_loss           | 55            |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.68e+04      |
|    ep_rew_mean          | 695           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4189          |
|    time_elapsed         | 7721          |
|    total_timesteps      | 1072384       |
| train/                  |               |
|    approx_kl            | 1.9860454e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | 0.00152       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.119         |
|    n_updates            | 41880         |
|    policy_gradient_loss | -1.04e-05     |
|    value_loss           | 0.226         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.68e+04     |
|    ep_rew_mean          | 695          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 4198         |
|    time_elapsed         | 7738         |
|    total_timesteps      | 1074688      |
| train/                  |              |
|    approx_kl            | 4.156027e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.86        |
|    explained_variance   | 0.0111       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.126        |
|    n_updates            | 41970        |
|    policy_gradient_loss | -5.78e-05    |
|    value_loss           | 0.214        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.68e+04     |
|    ep_rew_mean          | 695          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 4208         |
|    time_elapsed         | 7756         |
|    total_timesteps      | 1077248      |
| train/                  |              |
|    approx_kl            | 3.192108e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | -0.0556      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.036        |
|    n_updates            | 42070        |
|    policy_gradient_loss | -3.61e-05    |
|    value_loss           | 0.0852       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.68e+04     |
|    ep_rew_mean          | 695          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 4217         |
|    time_elapsed         | 7773         |
|    total_timesteps      | 1079552      |
| train/                  |              |
|    approx_kl            | 9.778887e-09 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.86        |
|    explained_variance   | 0.000373     |
|    learning_rate        | 1e-06        |
|    loss                 | 100          |
|    n_updates            | 42160        |
|    policy_gradient_loss | -1.31e-06    |
|    value_loss           | 282          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.68e+04     |
|    ep_rew_mean          | 695          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 4226         |
|    time_elapsed         | 7790         |
|    total_timesteps      | 1081856      |
| train/                  |              |
|    approx_kl            | 3.787456e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.86        |
|    explained_variance   | -0.00355     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0374       |
|    n_updates            | 42250        |
|    policy_gradient_loss | -0.000141    |
|    value_loss           | 0.0992       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.68e+04      |
|    ep_rew_mean          | 695           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4236          |
|    time_elapsed         | 7807          |
|    total_timesteps      | 1084416       |
| train/                  |               |
|    approx_kl            | 8.1094913e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 0.000414      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0388        |
|    n_updates            | 42350         |
|    policy_gradient_loss | -5.91e-05     |
|    value_loss           | 0.0881        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.68e+04      |
|    ep_rew_mean          | 695           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4245          |
|    time_elapsed         | 7823          |
|    total_timesteps      | 1086720       |
| train/                  |               |
|    approx_kl            | 2.7776696e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 0.00241       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.119         |
|    n_updates            | 42440         |
|    policy_gradient_loss | -4.21e-05     |
|    value_loss           | 0.265         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.68e+04      |
|    ep_rew_mean          | 695           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4254          |
|    time_elapsed         | 7839          |
|    total_timesteps      | 1089024       |
| train/                  |               |
|    approx_kl            | 2.2584572e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 0.00807       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0998        |
|    n_updates            | 42530         |
|    policy_gradient_loss | -2.33e-05     |
|    value_loss           | 0.221         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.68e+04      |
|    ep_rew_mean          | 695           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4263          |
|    time_elapsed         | 7855          |
|    total_timesteps      | 1091328       |
| train/                  |               |
|    approx_kl            | 6.1118044e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | 0.0048        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0425        |
|    n_updates            | 42620         |
|    policy_gradient_loss | -8.64e-05     |
|    value_loss           | 0.103         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.68e+04     |
|    ep_rew_mean          | 695          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 4272         |
|    time_elapsed         | 7871         |
|    total_timesteps      | 1093632      |
| train/                  |              |
|    approx_kl            | 7.371418e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.86        |
|    explained_variance   | -0.000167    |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0673       |
|    n_updates            | 42710        |
|    policy_gradient_loss | -9.3e-05     |
|    value_loss           | 0.127        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.68e+04      |
|    ep_rew_mean          | 698           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4281          |
|    time_elapsed         | 7887          |
|    total_timesteps      | 1095936       |
| train/                  |               |
|    approx_kl            | 1.6554259e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | 0.393         |
|    learning_rate        | 1e-06         |
|    loss                 | 0.185         |
|    n_updates            | 42800         |
|    policy_gradient_loss | -3.11e-05     |
|    value_loss           | 1.32          |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.68e+04      |
|    ep_rew_mean          | 698           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4290          |
|    time_elapsed         | 7902          |
|    total_timesteps      | 1098240       |
| train/                  |               |
|    approx_kl            | 4.8428774e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 0.219         |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0455        |
|    n_updates            | 42890         |
|    policy_gradient_loss | -1.06e-05     |
|    value_loss           | 0.073         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.68e+04     |
|    ep_rew_mean          | 698          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 4299         |
|    time_elapsed         | 7919         |
|    total_timesteps      | 1100544      |
| train/                  |              |
|    approx_kl            | 4.270114e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.86        |
|    explained_variance   | 0.0262       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0526       |
|    n_updates            | 42980        |
|    policy_gradient_loss | -6.1e-05     |
|    value_loss           | 0.0936       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.68e+04     |
|    ep_rew_mean          | 698          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 4309         |
|    time_elapsed         | 7937         |
|    total_timesteps      | 1103104      |
| train/                  |              |
|    approx_kl            | 5.378388e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.86        |
|    explained_variance   | 0.0245       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.034        |
|    n_updates            | 43080        |
|    policy_gradient_loss | -5.83e-05    |
|    value_loss           | 0.0867       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.67e+04      |
|    ep_rew_mean          | 699           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4318          |
|    time_elapsed         | 7952          |
|    total_timesteps      | 1105408       |
| train/                  |               |
|    approx_kl            | 1.4551915e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 0.0139        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0598        |
|    n_updates            | 43170         |
|    policy_gradient_loss | -2.03e-05     |
|    value_loss           | 0.123         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.67e+04      |
|    ep_rew_mean          | 699           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 4327          |
|    time_elapsed         | 7968          |
|    total_timesteps      | 1107712       |
| train/                  |               |
|    approx_kl            | 4.9360096e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 0.0255        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0384        |
|    n_updates            | 43260         |
|    policy_gradient_loss | -7.1e-05      |
|    value_loss           | 0.0847        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.67e+04      |
|    ep_rew_mean          | 699           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 4336          |
|    time_elapsed         | 7985          |
|    total_timesteps      | 1110016       |
| train/                  |               |
|    approx_kl            | 3.0221418e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | -0.000278     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0471        |
|    n_updates            | 43350         |
|    policy_gradient_loss | -2.5e-05      |
|    value_loss           | 0.0893        |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.67e+04      |
|    ep_rew_mean          | 699           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 4345          |
|    time_elapsed         | 8000          |
|    total_timesteps      | 1112320       |
| train/                  |               |
|    approx_kl            | 7.0547685e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | -0.0751       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0919        |
|    n_updates            | 43440         |
|    policy_gradient_loss | -1.37e-05     |
|    value_loss           | 0.207         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.67e+04      |
|    ep_rew_mean          | 699           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 4354          |
|    time_elapsed         | 8016          |
|    total_timesteps      | 1114624       |
| train/                  |               |
|    approx_kl            | 1.6693957e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 0.0365        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.173         |
|    n_updates            | 43530         |
|    policy_gradient_loss | -4.17e-05     |
|    value_loss           | 0.341         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.67e+04      |
|    ep_rew_mean          | 699           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 4363          |
|    time_elapsed         | 8032          |
|    total_timesteps      | 1116928       |
| train/                  |               |
|    approx_kl            | 5.2852556e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | -0.0848       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0842        |
|    n_updates            | 43620         |
|    policy_gradient_loss | -1.67e-06     |
|    value_loss           | 0.174         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.67e+04      |
|    ep_rew_mean          | 699           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 4372          |
|    time_elapsed         | 8048          |
|    total_timesteps      | 1119232       |
| train/                  |               |
|    approx_kl            | 3.3830293e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | -0.0249       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0633        |
|    n_updates            | 43710         |
|    policy_gradient_loss | -6.44e-05     |
|    value_loss           | 0.0967        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.67e+04     |
|    ep_rew_mean          | 696          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 4381         |
|    time_elapsed         | 8065         |
|    total_timesteps      | 1121536      |
| train/                  |              |
|    approx_kl            | 6.861519e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.86        |
|    explained_variance   | 0.103        |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0556       |
|    n_updates            | 43800        |
|    policy_gradient_loss | -8.69e-05    |
|    value_loss           | 0.0925       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.67e+04    |
|    ep_rew_mean          | 696         |
| time/                   |             |
|    fps                  | 139         |
|    iterations           | 4390        |
|    time_elapsed         | 8081        |
|    total_timesteps      | 1123840     |
| train/                  |             |
|    approx_kl            | 6.67735e-06 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -1.86       |
|    explained_variance   | -0.245      |
|    learning_rate        | 1e-06       |
|    loss                 | 0.0516      |
|    n_updates            | 43890       |
|    policy_gradient_loss | -0.000171   |
|    value_loss           | 0.104       |
-----------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.67e+04     |
|    ep_rew_mean          | 696          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 4399         |
|    time_elapsed         | 8096         |
|    total_timesteps      | 1126144      |
| train/                  |              |
|    approx_kl            | 1.071021e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.86        |
|    explained_variance   | 0.212        |
|    learning_rate        | 1e-06        |
|    loss                 | 46.9         |
|    n_updates            | 43980        |
|    policy_gradient_loss | -1.69e-06    |
|    value_loss           | 96           |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.67e+04      |
|    ep_rew_mean          | 696           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 4408          |
|    time_elapsed         | 8112          |
|    total_timesteps      | 1128448       |
| train/                  |               |
|    approx_kl            | 1.1650845e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 0.007         |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0767        |
|    n_updates            | 44070         |
|    policy_gradient_loss | -3.37e-05     |
|    value_loss           | 0.202         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.67e+04     |
|    ep_rew_mean          | 696          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 4417         |
|    time_elapsed         | 8129         |
|    total_timesteps      | 1130752      |
| train/                  |              |
|    approx_kl            | 8.195639e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.86        |
|    explained_variance   | 0.0644       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.138        |
|    n_updates            | 44160        |
|    policy_gradient_loss | -3.99e-06    |
|    value_loss           | 0.23         |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.67e+04      |
|    ep_rew_mean          | 696           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 4426          |
|    time_elapsed         | 8146          |
|    total_timesteps      | 1133056       |
| train/                  |               |
|    approx_kl            | 4.3492764e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | 0.0442        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0611        |
|    n_updates            | 44250         |
|    policy_gradient_loss | -6.38e-05     |
|    value_loss           | 0.133         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.67e+04     |
|    ep_rew_mean          | 696          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 4435         |
|    time_elapsed         | 8163         |
|    total_timesteps      | 1135360      |
| train/                  |              |
|    approx_kl            | 5.757902e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | -0.000201    |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0492       |
|    n_updates            | 44340        |
|    policy_gradient_loss | -4.06e-05    |
|    value_loss           | 0.101        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.67e+04     |
|    ep_rew_mean          | 693          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 4444         |
|    time_elapsed         | 8181         |
|    total_timesteps      | 1137664      |
| train/                  |              |
|    approx_kl            | 1.557637e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | 0.00892      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0465       |
|    n_updates            | 44430        |
|    policy_gradient_loss | -1.67e-05    |
|    value_loss           | 0.12         |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.67e+04      |
|    ep_rew_mean          | 693           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 4453          |
|    time_elapsed         | 8198          |
|    total_timesteps      | 1139968       |
| train/                  |               |
|    approx_kl            | 5.6577846e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | 0.0117        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0436        |
|    n_updates            | 44520         |
|    policy_gradient_loss | -9.25e-05     |
|    value_loss           | 0.0982        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.67e+04      |
|    ep_rew_mean          | 693           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 4462          |
|    time_elapsed         | 8216          |
|    total_timesteps      | 1142272       |
| train/                  |               |
|    approx_kl            | 1.3584038e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | -0.0611       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0418        |
|    n_updates            | 44610         |
|    policy_gradient_loss | -0.000143     |
|    value_loss           | 0.0887        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.66e+04     |
|    ep_rew_mean          | 703          |
| time/                   |              |
|    fps                  | 139          |
|    iterations           | 4471         |
|    time_elapsed         | 8233         |
|    total_timesteps      | 1144576      |
| train/                  |              |
|    approx_kl            | 5.122274e-09 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | 0.000967     |
|    learning_rate        | 1e-06        |
|    loss                 | 365          |
|    n_updates            | 44700        |
|    policy_gradient_loss | -4.16e-07    |
|    value_loss           | 799          |
------------------------------------------
--------------------------------------------
| rollout/                |                |
|    ep

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.66e+04      |
|    ep_rew_mean          | 703           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 4480          |
|    time_elapsed         | 8250          |
|    total_timesteps      | 1146880       |
| train/                  |               |
|    approx_kl            | 2.4144538e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | -0.000336     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0506        |
|    n_updates            | 44790         |
|    policy_gradient_loss | -2.41e-05     |
|    value_loss           | 0.123         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.66e+04      |
|    ep_rew_mean          | 703           |
| time/                   |               |
|    fps                  | 139           |
|    iterations           | 4489          |
|    time_elapsed         | 8267          |
|    total_timesteps      | 1149184       |
| train/                  |               |
|    approx_kl            | 1.4784746e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | -0.00124      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0585        |
|    n_updates            | 44880         |
|    policy_gradient_loss | -1.11e-05     |
|    value_loss           | 0.0955        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.66e+04     |
|    ep_rew_mean          | 703          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 4499         |
|    time_elapsed         | 8287         |
|    total_timesteps      | 1151744      |
| train/                  |              |
|    approx_kl            | 3.047753e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | 0.0025       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0522       |
|    n_updates            | 44980        |
|    policy_gradient_loss | -2.57e-05    |
|    value_loss           | 0.106        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.66e+04      |
|    ep_rew_mean          | 703           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4508          |
|    time_elapsed         | 8304          |
|    total_timesteps      | 1154048       |
| train/                  |               |
|    approx_kl            | 3.4319237e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | -0.00894      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.129         |
|    n_updates            | 45070         |
|    policy_gradient_loss | -5.1e-05      |
|    value_loss           | 0.282         |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.66e+04     |
|    ep_rew_mean          | 703          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 4517         |
|    time_elapsed         | 8321         |
|    total_timesteps      | 1156352      |
| train/                  |              |
|    approx_kl            | 1.610443e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | -0.00846     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.107        |
|    n_updates            | 45160        |
|    policy_gradient_loss | -9.57e-05    |
|    value_loss           | 0.223        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.66e+04      |
|    ep_rew_mean          | 703           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4527          |
|    time_elapsed         | 8340          |
|    total_timesteps      | 1158912       |
| train/                  |               |
|    approx_kl            | 4.4121407e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | -0.16         |
|    learning_rate        | 1e-06         |
|    loss                 | 0.065         |
|    n_updates            | 45260         |
|    policy_gradient_loss | -4.18e-05     |
|    value_loss           | 0.114         |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.66e+04     |
|    ep_rew_mean          | 703          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 4537         |
|    time_elapsed         | 8359         |
|    total_timesteps      | 1161472      |
| train/                  |              |
|    approx_kl            | 2.195593e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | -0.183       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0415       |
|    n_updates            | 45360        |
|    policy_gradient_loss | -4.61e-05    |
|    value_loss           | 0.0963       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.66e+04     |
|    ep_rew_mean          | 703          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 4546         |
|    time_elapsed         | 8376         |
|    total_timesteps      | 1163776      |
| train/                  |              |
|    approx_kl            | 6.335322e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | 0.00101      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0464       |
|    n_updates            | 45450        |
|    policy_gradient_loss | -6.15e-05    |
|    value_loss           | 0.0935       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.66e+04     |
|    ep_rew_mean          | 703          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 4555         |
|    time_elapsed         | 8393         |
|    total_timesteps      | 1166080      |
| train/                  |              |
|    approx_kl            | 5.280599e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | -0.1         |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0452       |
|    n_updates            | 45540        |
|    policy_gradient_loss | -6.29e-05    |
|    value_loss           | 0.0935       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.67e+04     |
|    ep_rew_mean          | 702          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 4564         |
|    time_elapsed         | 8410         |
|    total_timesteps      | 1168384      |
| train/                  |              |
|    approx_kl            | 6.216578e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | -0.000168    |
|    learning_rate        | 1e-06        |
|    loss                 | 0.461        |
|    n_updates            | 45630        |
|    policy_gradient_loss | -1.14e-05    |
|    value_loss           | 0.947        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.67e+04      |
|    ep_rew_mean          | 702           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4573          |
|    time_elapsed         | 8428          |
|    total_timesteps      | 1170688       |
| train/                  |               |
|    approx_kl            | 2.6868656e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | -0.0202       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0397        |
|    n_updates            | 45720         |
|    policy_gradient_loss | -3.63e-05     |
|    value_loss           | 0.0998        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.67e+04     |
|    ep_rew_mean          | 702          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 4582         |
|    time_elapsed         | 8445         |
|    total_timesteps      | 1172992      |
| train/                  |              |
|    approx_kl            | 3.692694e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | -0.0041      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0408       |
|    n_updates            | 45810        |
|    policy_gradient_loss | -3.76e-05    |
|    value_loss           | 0.0883       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.67e+04      |
|    ep_rew_mean          | 702           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4592          |
|    time_elapsed         | 8464          |
|    total_timesteps      | 1175552       |
| train/                  |               |
|    approx_kl            | 3.2177195e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | 0.00221       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0444        |
|    n_updates            | 45910         |
|    policy_gradient_loss | -4.27e-05     |
|    value_loss           | 0.0871        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

--------------------------------------------
| rollout/                |                |
|    ep_len_mean          | 1.67e+04       |
|    ep_rew_mean          | 702            |
| time/                   |                |
|    fps                  | 138            |
|    iterations           | 4601           |
|    time_elapsed         | 8481           |
|    total_timesteps      | 1177856        |
| train/                  |                |
|    approx_kl            | 1.09896064e-07 |
|    clip_fraction        | 0              |
|    clip_range           | 0.2            |
|    entropy_loss         | -1.85          |
|    explained_variance   | -0.0539        |
|    learning_rate        | 1e-06          |
|    loss                 | 0.131          |
|    n_updates            | 46000          |
|    policy_gradient_loss | -1.61e-05      |
|    value_loss           | 0.228          |
--------------------------------------------
-------------------------------------------
| rollout/ 

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.67e+04      |
|    ep_rew_mean          | 702           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4610          |
|    time_elapsed         | 8499          |
|    total_timesteps      | 1180160       |
| train/                  |               |
|    approx_kl            | 3.6600977e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | -0.0146       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.181         |
|    n_updates            | 46090         |
|    policy_gradient_loss | -4.84e-05     |
|    value_loss           | 0.257         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.67e+04      |
|    ep_rew_mean          | 702           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4619          |
|    time_elapsed         | 8516          |
|    total_timesteps      | 1182464       |
| train/                  |               |
|    approx_kl            | 3.5064295e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | 0.0222        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.052         |
|    n_updates            | 46180         |
|    policy_gradient_loss | -5.04e-05     |
|    value_loss           | 0.103         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.67e+04     |
|    ep_rew_mean          | 702          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 4629         |
|    time_elapsed         | 8535         |
|    total_timesteps      | 1185024      |
| train/                  |              |
|    approx_kl            | 3.259629e-09 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | 0.0022       |
|    learning_rate        | 1e-06        |
|    loss                 | 407          |
|    n_updates            | 46280        |
|    policy_gradient_loss | -1.02e-06    |
|    value_loss           | 767          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.67e+04      |
|    ep_rew_mean          | 702           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4639          |
|    time_elapsed         | 8554          |
|    total_timesteps      | 1187584       |
| train/                  |               |
|    approx_kl            | 1.6693957e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | 0.0685        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0527        |
|    n_updates            | 46380         |
|    policy_gradient_loss | -1.2e-05      |
|    value_loss           | 0.0986        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.67e+04     |
|    ep_rew_mean          | 702          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 4648         |
|    time_elapsed         | 8571         |
|    total_timesteps      | 1189888      |
| train/                  |              |
|    approx_kl            | 6.922055e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | 0.00231      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0428       |
|    n_updates            | 46470        |
|    policy_gradient_loss | -6.49e-05    |
|    value_loss           | 0.0873       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.67e+04    |
|    ep_rew_mean          | 702         |
| time/                   |             |
|    fps                  | 138         |
|    iterations           | 4658        |
|    time_elapsed         | 8591        |
|    total_timesteps      | 1192448     |
| train/                  |             |
|    approx_kl            | 6.33765e-07 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -1.85       |
|    explained_variance   | -0.00123    |
|    learning_rate        | 1e-06       |
|    loss                 | 0.0476      |
|    n_updates            | 46570       |
|    policy_gradient_loss | -7.25e-05   |
|    value_loss           | 0.0938      |
-----------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.66e+04      |
|    ep_rew_mean          | 707           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4667          |
|    time_elapsed         | 8608          |
|    total_timesteps      | 1194752       |
| train/                  |               |
|    approx_kl            | 4.5145862e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | 0.221         |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0447        |
|    n_updates            | 46660         |
|    policy_gradient_loss | -4.87e-05     |
|    value_loss           | 0.0903        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.66e+04      |
|    ep_rew_mean          | 707           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4676          |
|    time_elapsed         | 8625          |
|    total_timesteps      | 1197056       |
| train/                  |               |
|    approx_kl            | 3.8184226e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | -0.00441      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0545        |
|    n_updates            | 46750         |
|    policy_gradient_loss | -8.82e-06     |
|    value_loss           | 0.128         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.66e+04     |
|    ep_rew_mean          | 707          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 4685         |
|    time_elapsed         | 8642         |
|    total_timesteps      | 1199360      |
| train/                  |              |
|    approx_kl            | 3.883615e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | -0.000754    |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0554       |
|    n_updates            | 46840        |
|    policy_gradient_loss | -5.38e-05    |
|    value_loss           | 0.0983       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.66e+04      |
|    ep_rew_mean          | 707           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4694          |
|    time_elapsed         | 8660          |
|    total_timesteps      | 1201664       |
| train/                  |               |
|    approx_kl            | 8.5355714e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | -0.00206      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0633        |
|    n_updates            | 46930         |
|    policy_gradient_loss | -7.85e-05     |
|    value_loss           | 0.0948        |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.65e+04     |
|    ep_rew_mean          | 710          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 4704         |
|    time_elapsed         | 8678         |
|    total_timesteps      | 1204224      |
| train/                  |              |
|    approx_kl            | 9.080395e-09 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | 0.0908       |
|    learning_rate        | 1e-06        |
|    loss                 | 461          |
|    n_updates            | 47030        |
|    policy_gradient_loss | 3.49e-07     |
|    value_loss           | 931          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

--------------------------------------------
| rollout/                |                |
|    ep_len_mean          | 1.65e+04       |
|    ep_rew_mean          | 710            |
| time/                   |                |
|    fps                  | 138            |
|    iterations           | 4713           |
|    time_elapsed         | 8695           |
|    total_timesteps      | 1206528        |
| train/                  |                |
|    approx_kl            | 1.14087015e-07 |
|    clip_fraction        | 0              |
|    clip_range           | 0.2            |
|    entropy_loss         | -1.85          |
|    explained_variance   | -0.00555       |
|    learning_rate        | 1e-06          |
|    loss                 | 0.0466         |
|    n_updates            | 47120          |
|    policy_gradient_loss | -3.83e-06      |
|    value_loss           | 0.0968         |
--------------------------------------------
-------------------------------------------
| rollout/ 

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 710           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4722          |
|    time_elapsed         | 8712          |
|    total_timesteps      | 1208832       |
| train/                  |               |
|    approx_kl            | 4.8452057e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | 0.0234        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0424        |
|    n_updates            | 47210         |
|    policy_gradient_loss | -8.92e-05     |
|    value_loss           | 0.088         |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.65e+04     |
|    ep_rew_mean          | 710          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 4731         |
|    time_elapsed         | 8730         |
|    total_timesteps      | 1211136      |
| train/                  |              |
|    approx_kl            | 5.177455e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | 0.00352      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0362       |
|    n_updates            | 47300        |
|    policy_gradient_loss | -0.000165    |
|    value_loss           | 0.0905       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.65e+04     |
|    ep_rew_mean          | 710          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 4740         |
|    time_elapsed         | 8747         |
|    total_timesteps      | 1213440      |
| train/                  |              |
|    approx_kl            | 7.096678e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | 0.000916     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.134        |
|    n_updates            | 47390        |
|    policy_gradient_loss | -8.69e-05    |
|    value_loss           | 0.248        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 710           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4749          |
|    time_elapsed         | 8764          |
|    total_timesteps      | 1215744       |
| train/                  |               |
|    approx_kl            | 4.5751221e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | -0.0125       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.149         |
|    n_updates            | 47480         |
|    policy_gradient_loss | -5.6e-05      |
|    value_loss           | 0.283         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.64e+04      |
|    ep_rew_mean          | 711           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4758          |
|    time_elapsed         | 8781          |
|    total_timesteps      | 1218048       |
| train/                  |               |
|    approx_kl            | 4.5984052e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | -0.169        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0651        |
|    n_updates            | 47570         |
|    policy_gradient_loss | -5.03e-05     |
|    value_loss           | 0.102         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.64e+04      |
|    ep_rew_mean          | 711           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4767          |
|    time_elapsed         | 8799          |
|    total_timesteps      | 1220352       |
| train/                  |               |
|    approx_kl            | 1.1173543e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | 0.0201        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0352        |
|    n_updates            | 47660         |
|    policy_gradient_loss | -0.000124     |
|    value_loss           | 0.0956        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.64e+04      |
|    ep_rew_mean          | 711           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4776          |
|    time_elapsed         | 8816          |
|    total_timesteps      | 1222656       |
| train/                  |               |
|    approx_kl            | 1.5094411e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | 0.00321       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0457        |
|    n_updates            | 47750         |
|    policy_gradient_loss | -0.00016      |
|    value_loss           | 0.0884        |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.64e+04     |
|    ep_rew_mean          | 711          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 4786         |
|    time_elapsed         | 8835         |
|    total_timesteps      | 1225216      |
| train/                  |              |
|    approx_kl            | 7.497147e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | 0.185        |
|    learning_rate        | 1e-06        |
|    loss                 | 207          |
|    n_updates            | 47850        |
|    policy_gradient_loss | 1.62e-05     |
|    value_loss           | 406          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.64e+04     |
|    ep_rew_mean          | 711          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 4795         |
|    time_elapsed         | 8852         |
|    total_timesteps      | 1227520      |
| train/                  |              |
|    approx_kl            | 6.756745e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | 0.000325     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.11         |
|    n_updates            | 47940        |
|    policy_gradient_loss | -6.96e-05    |
|    value_loss           | 0.226        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.64e+04      |
|    ep_rew_mean          | 711           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4804          |
|    time_elapsed         | 8869          |
|    total_timesteps      | 1229824       |
| train/                  |               |
|    approx_kl            | 1.0011718e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | 0.0108        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.104         |
|    n_updates            | 48030         |
|    policy_gradient_loss | -2.15e-05     |
|    value_loss           | 0.23          |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.64e+04      |
|    ep_rew_mean          | 711           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4813          |
|    time_elapsed         | 8887          |
|    total_timesteps      | 1232128       |
| train/                  |               |
|    approx_kl            | 1.9394793e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | 0.113         |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0405        |
|    n_updates            | 48120         |
|    policy_gradient_loss | -5.89e-05     |
|    value_loss           | 0.0798        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.64e+04      |
|    ep_rew_mean          | 711           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4822          |
|    time_elapsed         | 8904          |
|    total_timesteps      | 1234432       |
| train/                  |               |
|    approx_kl            | 1.5925616e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | -0.0636       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0439        |
|    n_updates            | 48210         |
|    policy_gradient_loss | -3.68e-05     |
|    value_loss           | 0.107         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.64e+04     |
|    ep_rew_mean          | 711          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 4831         |
|    time_elapsed         | 8921         |
|    total_timesteps      | 1236736      |
| train/                  |              |
|    approx_kl            | 5.213078e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | -0.0211      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0408       |
|    n_updates            | 48300        |
|    policy_gradient_loss | -0.000228    |
|    value_loss           | 0.0897       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.64e+04      |
|    ep_rew_mean          | 711           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4840          |
|    time_elapsed         | 8938          |
|    total_timesteps      | 1239040       |
| train/                  |               |
|    approx_kl            | 2.0489097e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | -0.00184      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0514        |
|    n_updates            | 48390         |
|    policy_gradient_loss | -1.39e-05     |
|    value_loss           | 0.101         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 711           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4849          |
|    time_elapsed         | 8956          |
|    total_timesteps      | 1241344       |
| train/                  |               |
|    approx_kl            | 4.1676685e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | 0.108         |
|    learning_rate        | 1e-06         |
|    loss                 | 565           |
|    n_updates            | 48480         |
|    policy_gradient_loss | 8.36e-07      |
|    value_loss           | 1.22e+03      |
-------------------------------------------
-----------------------------------------
| rollout/                |       

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 711           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4858          |
|    time_elapsed         | 8973          |
|    total_timesteps      | 1243648       |
| train/                  |               |
|    approx_kl            | 3.0570664e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | 0.0425        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0416        |
|    n_updates            | 48570         |
|    policy_gradient_loss | -2.53e-05     |
|    value_loss           | 0.0857        |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 711           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4867          |
|    time_elapsed         | 8990          |
|    total_timesteps      | 1245952       |
| train/                  |               |
|    approx_kl            | 5.0570816e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | -0.0387       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.037         |
|    n_updates            | 48660         |
|    policy_gradient_loss | -5.98e-05     |
|    value_loss           | 0.0882        |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.65e+04     |
|    ep_rew_mean          | 711          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 4876         |
|    time_elapsed         | 9007         |
|    total_timesteps      | 1248256      |
| train/                  |              |
|    approx_kl            | 4.898757e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | 0.0677       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0322       |
|    n_updates            | 48750        |
|    policy_gradient_loss | -5.53e-05    |
|    value_loss           | 0.102        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 711           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4885          |
|    time_elapsed         | 9025          |
|    total_timesteps      | 1250560       |
| train/                  |               |
|    approx_kl            | 1.1338852e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | -0.0167       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.135         |
|    n_updates            | 48840         |
|    policy_gradient_loss | -2.4e-05      |
|    value_loss           | 0.251         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 711           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4894          |
|    time_elapsed         | 9042          |
|    total_timesteps      | 1252864       |
| train/                  |               |
|    approx_kl            | 2.3981556e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | 0.000525      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.159         |
|    n_updates            | 48930         |
|    policy_gradient_loss | -1.45e-05     |
|    value_loss           | 0.225         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.65e+04    |
|    ep_rew_mean          | 711         |
| time/                   |             |
|    fps                  | 138         |
|    iterations           | 4903        |
|    time_elapsed         | 9059        |
|    total_timesteps      | 1255168     |
| train/                  |             |
|    approx_kl            | 4.60539e-07 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -1.85       |
|    explained_variance   | 0.000646    |
|    learning_rate        | 1e-06       |
|    loss                 | 0.0382      |
|    n_updates            | 49020       |
|    policy_gradient_loss | -4.5e-05    |
|    value_loss           | 0.0872      |
-----------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.65e+04     |
|    ep_rew_mean          | 711          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 4912         |
|    time_elapsed         | 9076         |
|    total_timesteps      | 1257472      |
| train/                  |              |
|    approx_kl            | 9.313226e-09 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | 0.126        |
|    learning_rate        | 1e-06        |
|    loss                 | 642          |
|    n_updates            | 49110        |
|    policy_gradient_loss | -1.57e-06    |
|    value_loss           | 1.27e+03     |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.65e+04     |
|    ep_rew_mean          | 711          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 4921         |
|    time_elapsed         | 9093         |
|    total_timesteps      | 1259776      |
| train/                  |              |
|    approx_kl            | 6.421469e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | 0.0927       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0439       |
|    n_updates            | 49200        |
|    policy_gradient_loss | -7.92e-05    |
|    value_loss           | 0.0894       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.65e+04     |
|    ep_rew_mean          | 711          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 4930         |
|    time_elapsed         | 9111         |
|    total_timesteps      | 1262080      |
| train/                  |              |
|    approx_kl            | 4.558824e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | -0.00154     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0433       |
|    n_updates            | 49290        |
|    policy_gradient_loss | -3.47e-05    |
|    value_loss           | 0.0891       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.65e+04      |
|    ep_rew_mean          | 711           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4939          |
|    time_elapsed         | 9128          |
|    total_timesteps      | 1264384       |
| train/                  |               |
|    approx_kl            | 2.5052577e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | 0.00621       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0526        |
|    n_updates            | 49380         |
|    policy_gradient_loss | -7.07e-05     |
|    value_loss           | 0.088         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.66e+04      |
|    ep_rew_mean          | 708           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4948          |
|    time_elapsed         | 9144          |
|    total_timesteps      | 1266688       |
| train/                  |               |
|    approx_kl            | 2.5404152e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | -0.0162       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0445        |
|    n_updates            | 49470         |
|    policy_gradient_loss | -0.000132     |
|    value_loss           | 0.0875        |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.66e+04      |
|    ep_rew_mean          | 708           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4957          |
|    time_elapsed         | 9161          |
|    total_timesteps      | 1268992       |
| train/                  |               |
|    approx_kl            | 5.0477684e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | 0.000228      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0426        |
|    n_updates            | 49560         |
|    policy_gradient_loss | -5.32e-05     |
|    value_loss           | 0.0879        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.66e+04      |
|    ep_rew_mean          | 708           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4966          |
|    time_elapsed         | 9179          |
|    total_timesteps      | 1271296       |
| train/                  |               |
|    approx_kl            | 1.9138679e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | 0.0164        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0535        |
|    n_updates            | 49650         |
|    policy_gradient_loss | -4.33e-05     |
|    value_loss           | 0.109         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.66e+04     |
|    ep_rew_mean          | 708          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 4975         |
|    time_elapsed         | 9196         |
|    total_timesteps      | 1273600      |
| train/                  |              |
|    approx_kl            | 7.916242e-09 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | 0.108        |
|    learning_rate        | 1e-06        |
|    loss                 | 260          |
|    n_updates            | 49740        |
|    policy_gradient_loss | -7.66e-07    |
|    value_loss           | 581          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.66e+04      |
|    ep_rew_mean          | 708           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 4984          |
|    time_elapsed         | 9213          |
|    total_timesteps      | 1275904       |
| train/                  |               |
|    approx_kl            | 4.4330955e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | 0.00687       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.152         |
|    n_updates            | 49830         |
|    policy_gradient_loss | -5.7e-05      |
|    value_loss           | 0.218         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.66e+04     |
|    ep_rew_mean          | 708          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 4993         |
|    time_elapsed         | 9230         |
|    total_timesteps      | 1278208      |
| train/                  |              |
|    approx_kl            | 7.392373e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | 0.0103       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.129        |
|    n_updates            | 49920        |
|    policy_gradient_loss | -9.12e-05    |
|    value_loss           | 0.208        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.66e+04     |
|    ep_rew_mean          | 708          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 5002         |
|    time_elapsed         | 9248         |
|    total_timesteps      | 1280512      |
| train/                  |              |
|    approx_kl            | 8.966308e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | 0.000314     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0588       |
|    n_updates            | 50010        |
|    policy_gradient_loss | -0.000102    |
|    value_loss           | 0.0941       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.66e+04      |
|    ep_rew_mean          | 708           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 5011          |
|    time_elapsed         | 9265          |
|    total_timesteps      | 1282816       |
| train/                  |               |
|    approx_kl            | 2.9453076e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | 0.249         |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0322        |
|    n_updates            | 50100         |
|    policy_gradient_loss | -5.06e-05     |
|    value_loss           | 0.0717        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.66e+04     |
|    ep_rew_mean          | 708          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 5020         |
|    time_elapsed         | 9282         |
|    total_timesteps      | 1285120      |
| train/                  |              |
|    approx_kl            | 2.544839e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | 0.0405       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0432       |
|    n_updates            | 50190        |
|    policy_gradient_loss | -4.02e-05    |
|    value_loss           | 0.0839       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.66e+04      |
|    ep_rew_mean          | 708           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 5029          |
|    time_elapsed         | 9299          |
|    total_timesteps      | 1287424       |
| train/                  |               |
|    approx_kl            | 3.1874515e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | 0.000164      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0419        |
|    n_updates            | 50280         |
|    policy_gradient_loss | -4.48e-05     |
|    value_loss           | 0.0924        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.67e+04      |
|    ep_rew_mean          | 709           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 5038          |
|    time_elapsed         | 9316          |
|    total_timesteps      | 1289728       |
| train/                  |               |
|    approx_kl            | 1.1175871e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | 0.0554        |
|    learning_rate        | 1e-06         |
|    loss                 | 130           |
|    n_updates            | 50370         |
|    policy_gradient_loss | -3.37e-06     |
|    value_loss           | 312           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.67e+04      |
|    ep_rew_mean          | 709           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 5047          |
|    time_elapsed         | 9334          |
|    total_timesteps      | 1292032       |
| train/                  |               |
|    approx_kl            | 2.5168993e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | 0.0377        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0462        |
|    n_updates            | 50460         |
|    policy_gradient_loss | -5.69e-05     |
|    value_loss           | 0.0894        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.67e+04      |
|    ep_rew_mean          | 709           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 5056          |
|    time_elapsed         | 9351          |
|    total_timesteps      | 1294336       |
| train/                  |               |
|    approx_kl            | 1.1478551e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | 0.183         |
|    learning_rate        | 1e-06         |
|    loss                 | 78.5          |
|    n_updates            | 50550         |
|    policy_gradient_loss | -2.08e-05     |
|    value_loss           | 168           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.67e+04      |
|    ep_rew_mean          | 709           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 5065          |
|    time_elapsed         | 9368          |
|    total_timesteps      | 1296640       |
| train/                  |               |
|    approx_kl            | 3.2358803e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | -0.00813      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0457        |
|    n_updates            | 50640         |
|    policy_gradient_loss | -9.81e-05     |
|    value_loss           | 0.0963        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.67e+04      |
|    ep_rew_mean          | 709           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 5074          |
|    time_elapsed         | 9385          |
|    total_timesteps      | 1298944       |
| train/                  |               |
|    approx_kl            | 1.4142133e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | -0.000291     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.124         |
|    n_updates            | 50730         |
|    policy_gradient_loss | -0.000131     |
|    value_loss           | 0.231         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.67e+04     |
|    ep_rew_mean          | 709          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 5083         |
|    time_elapsed         | 9402         |
|    total_timesteps      | 1301248      |
| train/                  |              |
|    approx_kl            | 5.699694e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | -0.00761     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.146        |
|    n_updates            | 50820        |
|    policy_gradient_loss | -5.77e-05    |
|    value_loss           | 0.24         |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.67e+04     |
|    ep_rew_mean          | 709          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 5092         |
|    time_elapsed         | 9419         |
|    total_timesteps      | 1303552      |
| train/                  |              |
|    approx_kl            | 1.099892e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | 0.04         |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0417       |
|    n_updates            | 50910        |
|    policy_gradient_loss | -0.000121    |
|    value_loss           | 0.085        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.67e+04     |
|    ep_rew_mean          | 709          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 5101         |
|    time_elapsed         | 9436         |
|    total_timesteps      | 1305856      |
| train/                  |              |
|    approx_kl            | 4.377216e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | -0.0721      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0391       |
|    n_updates            | 51000        |
|    policy_gradient_loss | -1.24e-06    |
|    value_loss           | 0.131        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.67e+04     |
|    ep_rew_mean          | 709          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 5110         |
|    time_elapsed         | 9453         |
|    total_timesteps      | 1308160      |
| train/                  |              |
|    approx_kl            | 1.701992e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | -0.0276      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0481       |
|    n_updates            | 51090        |
|    policy_gradient_loss | -2.8e-05     |
|    value_loss           | 0.0949       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.67e+04      |
|    ep_rew_mean          | 709           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 5119          |
|    time_elapsed         | 9471          |
|    total_timesteps      | 1310464       |
| train/                  |               |
|    approx_kl            | 1.0111835e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | -0.0542       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0421        |
|    n_updates            | 51180         |
|    policy_gradient_loss | -0.000105     |
|    value_loss           | 0.0893        |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.67e+04      |
|    ep_rew_mean          | 709           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 5129          |
|    time_elapsed         | 9489          |
|    total_timesteps      | 1313024       |
| train/                  |               |
|    approx_kl            | 1.5213154e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | 1.52e-05      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0515        |
|    n_updates            | 51280         |
|    policy_gradient_loss | -0.000123     |
|    value_loss           | 0.101         |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.68e+04     |
|    ep_rew_mean          | 709          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 5138         |
|    time_elapsed         | 9506         |
|    total_timesteps      | 1315328      |
| train/                  |              |
|    approx_kl            | 4.323665e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | -0.00499     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0472       |
|    n_updates            | 51370        |
|    policy_gradient_loss | -4.55e-05    |
|    value_loss           | 0.091        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.68e+04      |
|    ep_rew_mean          | 709           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 5147          |
|    time_elapsed         | 9523          |
|    total_timesteps      | 1317632       |
| train/                  |               |
|    approx_kl            | 6.3795596e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | -0.076        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0527        |
|    n_updates            | 51460         |
|    policy_gradient_loss | -7.57e-05     |
|    value_loss           | 0.095         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.68e+04      |
|    ep_rew_mean          | 709           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 5156          |
|    time_elapsed         | 9540          |
|    total_timesteps      | 1319936       |
| train/                  |               |
|    approx_kl            | 8.5355714e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | -0.000835     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0399        |
|    n_updates            | 51550         |
|    policy_gradient_loss | -9.63e-05     |
|    value_loss           | 0.0875        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.68e+04     |
|    ep_rew_mean          | 709          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 5165         |
|    time_elapsed         | 9558         |
|    total_timesteps      | 1322240      |
| train/                  |              |
|    approx_kl            | 7.892959e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | -0.0511      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0844       |
|    n_updates            | 51640        |
|    policy_gradient_loss | -1.97e-05    |
|    value_loss           | 0.206        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.68e+04     |
|    ep_rew_mean          | 709          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 5175         |
|    time_elapsed         | 9576         |
|    total_timesteps      | 1324800      |
| train/                  |              |
|    approx_kl            | 2.477318e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | -0.00161     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.122        |
|    n_updates            | 51740        |
|    policy_gradient_loss | -3.12e-05    |
|    value_loss           | 0.245        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.68e+04      |
|    ep_rew_mean          | 709           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 5184          |
|    time_elapsed         | 9593          |
|    total_timesteps      | 1327104       |
| train/                  |               |
|    approx_kl            | 1.2947712e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | 9.54e-07      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0384        |
|    n_updates            | 51830         |
|    policy_gradient_loss | -0.000165     |
|    value_loss           | 0.0931        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

--------------------------------------------
| rollout/                |                |
|    ep_len_mean          | 1.68e+04       |
|    ep_rew_mean          | 709            |
| time/                   |                |
|    fps                  | 138            |
|    iterations           | 5193           |
|    time_elapsed         | 9610           |
|    total_timesteps      | 1329408        |
| train/                  |                |
|    approx_kl            | 1.17812306e-07 |
|    clip_fraction        | 0              |
|    clip_range           | 0.2            |
|    entropy_loss         | -1.85          |
|    explained_variance   | 0.413          |
|    learning_rate        | 1e-06          |
|    loss                 | 3.49           |
|    n_updates            | 51920          |
|    policy_gradient_loss | 2.5e-05        |
|    value_loss           | 24.6           |
--------------------------------------------
-------------------------------------------
| rollout/ 

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.68e+04     |
|    ep_rew_mean          | 709          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 5202         |
|    time_elapsed         | 9628         |
|    total_timesteps      | 1331712      |
| train/                  |              |
|    approx_kl            | 4.749745e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | 0.127        |
|    learning_rate        | 1e-06        |
|    loss                 | 82.3         |
|    n_updates            | 52010        |
|    policy_gradient_loss | -9.44e-06    |
|    value_loss           | 172          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.68e+04    |
|    ep_rew_mean          | 709         |
| time/                   |             |
|    fps                  | 138         |
|    iterations           | 5211        |
|    time_elapsed         | 9645        |
|    total_timesteps      | 1334016     |
| train/                  |             |
|    approx_kl            | 3.16184e-07 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -1.85       |
|    explained_variance   | -0.000352   |
|    learning_rate        | 1e-06       |
|    loss                 | 0.0368      |
|    n_updates            | 52100       |
|    policy_gradient_loss | -3.63e-05   |
|    value_loss           | 0.106       |
-----------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.68e+04      |
|    ep_rew_mean          | 709           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 5220          |
|    time_elapsed         | 9662          |
|    total_timesteps      | 1336320       |
| train/                  |               |
|    approx_kl            | 7.0920214e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | -0.00424      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0442        |
|    n_updates            | 52190         |
|    policy_gradient_loss | -6.18e-05     |
|    value_loss           | 0.0886        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 706           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 5229          |
|    time_elapsed         | 9679          |
|    total_timesteps      | 1338624       |
| train/                  |               |
|    approx_kl            | 1.6884878e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | -0.0612       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0501        |
|    n_updates            | 52280         |
|    policy_gradient_loss | -3.59e-05     |
|    value_loss           | 0.0947        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.69e+04     |
|    ep_rew_mean          | 706          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 5238         |
|    time_elapsed         | 9697         |
|    total_timesteps      | 1340928      |
| train/                  |              |
|    approx_kl            | 9.336509e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | 0.0237       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0367       |
|    n_updates            | 52370        |
|    policy_gradient_loss | -0.000134    |
|    value_loss           | 0.0858       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 706           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 5248          |
|    time_elapsed         | 9715          |
|    total_timesteps      | 1343488       |
| train/                  |               |
|    approx_kl            | 7.4109994e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | 0.0965        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0395        |
|    n_updates            | 52470         |
|    policy_gradient_loss | -9.26e-05     |
|    value_loss           | 0.0801        |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 706           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 5257          |
|    time_elapsed         | 9732          |
|    total_timesteps      | 1345792       |
| train/                  |               |
|    approx_kl            | 3.3993274e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | 0.047         |
|    learning_rate        | 1e-06         |
|    loss                 | 451           |
|    n_updates            | 52560         |
|    policy_gradient_loss | -2.36e-07     |
|    value_loss           | 891           |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 706           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 5266          |
|    time_elapsed         | 9749          |
|    total_timesteps      | 1348096       |
| train/                  |               |
|    approx_kl            | 1.1015218e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | -0.000141     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.12          |
|    n_updates            | 52650         |
|    policy_gradient_loss | -0.000121     |
|    value_loss           | 0.229         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.69e+04    |
|    ep_rew_mean          | 706         |
| time/                   |             |
|    fps                  | 138         |
|    iterations           | 5275        |
|    time_elapsed         | 9767        |
|    total_timesteps      | 1350400     |
| train/                  |             |
|    approx_kl            | 4.45568e-06 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -1.84       |
|    explained_variance   | -0.000337   |
|    learning_rate        | 1e-06       |
|    loss                 | 0.103       |
|    n_updates            | 52740       |
|    policy_gradient_loss | -0.000183   |
|    value_loss           | 0.208       |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.69

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 706           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 5285          |
|    time_elapsed         | 9786          |
|    total_timesteps      | 1352960       |
| train/                  |               |
|    approx_kl            | 2.7490314e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.0156       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0437        |
|    n_updates            | 52840         |
|    policy_gradient_loss | -5.96e-05     |
|    value_loss           | 0.088         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 705           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 5294          |
|    time_elapsed         | 9803          |
|    total_timesteps      | 1355264       |
| train/                  |               |
|    approx_kl            | 4.7194771e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0003        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0357        |
|    n_updates            | 52930         |
|    policy_gradient_loss | -4.71e-05     |
|    value_loss           | 0.0919        |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.69e+04     |
|    ep_rew_mean          | 705          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 5303         |
|    time_elapsed         | 9820         |
|    total_timesteps      | 1357568      |
| train/                  |              |
|    approx_kl            | 1.876615e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.0465      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0541       |
|    n_updates            | 53020        |
|    policy_gradient_loss | -2.91e-05    |
|    value_loss           | 0.0981       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 705           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 5312          |
|    time_elapsed         | 9838          |
|    total_timesteps      | 1359872       |
| train/                  |               |
|    approx_kl            | 1.6444828e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.00625       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0496        |
|    n_updates            | 53110         |
|    policy_gradient_loss | -0.000142     |
|    value_loss           | 0.0858        |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.69e+04     |
|    ep_rew_mean          | 705          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 5321         |
|    time_elapsed         | 9855         |
|    total_timesteps      | 1362176      |
| train/                  |              |
|    approx_kl            | 4.703179e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | -0.186       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0948       |
|    n_updates            | 53200        |
|    policy_gradient_loss | -1.3e-05     |
|    value_loss           | 0.227        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.69e+04    |
|    ep_rew_mean          | 705         |
| time/                   |             |
|    fps                  | 138         |
|    iterations           | 5330        |
|    time_elapsed         | 9873        |
|    total_timesteps      | 1364480     |
| train/                  |             |
|    approx_kl            | 6.91507e-08 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -1.84       |
|    explained_variance   | 0.022       |
|    learning_rate        | 1e-06       |
|    loss                 | 0.127       |
|    n_updates            | 53290       |
|    policy_gradient_loss | -1.4e-05    |
|    value_loss           | 0.225       |
-----------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 705           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 5339          |
|    time_elapsed         | 9890          |
|    total_timesteps      | 1366784       |
| train/                  |               |
|    approx_kl            | 1.1958182e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | -3.91e-05     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0694        |
|    n_updates            | 53380         |
|    policy_gradient_loss | -0.000143     |
|    value_loss           | 0.228         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.69e+04     |
|    ep_rew_mean          | 705          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 5348         |
|    time_elapsed         | 9907         |
|    total_timesteps      | 1369088      |
| train/                  |              |
|    approx_kl            | 4.703179e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | 0.0648       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0407       |
|    n_updates            | 53470        |
|    policy_gradient_loss | -5.98e-05    |
|    value_loss           | 0.0891       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.69e+04     |
|    ep_rew_mean          | 705          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 5358         |
|    time_elapsed         | 9926         |
|    total_timesteps      | 1371648      |
| train/                  |              |
|    approx_kl            | 2.256129e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | -0.0981      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0461       |
|    n_updates            | 53570        |
|    policy_gradient_loss | -2.76e-05    |
|    value_loss           | 0.0949       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 705           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 5367          |
|    time_elapsed         | 9944          |
|    total_timesteps      | 1373952       |
| train/                  |               |
|    approx_kl            | 3.1781383e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | 0.0487        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0423        |
|    n_updates            | 53660         |
|    policy_gradient_loss | -4.45e-05     |
|    value_loss           | 0.0828        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.7e+04      |
|    ep_rew_mean          | 707          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 5376         |
|    time_elapsed         | 9961         |
|    total_timesteps      | 1376256      |
| train/                  |              |
|    approx_kl            | 7.683411e-09 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | 0.0116       |
|    learning_rate        | 1e-06        |
|    loss                 | 326          |
|    n_updates            | 53750        |
|    policy_gradient_loss | -1.34e-06    |
|    value_loss           | 579          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.7e+04      |
|    ep_rew_mean          | 707          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 5386         |
|    time_elapsed         | 9980         |
|    total_timesteps      | 1378816      |
| train/                  |              |
|    approx_kl            | 2.430752e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | 0.0148       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0372       |
|    n_updates            | 53850        |
|    policy_gradient_loss | -2.67e-05    |
|    value_loss           | 0.0875       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.7e+04       |
|    ep_rew_mean          | 707           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 5395          |
|    time_elapsed         | 9998          |
|    total_timesteps      | 1381120       |
| train/                  |               |
|    approx_kl            | 1.5359838e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | 0.00351       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0372        |
|    n_updates            | 53940         |
|    policy_gradient_loss | -0.00014      |
|    value_loss           | 0.0889        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.7e+04       |
|    ep_rew_mean          | 707           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 5404          |
|    time_elapsed         | 10015         |
|    total_timesteps      | 1383424       |
| train/                  |               |
|    approx_kl            | 3.9068982e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | -0.0515       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0431        |
|    n_updates            | 54030         |
|    policy_gradient_loss | -4.59e-05     |
|    value_loss           | 0.0892        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.7e+04      |
|    ep_rew_mean          | 707          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 5413         |
|    time_elapsed         | 10032        |
|    total_timesteps      | 1385728      |
| train/                  |              |
|    approx_kl            | 1.352746e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | 0.00807      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0888       |
|    n_updates            | 54120        |
|    policy_gradient_loss | -0.000172    |
|    value_loss           | 0.202        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.7e+04      |
|    ep_rew_mean          | 707          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 5422         |
|    time_elapsed         | 10050        |
|    total_timesteps      | 1388032      |
| train/                  |              |
|    approx_kl            | 1.124572e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | -8.87e-05    |
|    learning_rate        | 1e-06        |
|    loss                 | 0.116        |
|    n_updates            | 54210        |
|    policy_gradient_loss | -8.6e-06     |
|    value_loss           | 0.209        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.7e+04       |
|    ep_rew_mean          | 707           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 5431          |
|    time_elapsed         | 10068         |
|    total_timesteps      | 1390336       |
| train/                  |               |
|    approx_kl            | 7.1595423e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | -0.0609       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0508        |
|    n_updates            | 54300         |
|    policy_gradient_loss | -6.98e-05     |
|    value_loss           | 0.12          |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.7e+04      |
|    ep_rew_mean          | 707          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 5440         |
|    time_elapsed         | 10085        |
|    total_timesteps      | 1392640      |
| train/                  |              |
|    approx_kl            | 9.755604e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | -0.0265      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0322       |
|    n_updates            | 54390        |
|    policy_gradient_loss | -2.28e-05    |
|    value_loss           | 0.0935       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.7e+04       |
|    ep_rew_mean          | 707           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 5449          |
|    time_elapsed         | 10102         |
|    total_timesteps      | 1394944       |
| train/                  |               |
|    approx_kl            | 1.2684613e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | -0.0382       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0543        |
|    n_updates            | 54480         |
|    policy_gradient_loss | -0.000141     |
|    value_loss           | 0.0957        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.7e+04       |
|    ep_rew_mean          | 707           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 5458          |
|    time_elapsed         | 10119         |
|    total_timesteps      | 1397248       |
| train/                  |               |
|    approx_kl            | 5.3690746e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | 5.42e-06      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0415        |
|    n_updates            | 54570         |
|    policy_gradient_loss | -6.82e-05     |
|    value_loss           | 0.0879        |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.7e+04      |
|    ep_rew_mean          | 707          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 5467         |
|    time_elapsed         | 10136        |
|    total_timesteps      | 1399552      |
| train/                  |              |
|    approx_kl            | 3.213063e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | -0.0411      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.029        |
|    n_updates            | 54660        |
|    policy_gradient_loss | -1.03e-05    |
|    value_loss           | 0.0859       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 708           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 5476          |
|    time_elapsed         | 10154         |
|    total_timesteps      | 1401856       |
| train/                  |               |
|    approx_kl            | 2.9569492e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | -0.000365     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0592        |
|    n_updates            | 54750         |
|    policy_gradient_loss | -6.55e-06     |
|    value_loss           | 0.172         |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 708          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 5485         |
|    time_elapsed         | 10171        |
|    total_timesteps      | 1404160      |
| train/                  |              |
|    approx_kl            | 9.546056e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | 0.098        |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0412       |
|    n_updates            | 54840        |
|    policy_gradient_loss | -9.39e-05    |
|    value_loss           | 0.101        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 708           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 5494          |
|    time_elapsed         | 10188         |
|    total_timesteps      | 1406464       |
| train/                  |               |
|    approx_kl            | 2.7101487e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | 0.0415        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0462        |
|    n_updates            | 54930         |
|    policy_gradient_loss | -5.48e-05     |
|    value_loss           | 0.0865        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 708           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 5503          |
|    time_elapsed         | 10205         |
|    total_timesteps      | 1408768       |
| train/                  |               |
|    approx_kl            | 1.3895333e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | -0.000147     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.121         |
|    n_updates            | 55020         |
|    policy_gradient_loss | -0.000109     |
|    value_loss           | 0.213         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 708           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 5513          |
|    time_elapsed         | 10224         |
|    total_timesteps      | 1411328       |
| train/                  |               |
|    approx_kl            | 5.1455572e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | 0.0516        |
|    learning_rate        | 1e-06         |
|    loss                 | 381           |
|    n_updates            | 55120         |
|    policy_gradient_loss | -6.1e-06      |
|    value_loss           | 966           |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 708          |
| time/                   |              |
|    fps                  | 138          |
|    iterations           | 5522         |
|    time_elapsed         | 10241        |
|    total_timesteps      | 1413632      |
| train/                  |              |
|    approx_kl            | 4.216563e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.85        |
|    explained_variance   | -0.0122      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0516       |
|    n_updates            | 55210        |
|    policy_gradient_loss | -4.59e-05    |
|    value_loss           | 0.0896       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 708           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 5531          |
|    time_elapsed         | 10258         |
|    total_timesteps      | 1415936       |
| train/                  |               |
|    approx_kl            | 2.8521754e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | 0.00319       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0593        |
|    n_updates            | 55300         |
|    policy_gradient_loss | -2.17e-05     |
|    value_loss           | 0.101         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 708           |
| time/                   |               |
|    fps                  | 138           |
|    iterations           | 5540          |
|    time_elapsed         | 10275         |
|    total_timesteps      | 1418240       |
| train/                  |               |
|    approx_kl            | 2.4889596e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | -0.0804       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0469        |
|    n_updates            | 55390         |
|    policy_gradient_loss | -3.32e-05     |
|    value_loss           | 0.0993        |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 711           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 5549          |
|    time_elapsed         | 10293         |
|    total_timesteps      | 1420544       |
| train/                  |               |
|    approx_kl            | 3.7485734e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | -0.0249       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0598        |
|    n_updates            | 55480         |
|    policy_gradient_loss | -1.04e-05     |
|    value_loss           | 0.15          |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 711           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 5558          |
|    time_elapsed         | 10310         |
|    total_timesteps      | 1422848       |
| train/                  |               |
|    approx_kl            | 2.1629967e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | -0.0413       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0494        |
|    n_updates            | 55570         |
|    policy_gradient_loss | -2.47e-05     |
|    value_loss           | 0.101         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 711           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 5567          |
|    time_elapsed         | 10327         |
|    total_timesteps      | 1425152       |
| train/                  |               |
|    approx_kl            | 2.9732473e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | 0.0975        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0447        |
|    n_updates            | 55660         |
|    policy_gradient_loss | -3.54e-05     |
|    value_loss           | 0.0793        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.7e+04       |
|    ep_rew_mean          | 716           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 5576          |
|    time_elapsed         | 10344         |
|    total_timesteps      | 1427456       |
| train/                  |               |
|    approx_kl            | 5.4435804e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0279        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0367        |
|    n_updates            | 55750         |
|    policy_gradient_loss | -5.29e-05     |
|    value_loss           | 0.0791        |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.7e+04       |
|    ep_rew_mean          | 716           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 5585          |
|    time_elapsed         | 10361         |
|    total_timesteps      | 1429760       |
| train/                  |               |
|    approx_kl            | 1.5785918e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0268        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0451        |
|    n_updates            | 55840         |
|    policy_gradient_loss | -1.37e-05     |
|    value_loss           | 0.0933        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.7e+04       |
|    ep_rew_mean          | 716           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 5594          |
|    time_elapsed         | 10379         |
|    total_timesteps      | 1432064       |
| train/                  |               |
|    approx_kl            | 1.2526289e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.243         |
|    learning_rate        | 1e-06         |
|    loss                 | 82.4          |
|    n_updates            | 55930         |
|    policy_gradient_loss | 9.6e-06       |
|    value_loss           | 176           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.7e+04       |
|    ep_rew_mean          | 716           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 5603          |
|    time_elapsed         | 10396         |
|    total_timesteps      | 1434368       |
| train/                  |               |
|    approx_kl            | 3.0803494e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.226        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0457        |
|    n_updates            | 56020         |
|    policy_gradient_loss | -3.96e-05     |
|    value_loss           | 0.114         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.7e+04       |
|    ep_rew_mean          | 716           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 5612          |
|    time_elapsed         | 10414         |
|    total_timesteps      | 1436672       |
| train/                  |               |
|    approx_kl            | 4.4470653e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.216        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0901        |
|    n_updates            | 56110         |
|    policy_gradient_loss | -1.15e-05     |
|    value_loss           | 0.252         |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.7e+04      |
|    ep_rew_mean          | 716          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 5621         |
|    time_elapsed         | 10430        |
|    total_timesteps      | 1438976      |
| train/                  |              |
|    approx_kl            | 6.570481e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.00109     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.073        |
|    n_updates            | 56200        |
|    policy_gradient_loss | -7.3e-05     |
|    value_loss           | 0.221        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.7e+04       |
|    ep_rew_mean          | 716           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 5630          |
|    time_elapsed         | 10448         |
|    total_timesteps      | 1441280       |
| train/                  |               |
|    approx_kl            | 8.7940134e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0184        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0808        |
|    n_updates            | 56290         |
|    policy_gradient_loss | -0.000114     |
|    value_loss           | 0.12          |
-------------------------------------------
-------------------------------------------
| rollout/                |     

----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.7e+04    |
|    ep_rew_mean          | 715        |
| time/                   |            |
|    fps                  | 137        |
|    iterations           | 5639       |
|    time_elapsed         | 10465      |
|    total_timesteps      | 1443584    |
| train/                  |            |
|    approx_kl            | 5.3111e-06 |
|    clip_fraction        | 0          |
|    clip_range           | 0.2        |
|    entropy_loss         | -1.84      |
|    explained_variance   | -0.0158    |
|    learning_rate        | 1e-06      |
|    loss                 | 0.0407     |
|    n_updates            | 56380      |
|    policy_gradient_loss | -0.00034   |
|    value_loss           | 0.0906     |
----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.7e+04      |
|    ep_re

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.68e+04      |
|    ep_rew_mean          | 718           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 5649          |
|    time_elapsed         | 10484         |
|    total_timesteps      | 1446144       |
| train/                  |               |
|    approx_kl            | 1.6232952e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0151        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0668        |
|    n_updates            | 56480         |
|    policy_gradient_loss | -7.77e-05     |
|    value_loss           | 0.115         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.68e+04      |
|    ep_rew_mean          | 718           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 5658          |
|    time_elapsed         | 10501         |
|    total_timesteps      | 1448448       |
| train/                  |               |
|    approx_kl            | 1.7718412e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.0383       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0401        |
|    n_updates            | 56570         |
|    policy_gradient_loss | -2.76e-05     |
|    value_loss           | 0.0897        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.68e+04    |
|    ep_rew_mean          | 718         |
| time/                   |             |
|    fps                  | 137         |
|    iterations           | 5667        |
|    time_elapsed         | 10519       |
|    total_timesteps      | 1450752     |
| train/                  |             |
|    approx_kl            | 8.71974e-06 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -1.84       |
|    explained_variance   | 0.00437     |
|    learning_rate        | 1e-06       |
|    loss                 | 0.0523      |
|    n_updates            | 56660       |
|    policy_gradient_loss | -0.000306   |
|    value_loss           | 0.0966      |
-----------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.68e+04      |
|    ep_rew_mean          | 718           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 5676          |
|    time_elapsed         | 10536         |
|    total_timesteps      | 1453056       |
| train/                  |               |
|    approx_kl            | 3.1245872e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.0923       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0413        |
|    n_updates            | 56750         |
|    policy_gradient_loss | -4.24e-05     |
|    value_loss           | 0.0937        |
-------------------------------------------
-----------------------------------------
| rollout/                |       

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.68e+04      |
|    ep_rew_mean          | 718           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 5685          |
|    time_elapsed         | 10553         |
|    total_timesteps      | 1455360       |
| train/                  |               |
|    approx_kl            | 2.8056093e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0145        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.151         |
|    n_updates            | 56840         |
|    policy_gradient_loss | -3.19e-05     |
|    value_loss           | 0.229         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.68e+04      |
|    ep_rew_mean          | 718           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 5694          |
|    time_elapsed         | 10570         |
|    total_timesteps      | 1457664       |
| train/                  |               |
|    approx_kl            | 1.2081582e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.0826       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.152         |
|    n_updates            | 56930         |
|    policy_gradient_loss | -0.000123     |
|    value_loss           | 0.231         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.68e+04      |
|    ep_rew_mean          | 718           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 5703          |
|    time_elapsed         | 10587         |
|    total_timesteps      | 1459968       |
| train/                  |               |
|    approx_kl            | 2.0978041e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.0655       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0503        |
|    n_updates            | 57020         |
|    policy_gradient_loss | -2.57e-05     |
|    value_loss           | 0.108         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.68e+04      |
|    ep_rew_mean          | 718           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 5712          |
|    time_elapsed         | 10605         |
|    total_timesteps      | 1462272       |
| train/                  |               |
|    approx_kl            | 3.1897798e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0128        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0605        |
|    n_updates            | 57110         |
|    policy_gradient_loss | -1.47e-05     |
|    value_loss           | 0.21          |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.68e+04      |
|    ep_rew_mean          | 718           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 5721          |
|    time_elapsed         | 10622         |
|    total_timesteps      | 1464576       |
| train/                  |               |
|    approx_kl            | 5.6484714e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0141        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0334        |
|    n_updates            | 57200         |
|    policy_gradient_loss | -4.75e-05     |
|    value_loss           | 0.111         |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.68e+04     |
|    ep_rew_mean          | 718          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 5730         |
|    time_elapsed         | 10639        |
|    total_timesteps      | 1466880      |
| train/                  |              |
|    approx_kl            | 7.895287e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.0429      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0477       |
|    n_updates            | 57290        |
|    policy_gradient_loss | -4.38e-05    |
|    value_loss           | 0.0878       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.68e+04     |
|    ep_rew_mean          | 718          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 5739         |
|    time_elapsed         | 10656        |
|    total_timesteps      | 1469184      |
| train/                  |              |
|    approx_kl            | 6.540213e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.00035      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0602       |
|    n_updates            | 57380        |
|    policy_gradient_loss | -7.01e-05    |
|    value_loss           | 0.119        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.69e+04     |
|    ep_rew_mean          | 719          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 5748         |
|    time_elapsed         | 10674        |
|    total_timesteps      | 1471488      |
| train/                  |              |
|    approx_kl            | 1.791399e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.011       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0565       |
|    n_updates            | 57470        |
|    policy_gradient_loss | -1.99e-05    |
|    value_loss           | 0.107        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.69e+04    |
|    ep_rew_mean          | 719         |
| time/                   |             |
|    fps                  | 137         |
|    iterations           | 5757        |
|    time_elapsed         | 10691       |
|    total_timesteps      | 1473792     |
| train/                  |             |
|    approx_kl            | 1.86963e-07 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -1.84       |
|    explained_variance   | -0.0621     |
|    learning_rate        | 1e-06       |
|    loss                 | 0.0493      |
|    n_updates            | 57560       |
|    policy_gradient_loss | -3.83e-05   |
|    value_loss           | 0.101       |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.69

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.69e+04     |
|    ep_rew_mean          | 719          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 5767         |
|    time_elapsed         | 10710        |
|    total_timesteps      | 1476352      |
| train/                  |              |
|    approx_kl            | 5.213078e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.0365      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0487       |
|    n_updates            | 57660        |
|    policy_gradient_loss | -9.81e-05    |
|    value_loss           | 0.0941       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 719           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 5776          |
|    time_elapsed         | 10727         |
|    total_timesteps      | 1478656       |
| train/                  |               |
|    approx_kl            | 8.8708475e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0623        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0837        |
|    n_updates            | 57750         |
|    policy_gradient_loss | -1.44e-05     |
|    value_loss           | 0.228         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 719           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 5785          |
|    time_elapsed         | 10745         |
|    total_timesteps      | 1480960       |
| train/                  |               |
|    approx_kl            | 1.3313256e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.00472      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.108         |
|    n_updates            | 57840         |
|    policy_gradient_loss | -0.00014      |
|    value_loss           | 0.223         |
-------------------------------------------
-----------------------------------------
| rollout/                |       

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 719           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 5794          |
|    time_elapsed         | 10761         |
|    total_timesteps      | 1483264       |
| train/                  |               |
|    approx_kl            | 2.5122426e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.0319       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0453        |
|    n_updates            | 57930         |
|    policy_gradient_loss | -3.02e-05     |
|    value_loss           | 0.0969        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.69e+04     |
|    ep_rew_mean          | 715          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 5803         |
|    time_elapsed         | 10779        |
|    total_timesteps      | 1485568      |
| train/                  |              |
|    approx_kl            | 8.700881e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -9.3e-05     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0385       |
|    n_updates            | 58020        |
|    policy_gradient_loss | -8.29e-05    |
|    value_loss           | 0.0911       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 715           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 5812          |
|    time_elapsed         | 10796         |
|    total_timesteps      | 1487872       |
| train/                  |               |
|    approx_kl            | 7.7998266e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.0519       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0404        |
|    n_updates            | 58110         |
|    policy_gradient_loss | -2.49e-05     |
|    value_loss           | 0.0862        |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 715           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 5821          |
|    time_elapsed         | 10813         |
|    total_timesteps      | 1490176       |
| train/                  |               |
|    approx_kl            | 1.2549572e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.119         |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0384        |
|    n_updates            | 58200         |
|    policy_gradient_loss | -2.78e-05     |
|    value_loss           | 0.0785        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.69e+04     |
|    ep_rew_mean          | 715          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 5830         |
|    time_elapsed         | 10830        |
|    total_timesteps      | 1492480      |
| train/                  |              |
|    approx_kl            | 6.263144e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.0663       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0388       |
|    n_updates            | 58290        |
|    policy_gradient_loss | -1.05e-06    |
|    value_loss           | 0.082        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 715           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 5839          |
|    time_elapsed         | 10847         |
|    total_timesteps      | 1494784       |
| train/                  |               |
|    approx_kl            | 4.7730282e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.000209      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.136         |
|    n_updates            | 58380         |
|    policy_gradient_loss | -1.29e-05     |
|    value_loss           | 0.274         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.69e+04     |
|    ep_rew_mean          | 715          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 5848         |
|    time_elapsed         | 10865        |
|    total_timesteps      | 1497088      |
| train/                  |              |
|    approx_kl            | 4.810281e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.00676      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.148        |
|    n_updates            | 58470        |
|    policy_gradient_loss | -7.13e-05    |
|    value_loss           | 0.239        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 715           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 5857          |
|    time_elapsed         | 10882         |
|    total_timesteps      | 1499392       |
| train/                  |               |
|    approx_kl            | 8.2771294e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.000385      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.046         |
|    n_updates            | 58560         |
|    policy_gradient_loss | -9.14e-05     |
|    value_loss           | 0.102         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 715           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 5866          |
|    time_elapsed         | 10899         |
|    total_timesteps      | 1501696       |
| train/                  |               |
|    approx_kl            | 2.0908192e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0148        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0366        |
|    n_updates            | 58650         |
|    policy_gradient_loss | -2.37e-05     |
|    value_loss           | 0.0897        |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.69e+04     |
|    ep_rew_mean          | 715          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 5875         |
|    time_elapsed         | 10916        |
|    total_timesteps      | 1504000      |
| train/                  |              |
|    approx_kl            | 9.660143e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.115       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0494       |
|    n_updates            | 58740        |
|    policy_gradient_loss | -9.24e-05    |
|    value_loss           | 0.0898       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 715           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 5884          |
|    time_elapsed         | 10933         |
|    total_timesteps      | 1506304       |
| train/                  |               |
|    approx_kl            | 1.8181745e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.000335     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0385        |
|    n_updates            | 58830         |
|    policy_gradient_loss | -0.000174     |
|    value_loss           | 0.0877        |
-------------------------------------------
----------------------------------------
| rollout/                |        

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 717           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 5894          |
|    time_elapsed         | 10952         |
|    total_timesteps      | 1508864       |
| train/                  |               |
|    approx_kl            | 1.4901161e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0561        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.068         |
|    n_updates            | 58930         |
|    policy_gradient_loss | 4.52e-06      |
|    value_loss           | 0.146         |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.69e+04     |
|    ep_rew_mean          | 717          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 5903         |
|    time_elapsed         | 10970        |
|    total_timesteps      | 1511168      |
| train/                  |              |
|    approx_kl            | 5.264301e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.00213      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0338       |
|    n_updates            | 59020        |
|    policy_gradient_loss | -5.87e-05    |
|    value_loss           | 0.0912       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 717           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 5912          |
|    time_elapsed         | 10987         |
|    total_timesteps      | 1513472       |
| train/                  |               |
|    approx_kl            | 3.9231963e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.112        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0338        |
|    n_updates            | 59110         |
|    policy_gradient_loss | -4.96e-05     |
|    value_loss           | 0.0846        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.69e+04     |
|    ep_rew_mean          | 717          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 5921         |
|    time_elapsed         | 11004        |
|    total_timesteps      | 1515776      |
| train/                  |              |
|    approx_kl            | 3.199093e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.00169     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0481       |
|    n_updates            | 59200        |
|    policy_gradient_loss | -2.41e-05    |
|    value_loss           | 0.0833       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 717           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 5930          |
|    time_elapsed         | 11021         |
|    total_timesteps      | 1518080       |
| train/                  |               |
|    approx_kl            | 1.3969839e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.0635       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.115         |
|    n_updates            | 59290         |
|    policy_gradient_loss | -2.29e-05     |
|    value_loss           | 0.257         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.69e+04     |
|    ep_rew_mean          | 717          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 5939         |
|    time_elapsed         | 11039        |
|    total_timesteps      | 1520384      |
| train/                  |              |
|    approx_kl            | 7.422641e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.00736     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.118        |
|    n_updates            | 59380        |
|    policy_gradient_loss | -7.74e-05    |
|    value_loss           | 0.222        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.69e+04     |
|    ep_rew_mean          | 717          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 5948         |
|    time_elapsed         | 11056        |
|    total_timesteps      | 1522688      |
| train/                  |              |
|    approx_kl            | 1.497101e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.0217       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0413       |
|    n_updates            | 59470        |
|    policy_gradient_loss | -1.39e-05    |
|    value_loss           | 0.0865       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 715           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 5957          |
|    time_elapsed         | 11073         |
|    total_timesteps      | 1524992       |
| train/                  |               |
|    approx_kl            | 6.2864274e-09 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.318         |
|    learning_rate        | 1e-06         |
|    loss                 | 45.7          |
|    n_updates            | 59560         |
|    policy_gradient_loss | 4.61e-09      |
|    value_loss           | 95.3          |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 715           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 5967          |
|    time_elapsed         | 11092         |
|    total_timesteps      | 1527552       |
| train/                  |               |
|    approx_kl            | 2.8708018e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0124        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0381        |
|    n_updates            | 59660         |
|    policy_gradient_loss | -2.34e-05     |
|    value_loss           | 0.0866        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.69e+04     |
|    ep_rew_mean          | 715          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 5976         |
|    time_elapsed         | 11109        |
|    total_timesteps      | 1529856      |
| train/                  |              |
|    approx_kl            | 9.075273e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.121        |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0379       |
|    n_updates            | 59750        |
|    policy_gradient_loss | -0.000109    |
|    value_loss           | 0.078        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.69e+04     |
|    ep_rew_mean          | 715          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 5985         |
|    time_elapsed         | 11127        |
|    total_timesteps      | 1532160      |
| train/                  |              |
|    approx_kl            | 1.701992e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.00515     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0465       |
|    n_updates            | 59840        |
|    policy_gradient_loss | -1.69e-05    |
|    value_loss           | 0.0884       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.69e+04     |
|    ep_rew_mean          | 715          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 5994         |
|    time_elapsed         | 11144        |
|    total_timesteps      | 1534464      |
| train/                  |              |
|    approx_kl            | 1.718034e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.00517      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0929       |
|    n_updates            | 59930        |
|    policy_gradient_loss | -0.000291    |
|    value_loss           | 0.218        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 715           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6003          |
|    time_elapsed         | 11161         |
|    total_timesteps      | 1536768       |
| train/                  |               |
|    approx_kl            | 6.2026083e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.00259       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0872        |
|    n_updates            | 60020         |
|    policy_gradient_loss | -7.12e-05     |
|    value_loss           | 0.191         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 715           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6012          |
|    time_elapsed         | 11178         |
|    total_timesteps      | 1539072       |
| train/                  |               |
|    approx_kl            | 4.9872324e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.0204       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0453        |
|    n_updates            | 60110         |
|    policy_gradient_loss | -6.17e-05     |
|    value_loss           | 0.0886        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 715           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6021          |
|    time_elapsed         | 11196         |
|    total_timesteps      | 1541376       |
| train/                  |               |
|    approx_kl            | 2.8533395e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0558        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0534        |
|    n_updates            | 60200         |
|    policy_gradient_loss | -0.000102     |
|    value_loss           | 0.134         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 715           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6030          |
|    time_elapsed         | 11213         |
|    total_timesteps      | 1543680       |
| train/                  |               |
|    approx_kl            | 1.0966323e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.00746      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.06          |
|    n_updates            | 60290         |
|    policy_gradient_loss | -2.76e-05     |
|    value_loss           | 0.132         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 715           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6039          |
|    time_elapsed         | 11230         |
|    total_timesteps      | 1545984       |
| train/                  |               |
|    approx_kl            | 1.3667159e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.151         |
|    learning_rate        | 1e-06         |
|    loss                 | 0.035         |
|    n_updates            | 60380         |
|    policy_gradient_loss | -2.97e-05     |
|    value_loss           | 0.0765        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.69e+04     |
|    ep_rew_mean          | 715          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 6048         |
|    time_elapsed         | 11247        |
|    total_timesteps      | 1548288      |
| train/                  |              |
|    approx_kl            | 3.236346e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.00297     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0423       |
|    n_updates            | 60470        |
|    policy_gradient_loss | -4.59e-05    |
|    value_loss           | 0.0865       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 715           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6057          |
|    time_elapsed         | 11265         |
|    total_timesteps      | 1550592       |
| train/                  |               |
|    approx_kl            | 1.1203811e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.111        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.123         |
|    n_updates            | 60560         |
|    policy_gradient_loss | -4.43e-05     |
|    value_loss           | 0.238         |
-------------------------------------------
-----------------------------------------
| rollout/                |       

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.69e+04     |
|    ep_rew_mean          | 715          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 6066         |
|    time_elapsed         | 11282        |
|    total_timesteps      | 1552896      |
| train/                  |              |
|    approx_kl            | 7.744413e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.0559      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0971       |
|    n_updates            | 60650        |
|    policy_gradient_loss | -0.000179    |
|    value_loss           | 0.22         |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 715           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6075          |
|    time_elapsed         | 11299         |
|    total_timesteps      | 1555200       |
| train/                  |               |
|    approx_kl            | 1.3262033e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.00657      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0448        |
|    n_updates            | 60740         |
|    policy_gradient_loss | -5.46e-05     |
|    value_loss           | 0.0878        |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.69e+04     |
|    ep_rew_mean          | 714          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 6084         |
|    time_elapsed         | 11316        |
|    total_timesteps      | 1557504      |
| train/                  |              |
|    approx_kl            | 5.052425e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.105       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0478       |
|    n_updates            | 60830        |
|    policy_gradient_loss | -6.23e-05    |
|    value_loss           | 0.102        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 714           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6093          |
|    time_elapsed         | 11333         |
|    total_timesteps      | 1559808       |
| train/                  |               |
|    approx_kl            | 1.0491349e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.163        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0446        |
|    n_updates            | 60920         |
|    policy_gradient_loss | -0.000118     |
|    value_loss           | 0.091         |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.69e+04     |
|    ep_rew_mean          | 714          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 6102         |
|    time_elapsed         | 11351        |
|    total_timesteps      | 1562112      |
| train/                  |              |
|    approx_kl            | 7.362105e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.0257       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0417       |
|    n_updates            | 61010        |
|    policy_gradient_loss | -6.87e-05    |
|    value_loss           | 0.0902       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.69e+04     |
|    ep_rew_mean          | 714          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 6111         |
|    time_elapsed         | 11368        |
|    total_timesteps      | 1564416      |
| train/                  |              |
|    approx_kl            | 7.050112e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.00179     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0475       |
|    n_updates            | 61100        |
|    policy_gradient_loss | -5.84e-05    |
|    value_loss           | 0.104        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 714           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6120          |
|    time_elapsed         | 11386         |
|    total_timesteps      | 1566720       |
| train/                  |               |
|    approx_kl            | 2.0256266e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.21          |
|    learning_rate        | 1e-06         |
|    loss                 | 92.6          |
|    n_updates            | 61190         |
|    policy_gradient_loss | -7.78e-06     |
|    value_loss           | 221           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.69e+04     |
|    ep_rew_mean          | 714          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 6129         |
|    time_elapsed         | 11403        |
|    total_timesteps      | 1569024      |
| train/                  |              |
|    approx_kl            | 5.653128e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.00206      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0797       |
|    n_updates            | 61280        |
|    policy_gradient_loss | -8.57e-05    |
|    value_loss           | 0.219        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 714           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6138          |
|    time_elapsed         | 11421         |
|    total_timesteps      | 1571328       |
| train/                  |               |
|    approx_kl            | 5.6042336e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.00458       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0648        |
|    n_updates            | 61370         |
|    policy_gradient_loss | -9.87e-05     |
|    value_loss           | 0.136         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.69e+04     |
|    ep_rew_mean          | 714          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 6147         |
|    time_elapsed         | 11438        |
|    total_timesteps      | 1573632      |
| train/                  |              |
|    approx_kl            | 5.858019e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.00283     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.037        |
|    n_updates            | 61460        |
|    policy_gradient_loss | -9.93e-05    |
|    value_loss           | 0.0836       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 714           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6156          |
|    time_elapsed         | 11455         |
|    total_timesteps      | 1575936       |
| train/                  |               |
|    approx_kl            | 1.0712538e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.00417       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0534        |
|    n_updates            | 61550         |
|    policy_gradient_loss | -0.000133     |
|    value_loss           | 0.091         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.69e+04     |
|    ep_rew_mean          | 714          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 6165         |
|    time_elapsed         | 11472        |
|    total_timesteps      | 1578240      |
| train/                  |              |
|    approx_kl            | 8.100178e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.138       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0398       |
|    n_updates            | 61640        |
|    policy_gradient_loss | -8.87e-05    |
|    value_loss           | 0.0914       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.7e+04      |
|    ep_rew_mean          | 713          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 6175         |
|    time_elapsed         | 11491        |
|    total_timesteps      | 1580800      |
| train/                  |              |
|    approx_kl            | 3.054738e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.225        |
|    learning_rate        | 1e-06        |
|    loss                 | 326          |
|    n_updates            | 61740        |
|    policy_gradient_loss | 1.42e-05     |
|    value_loss           | 619          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.7e+04       |
|    ep_rew_mean          | 713           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6184          |
|    time_elapsed         | 11509         |
|    total_timesteps      | 1583104       |
| train/                  |               |
|    approx_kl            | 2.0349398e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.0155       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0593        |
|    n_updates            | 61830         |
|    policy_gradient_loss | -2.54e-05     |
|    value_loss           | 0.144         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.7e+04       |
|    ep_rew_mean          | 713           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6193          |
|    time_elapsed         | 11526         |
|    total_timesteps      | 1585408       |
| train/                  |               |
|    approx_kl            | 3.5599805e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.0141       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0438        |
|    n_updates            | 61920         |
|    policy_gradient_loss | -4.22e-05     |
|    value_loss           | 0.0937        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.7e+04       |
|    ep_rew_mean          | 713           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6202          |
|    time_elapsed         | 11543         |
|    total_timesteps      | 1587712       |
| train/                  |               |
|    approx_kl            | 2.3236498e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.00191      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0452        |
|    n_updates            | 62010         |
|    policy_gradient_loss | -3.04e-05     |
|    value_loss           | 0.0882        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.7e+04      |
|    ep_rew_mean          | 713          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 6211         |
|    time_elapsed         | 11560        |
|    total_timesteps      | 1590016      |
| train/                  |              |
|    approx_kl            | 6.170012e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.00319      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.123        |
|    n_updates            | 62100        |
|    policy_gradient_loss | -9.38e-06    |
|    value_loss           | 0.259        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.7e+04       |
|    ep_rew_mean          | 713           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6220          |
|    time_elapsed         | 11577         |
|    total_timesteps      | 1592320       |
| train/                  |               |
|    approx_kl            | 2.2933818e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.011        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0754        |
|    n_updates            | 62190         |
|    policy_gradient_loss | -3.18e-05     |
|    value_loss           | 0.246         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.7e+04       |
|    ep_rew_mean          | 713           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6229          |
|    time_elapsed         | 11594         |
|    total_timesteps      | 1594624       |
| train/                  |               |
|    approx_kl            | 7.6694414e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.156        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0515        |
|    n_updates            | 62280         |
|    policy_gradient_loss | -0.000101     |
|    value_loss           | 0.104         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.7e+04      |
|    ep_rew_mean          | 717          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 6238         |
|    time_elapsed         | 11611        |
|    total_timesteps      | 1596928      |
| train/                  |              |
|    approx_kl            | 9.080395e-09 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.00261      |
|    learning_rate        | 1e-06        |
|    loss                 | 562          |
|    n_updates            | 62370        |
|    policy_gradient_loss | 4.7e-08      |
|    value_loss           | 1.11e+03     |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.7e+04       |
|    ep_rew_mean          | 717           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6247          |
|    time_elapsed         | 11628         |
|    total_timesteps      | 1599232       |
| train/                  |               |
|    approx_kl            | 4.1304156e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.274        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.045         |
|    n_updates            | 62460         |
|    policy_gradient_loss | -5.97e-05     |
|    value_loss           | 0.0947        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.7e+04       |
|    ep_rew_mean          | 717           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6256          |
|    time_elapsed         | 11646         |
|    total_timesteps      | 1601536       |
| train/                  |               |
|    approx_kl            | 3.1408854e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0111        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0336        |
|    n_updates            | 62550         |
|    policy_gradient_loss | -3.63e-05     |
|    value_loss           | 0.0817        |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.7e+04      |
|    ep_rew_mean          | 717          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 6265         |
|    time_elapsed         | 11664        |
|    total_timesteps      | 1603840      |
| train/                  |              |
|    approx_kl            | 3.266614e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.226        |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0269       |
|    n_updates            | 62640        |
|    policy_gradient_loss | -4.45e-05    |
|    value_loss           | 0.0662       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.7e+04       |
|    ep_rew_mean          | 717           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6274          |
|    time_elapsed         | 11681         |
|    total_timesteps      | 1606144       |
| train/                  |               |
|    approx_kl            | 1.2130477e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.00387       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0888        |
|    n_updates            | 62730         |
|    policy_gradient_loss | -2.17e-05     |
|    value_loss           | 0.314         |
-------------------------------------------
--------------------------------------------
| rollout/                |    

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.7e+04      |
|    ep_rew_mean          | 717          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 6283         |
|    time_elapsed         | 11698        |
|    total_timesteps      | 1608448      |
| train/                  |              |
|    approx_kl            | 3.548339e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.000198     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.122        |
|    n_updates            | 62820        |
|    policy_gradient_loss | -4.61e-05    |
|    value_loss           | 0.255        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.7e+04      |
|    ep_rew_mean          | 717          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 6292         |
|    time_elapsed         | 11715        |
|    total_timesteps      | 1610752      |
| train/                  |              |
|    approx_kl            | 3.098976e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.0914      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0446       |
|    n_updates            | 62910        |
|    policy_gradient_loss | -3.68e-05    |
|    value_loss           | 0.0923       |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.7e+04      |
|    ep_rew_mean          | 717          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 6302         |
|    time_elapsed         | 11734        |
|    total_timesteps      | 1613312      |
| train/                  |              |
|    approx_kl            | 2.537854e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.218       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0656       |
|    n_updates            | 63010        |
|    policy_gradient_loss | -6.42e-06    |
|    value_loss           | 0.169        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.7e+04       |
|    ep_rew_mean          | 717           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6311          |
|    time_elapsed         | 11751         |
|    total_timesteps      | 1615616       |
| train/                  |               |
|    approx_kl            | 2.0465814e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.00657      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0413        |
|    n_updates            | 63100         |
|    policy_gradient_loss | -2.99e-05     |
|    value_loss           | 0.108         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.7e+04       |
|    ep_rew_mean          | 717           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6320          |
|    time_elapsed         | 11768         |
|    total_timesteps      | 1617920       |
| train/                  |               |
|    approx_kl            | 2.3655593e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0959        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0339        |
|    n_updates            | 63190         |
|    policy_gradient_loss | -2.02e-05     |
|    value_loss           | 0.0817        |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.7e+04       |
|    ep_rew_mean          | 717           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6329          |
|    time_elapsed         | 11786         |
|    total_timesteps      | 1620224       |
| train/                  |               |
|    approx_kl            | 3.8556755e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0304        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0362        |
|    n_updates            | 63280         |
|    policy_gradient_loss | -3.97e-05     |
|    value_loss           | 0.0882        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 716           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6338          |
|    time_elapsed         | 11803         |
|    total_timesteps      | 1622528       |
| train/                  |               |
|    approx_kl            | 2.7916394e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.157         |
|    learning_rate        | 1e-06         |
|    loss                 | 0.048         |
|    n_updates            | 63370         |
|    policy_gradient_loss | -6.16e-05     |
|    value_loss           | 0.114         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 716           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6347          |
|    time_elapsed         | 11820         |
|    total_timesteps      | 1624832       |
| train/                  |               |
|    approx_kl            | 8.3609484e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0121        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0551        |
|    n_updates            | 63460         |
|    policy_gradient_loss | -0.000111     |
|    value_loss           | 0.131         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 716           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6356          |
|    time_elapsed         | 11837         |
|    total_timesteps      | 1627136       |
| train/                  |               |
|    approx_kl            | 2.7078204e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0222        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0513        |
|    n_updates            | 63550         |
|    policy_gradient_loss | -2.34e-05     |
|    value_loss           | 0.0877        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 716           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6365          |
|    time_elapsed         | 11854         |
|    total_timesteps      | 1629440       |
| train/                  |               |
|    approx_kl            | 8.5448846e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.293         |
|    learning_rate        | 1e-06         |
|    loss                 | 102           |
|    n_updates            | 63640         |
|    policy_gradient_loss | -1.68e-05     |
|    value_loss           | 212           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 716           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6374          |
|    time_elapsed         | 11872         |
|    total_timesteps      | 1631744       |
| train/                  |               |
|    approx_kl            | 6.8265945e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.0109       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.102         |
|    n_updates            | 63730         |
|    policy_gradient_loss | -5.14e-05     |
|    value_loss           | 0.249         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 716           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6383          |
|    time_elapsed         | 11889         |
|    total_timesteps      | 1634048       |
| train/                  |               |
|    approx_kl            | 1.4784746e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.0156       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0937        |
|    n_updates            | 63820         |
|    policy_gradient_loss | -3.68e-05     |
|    value_loss           | 0.188         |
-------------------------------------------
--------------------------------------------
| rollout/                |    

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 716          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 6392         |
|    time_elapsed         | 11906        |
|    total_timesteps      | 1636352      |
| train/                  |              |
|    approx_kl            | 3.662426e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.0827       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0436       |
|    n_updates            | 63910        |
|    policy_gradient_loss | -4.17e-05    |
|    value_loss           | 0.0852       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 718           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6401          |
|    time_elapsed         | 11923         |
|    total_timesteps      | 1638656       |
| train/                  |               |
|    approx_kl            | 4.7613867e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.00344      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0413        |
|    n_updates            | 64000         |
|    policy_gradient_loss | -4.33e-05     |
|    value_loss           | 0.0881        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 718           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6410          |
|    time_elapsed         | 11941         |
|    total_timesteps      | 1640960       |
| train/                  |               |
|    approx_kl            | 1.3760291e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.00297      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0391        |
|    n_updates            | 64090         |
|    policy_gradient_loss | -2.63e-05     |
|    value_loss           | 0.096         |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 718          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 6419         |
|    time_elapsed         | 11958        |
|    total_timesteps      | 1643264      |
| train/                  |              |
|    approx_kl            | 1.557637e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.00323     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0395       |
|    n_updates            | 64180        |
|    policy_gradient_loss | -1.12e-05    |
|    value_loss           | 0.0878       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 718          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 6429         |
|    time_elapsed         | 11978        |
|    total_timesteps      | 1645824      |
| train/                  |              |
|    approx_kl            | 3.958121e-09 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.117        |
|    learning_rate        | 1e-06        |
|    loss                 | 113          |
|    n_updates            | 64280        |
|    policy_gradient_loss | -8.97e-07    |
|    value_loss           | 239          |
------------------------------------------
--------------------------------------------
| rollout/                |                |
|    ep

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 718          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 6438         |
|    time_elapsed         | 11994        |
|    total_timesteps      | 1648128      |
| train/                  |              |
|    approx_kl            | 3.958121e-09 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.311        |
|    learning_rate        | 1e-06        |
|    loss                 | 64           |
|    n_updates            | 64370        |
|    policy_gradient_loss | -1.56e-06    |
|    value_loss           | 108          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 718           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6447          |
|    time_elapsed         | 12012         |
|    total_timesteps      | 1650432       |
| train/                  |               |
|    approx_kl            | 1.9813888e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0113        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.118         |
|    n_updates            | 64460         |
|    policy_gradient_loss | -3.95e-05     |
|    value_loss           | 0.244         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 718           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6456          |
|    time_elapsed         | 12030         |
|    total_timesteps      | 1652736       |
| train/                  |               |
|    approx_kl            | 7.9046004e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0158        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0581        |
|    n_updates            | 64550         |
|    policy_gradient_loss | -8.94e-05     |
|    value_loss           | 0.0937        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 718           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6465          |
|    time_elapsed         | 12047         |
|    total_timesteps      | 1655040       |
| train/                  |               |
|    approx_kl            | 5.4528937e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0303        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0448        |
|    n_updates            | 64640         |
|    policy_gradient_loss | -5.1e-05      |
|    value_loss           | 0.0995        |
-------------------------------------------
------------------------------------------
| rollout/                |      

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.71e+04    |
|    ep_rew_mean          | 718         |
| time/                   |             |
|    fps                  | 137         |
|    iterations           | 6474        |
|    time_elapsed         | 12064       |
|    total_timesteps      | 1657344     |
| train/                  |             |
|    approx_kl            | 3.60189e-07 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -1.84       |
|    explained_variance   | -0.0466     |
|    learning_rate        | 1e-06       |
|    loss                 | 0.0461      |
|    n_updates            | 64730       |
|    policy_gradient_loss | -2.16e-05   |
|    value_loss           | 0.088       |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 718           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6483          |
|    time_elapsed         | 12081         |
|    total_timesteps      | 1659648       |
| train/                  |               |
|    approx_kl            | 8.0210157e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.00169      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0453        |
|    n_updates            | 64820         |
|    policy_gradient_loss | -5.59e-05     |
|    value_loss           | 0.0877        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 718           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6492          |
|    time_elapsed         | 12099         |
|    total_timesteps      | 1661952       |
| train/                  |               |
|    approx_kl            | 1.2526289e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.169        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0637        |
|    n_updates            | 64910         |
|    policy_gradient_loss | -9.03e-06     |
|    value_loss           | 0.129         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 718           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6501          |
|    time_elapsed         | 12116         |
|    total_timesteps      | 1664256       |
| train/                  |               |
|    approx_kl            | 3.3548567e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.0615       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.035         |
|    n_updates            | 65000         |
|    policy_gradient_loss | -0.000164     |
|    value_loss           | 0.0923        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 718           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6510          |
|    time_elapsed         | 12133         |
|    total_timesteps      | 1666560       |
| train/                  |               |
|    approx_kl            | 2.2700988e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0373        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0414        |
|    n_updates            | 65090         |
|    policy_gradient_loss | -4.09e-05     |
|    value_loss           | 0.0903        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 718          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 6519         |
|    time_elapsed         | 12150        |
|    total_timesteps      | 1668864      |
| train/                  |              |
|    approx_kl            | 9.359792e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.0568       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0346       |
|    n_updates            | 65180        |
|    policy_gradient_loss | -1.98e-05    |
|    value_loss           | 0.0802       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 718          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 6528         |
|    time_elapsed         | 12168        |
|    total_timesteps      | 1671168      |
| train/                  |              |
|    approx_kl            | 3.844034e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.000537    |
|    learning_rate        | 1e-06        |
|    loss                 | 0.105        |
|    n_updates            | 65270        |
|    policy_gradient_loss | -2.86e-05    |
|    value_loss           | 0.211        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 718           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6537          |
|    time_elapsed         | 12185         |
|    total_timesteps      | 1673472       |
| train/                  |               |
|    approx_kl            | 8.3679333e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.0141       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.129         |
|    n_updates            | 65360         |
|    policy_gradient_loss | -8.93e-05     |
|    value_loss           | 0.214         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 718           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6547          |
|    time_elapsed         | 12204         |
|    total_timesteps      | 1676032       |
| train/                  |               |
|    approx_kl            | 1.6461127e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.00185      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0554        |
|    n_updates            | 65460         |
|    policy_gradient_loss | -2.38e-05     |
|    value_loss           | 0.0968        |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 718           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6556          |
|    time_elapsed         | 12221         |
|    total_timesteps      | 1678336       |
| train/                  |               |
|    approx_kl            | 8.4983185e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.0322       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0402        |
|    n_updates            | 65550         |
|    policy_gradient_loss | -1.26e-05     |
|    value_loss           | 0.117         |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 718          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 6565         |
|    time_elapsed         | 12239        |
|    total_timesteps      | 1680640      |
| train/                  |              |
|    approx_kl            | 3.259629e-09 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 1.95e-05     |
|    learning_rate        | 1e-06        |
|    loss                 | 326          |
|    n_updates            | 65640        |
|    policy_gradient_loss | 5.84e-07     |
|    value_loss           | 658          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 718           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6574          |
|    time_elapsed         | 12256         |
|    total_timesteps      | 1682944       |
| train/                  |               |
|    approx_kl            | 1.8046703e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.000267     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0439        |
|    n_updates            | 65730         |
|    policy_gradient_loss | -0.000155     |
|    value_loss           | 0.103         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 718           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6583          |
|    time_elapsed         | 12273         |
|    total_timesteps      | 1685248       |
| train/                  |               |
|    approx_kl            | 1.6321428e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.148        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0486        |
|    n_updates            | 65820         |
|    policy_gradient_loss | -1.22e-05     |
|    value_loss           | 0.0988        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 718           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6592          |
|    time_elapsed         | 12290         |
|    total_timesteps      | 1687552       |
| train/                  |               |
|    approx_kl            | 5.7350844e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0117        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.107         |
|    n_updates            | 65910         |
|    policy_gradient_loss | -0.000236     |
|    value_loss           | 0.198         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 720           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6601          |
|    time_elapsed         | 12307         |
|    total_timesteps      | 1689856       |
| train/                  |               |
|    approx_kl            | 4.0512532e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.225         |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0392        |
|    n_updates            | 66000         |
|    policy_gradient_loss | -7.27e-05     |
|    value_loss           | 0.0882        |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 720           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6610          |
|    time_elapsed         | 12325         |
|    total_timesteps      | 1692160       |
| train/                  |               |
|    approx_kl            | 1.4735851e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.006         |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0342        |
|    n_updates            | 66090         |
|    policy_gradient_loss | -9.14e-05     |
|    value_loss           | 0.0854        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 720          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 6619         |
|    time_elapsed         | 12342        |
|    total_timesteps      | 1694464      |
| train/                  |              |
|    approx_kl            | 6.456394e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.000803     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0629       |
|    n_updates            | 66180        |
|    policy_gradient_loss | -7.06e-05    |
|    value_loss           | 0.123        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 720           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6628          |
|    time_elapsed         | 12359         |
|    total_timesteps      | 1696768       |
| train/                  |               |
|    approx_kl            | 8.1490725e-09 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 4.18e-05      |
|    learning_rate        | 1e-06         |
|    loss                 | 429           |
|    n_updates            | 66270         |
|    policy_gradient_loss | 5.95e-06      |
|    value_loss           | 820           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 720          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 6637         |
|    time_elapsed         | 12376        |
|    total_timesteps      | 1699072      |
| train/                  |              |
|    approx_kl            | 5.098991e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.0527       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.134        |
|    n_updates            | 66360        |
|    policy_gradient_loss | -1.63e-05    |
|    value_loss           | 0.232        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 720          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 6646         |
|    time_elapsed         | 12394        |
|    total_timesteps      | 1701376      |
| train/                  |              |
|    approx_kl            | 3.206078e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.0271      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.115        |
|    n_updates            | 66450        |
|    policy_gradient_loss | -4.32e-05    |
|    value_loss           | 0.241        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 720           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6655          |
|    time_elapsed         | 12411         |
|    total_timesteps      | 1703680       |
| train/                  |               |
|    approx_kl            | 6.9639646e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.0403       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0448        |
|    n_updates            | 66540         |
|    policy_gradient_loss | -7.05e-05     |
|    value_loss           | 0.0878        |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 720           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6664          |
|    time_elapsed         | 12428         |
|    total_timesteps      | 1705984       |
| train/                  |               |
|    approx_kl            | 3.4668483e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.00427       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0778        |
|    n_updates            | 66630         |
|    policy_gradient_loss | -6.31e-05     |
|    value_loss           | 0.14          |
-------------------------------------------
------------------------------------------
| rollout/                |      

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.71e+04    |
|    ep_rew_mean          | 720         |
| time/                   |             |
|    fps                  | 137         |
|    iterations           | 6673        |
|    time_elapsed         | 12445       |
|    total_timesteps      | 1708288     |
| train/                  |             |
|    approx_kl            | 6.07688e-08 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -1.84       |
|    explained_variance   | 0.302       |
|    learning_rate        | 1e-06       |
|    loss                 | 83.4        |
|    n_updates            | 66720       |
|    policy_gradient_loss | 1.26e-06    |
|    value_loss           | 161         |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 720          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 6683         |
|    time_elapsed         | 12465        |
|    total_timesteps      | 1710848      |
| train/                  |              |
|    approx_kl            | 4.627276e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.00143     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0489       |
|    n_updates            | 66820        |
|    policy_gradient_loss | -6.98e-05    |
|    value_loss           | 0.0978       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 721           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6692          |
|    time_elapsed         | 12482         |
|    total_timesteps      | 1713152       |
| train/                  |               |
|    approx_kl            | 1.7462298e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.676        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0408        |
|    n_updates            | 66910         |
|    policy_gradient_loss | -4.62e-06     |
|    value_loss           | 0.155         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 721           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6701          |
|    time_elapsed         | 12498         |
|    total_timesteps      | 1715456       |
| train/                  |               |
|    approx_kl            | 2.7171336e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.0548       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0486        |
|    n_updates            | 67000         |
|    policy_gradient_loss | -1.56e-05     |
|    value_loss           | 0.188         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 721           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6710          |
|    time_elapsed         | 12515         |
|    total_timesteps      | 1717760       |
| train/                  |               |
|    approx_kl            | 2.1560118e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0991        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0508        |
|    n_updates            | 67090         |
|    policy_gradient_loss | -1.95e-05     |
|    value_loss           | 0.0901        |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 721           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6719          |
|    time_elapsed         | 12533         |
|    total_timesteps      | 1720064       |
| train/                  |               |
|    approx_kl            | 2.1723099e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -6.44e-05     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0509        |
|    n_updates            | 67180         |
|    policy_gradient_loss | -1.34e-05     |
|    value_loss           | 0.0976        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 727          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 6728         |
|    time_elapsed         | 12550        |
|    total_timesteps      | 1722368      |
| train/                  |              |
|    approx_kl            | 9.778887e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.243        |
|    learning_rate        | 1e-06        |
|    loss                 | 7.15         |
|    n_updates            | 67270        |
|    policy_gradient_loss | 4.77e-06     |
|    value_loss           | 20.3         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 727           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6737          |
|    time_elapsed         | 12567         |
|    total_timesteps      | 1724672       |
| train/                  |               |
|    approx_kl            | 1.2065284e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.0148       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0404        |
|    n_updates            | 67360         |
|    policy_gradient_loss | -0.000106     |
|    value_loss           | 0.094         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 727           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6746          |
|    time_elapsed         | 12584         |
|    total_timesteps      | 1726976       |
| train/                  |               |
|    approx_kl            | 4.8661605e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0818        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0406        |
|    n_updates            | 67450         |
|    policy_gradient_loss | -5.26e-05     |
|    value_loss           | 0.0816        |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 727           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6756          |
|    time_elapsed         | 12603         |
|    total_timesteps      | 1729536       |
| train/                  |               |
|    approx_kl            | 7.9954043e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0317        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0408        |
|    n_updates            | 67550         |
|    policy_gradient_loss | -6.85e-05     |
|    value_loss           | 0.0846        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 731           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6765          |
|    time_elapsed         | 12621         |
|    total_timesteps      | 1731840       |
| train/                  |               |
|    approx_kl            | 4.2375177e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.00371       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0464        |
|    n_updates            | 67640         |
|    policy_gradient_loss | -1.35e-05     |
|    value_loss           | 0.291         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 731           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6774          |
|    time_elapsed         | 12638         |
|    total_timesteps      | 1734144       |
| train/                  |               |
|    approx_kl            | 1.4388934e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0499        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0446        |
|    n_updates            | 67730         |
|    policy_gradient_loss | -3.05e-05     |
|    value_loss           | 0.208         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 731           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6783          |
|    time_elapsed         | 12655         |
|    total_timesteps      | 1736448       |
| train/                  |               |
|    approx_kl            | 1.5669502e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.0402       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0433        |
|    n_updates            | 67820         |
|    policy_gradient_loss | -2.73e-05     |
|    value_loss           | 0.0954        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 731           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6792          |
|    time_elapsed         | 12672         |
|    total_timesteps      | 1738752       |
| train/                  |               |
|    approx_kl            | 4.1956082e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.0204       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0589        |
|    n_updates            | 67910         |
|    policy_gradient_loss | -1.87e-05     |
|    value_loss           | 0.0995        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 731           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6801          |
|    time_elapsed         | 12690         |
|    total_timesteps      | 1741056       |
| train/                  |               |
|    approx_kl            | 2.9802322e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0131        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0976        |
|    n_updates            | 68000         |
|    policy_gradient_loss | -3.28e-05     |
|    value_loss           | 0.228         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 731           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6810          |
|    time_elapsed         | 12707         |
|    total_timesteps      | 1743360       |
| train/                  |               |
|    approx_kl            | 3.6903657e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.00249       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.135         |
|    n_updates            | 68090         |
|    policy_gradient_loss | -3.86e-05     |
|    value_loss           | 0.257         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 731           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6819          |
|    time_elapsed         | 12724         |
|    total_timesteps      | 1745664       |
| train/                  |               |
|    approx_kl            | 3.5832636e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.052        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0523        |
|    n_updates            | 68180         |
|    policy_gradient_loss | -4.34e-05     |
|    value_loss           | 0.0872        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.69e+04     |
|    ep_rew_mean          | 731          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 6828         |
|    time_elapsed         | 12741        |
|    total_timesteps      | 1747968      |
| train/                  |              |
|    approx_kl            | 4.004687e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.155       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0474       |
|    n_updates            | 68270        |
|    policy_gradient_loss | -7.54e-05    |
|    value_loss           | 0.0944       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.68e+04     |
|    ep_rew_mean          | 735          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 6837         |
|    time_elapsed         | 12759        |
|    total_timesteps      | 1750272      |
| train/                  |              |
|    approx_kl            | 1.678709e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.049        |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0394       |
|    n_updates            | 68360        |
|    policy_gradient_loss | -3.2e-05     |
|    value_loss           | 0.0762       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.68e+04      |
|    ep_rew_mean          | 735           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6847          |
|    time_elapsed         | 12778         |
|    total_timesteps      | 1752832       |
| train/                  |               |
|    approx_kl            | 1.1834782e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.00701       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0401        |
|    n_updates            | 68460         |
|    policy_gradient_loss | -0.000101     |
|    value_loss           | 0.0881        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.68e+04      |
|    ep_rew_mean          | 735           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6856          |
|    time_elapsed         | 12795         |
|    total_timesteps      | 1755136       |
| train/                  |               |
|    approx_kl            | 1.6577542e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0594        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0434        |
|    n_updates            | 68550         |
|    policy_gradient_loss | -3.14e-05     |
|    value_loss           | 0.0926        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.68e+04     |
|    ep_rew_mean          | 735          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 6865         |
|    time_elapsed         | 12812        |
|    total_timesteps      | 1757440      |
| train/                  |              |
|    approx_kl            | 9.778887e-09 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.00166      |
|    learning_rate        | 1e-06        |
|    loss                 | 450          |
|    n_updates            | 68640        |
|    policy_gradient_loss | 1.64e-06     |
|    value_loss           | 872          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.68e+04     |
|    ep_rew_mean          | 735          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 6874         |
|    time_elapsed         | 12829        |
|    total_timesteps      | 1759744      |
| train/                  |              |
|    approx_kl            | 3.944151e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.0357      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0906       |
|    n_updates            | 68730        |
|    policy_gradient_loss | -3.57e-05    |
|    value_loss           | 0.235        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.68e+04     |
|    ep_rew_mean          | 735          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 6883         |
|    time_elapsed         | 12847        |
|    total_timesteps      | 1762048      |
| train/                  |              |
|    approx_kl            | 2.943445e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.0248       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.126        |
|    n_updates            | 68820        |
|    policy_gradient_loss | -0.000305    |
|    value_loss           | 0.235        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.68e+04     |
|    ep_rew_mean          | 735          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 6892         |
|    time_elapsed         | 12864        |
|    total_timesteps      | 1764352      |
| train/                  |              |
|    approx_kl            | 8.312054e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.00157      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0524       |
|    n_updates            | 68910        |
|    policy_gradient_loss | -7.01e-05    |
|    value_loss           | 0.0945       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.68e+04     |
|    ep_rew_mean          | 735          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 6902         |
|    time_elapsed         | 12883        |
|    total_timesteps      | 1766912      |
| train/                  |              |
|    approx_kl            | 2.243556e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.0672      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0604       |
|    n_updates            | 69010        |
|    policy_gradient_loss | -6.24e-05    |
|    value_loss           | 0.0981       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.68e+04      |
|    ep_rew_mean          | 735           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6912          |
|    time_elapsed         | 12902         |
|    total_timesteps      | 1769472       |
| train/                  |               |
|    approx_kl            | 1.1825468e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.00925      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0477        |
|    n_updates            | 69110         |
|    policy_gradient_loss | -0.000124     |
|    value_loss           | 0.0869        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.68e+04    |
|    ep_rew_mean          | 735         |
| time/                   |             |
|    fps                  | 137         |
|    iterations           | 6921        |
|    time_elapsed         | 12920       |
|    total_timesteps      | 1771776     |
| train/                  |             |
|    approx_kl            | 4.02797e-07 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -1.84       |
|    explained_variance   | -0.000193   |
|    learning_rate        | 1e-06       |
|    loss                 | 0.0352      |
|    n_updates            | 69200       |
|    policy_gradient_loss | -3.71e-05   |
|    value_loss           | 0.088       |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.68

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 734           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6930          |
|    time_elapsed         | 12937         |
|    total_timesteps      | 1774080       |
| train/                  |               |
|    approx_kl            | 2.7997885e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.0464       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.057         |
|    n_updates            | 69290         |
|    policy_gradient_loss | -0.000202     |
|    value_loss           | 0.212         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.69e+04     |
|    ep_rew_mean          | 734          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 6939         |
|    time_elapsed         | 12954        |
|    total_timesteps      | 1776384      |
| train/                  |              |
|    approx_kl            | 8.731149e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.0278       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0318       |
|    n_updates            | 69380        |
|    policy_gradient_loss | -5.92e-06    |
|    value_loss           | 0.0955       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.69e+04    |
|    ep_rew_mean          | 734         |
| time/                   |             |
|    fps                  | 137         |
|    iterations           | 6948        |
|    time_elapsed         | 12971       |
|    total_timesteps      | 1778688     |
| train/                  |             |
|    approx_kl            | 3.45055e-07 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -1.84       |
|    explained_variance   | -0.0264     |
|    learning_rate        | 1e-06       |
|    loss                 | 0.0432      |
|    n_updates            | 69470       |
|    policy_gradient_loss | -3.54e-05   |
|    value_loss           | 0.105       |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.69

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 734           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6957          |
|    time_elapsed         | 12989         |
|    total_timesteps      | 1780992       |
| train/                  |               |
|    approx_kl            | 7.7090226e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -3.22e-05     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0526        |
|    n_updates            | 69560         |
|    policy_gradient_loss | -7.73e-05     |
|    value_loss           | 0.0934        |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 734           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6966          |
|    time_elapsed         | 13006         |
|    total_timesteps      | 1783296       |
| train/                  |               |
|    approx_kl            | 1.3364479e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.028         |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0791        |
|    n_updates            | 69650         |
|    policy_gradient_loss | -6.97e-06     |
|    value_loss           | 0.197         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.69e+04     |
|    ep_rew_mean          | 734          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 6975         |
|    time_elapsed         | 13023        |
|    total_timesteps      | 1785600      |
| train/                  |              |
|    approx_kl            | 5.806796e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.000833     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0936       |
|    n_updates            | 69740        |
|    policy_gradient_loss | -7.35e-05    |
|    value_loss           | 0.235        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 734           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 6985          |
|    time_elapsed         | 13042         |
|    total_timesteps      | 1788160       |
| train/                  |               |
|    approx_kl            | 3.2922253e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.00471       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0472        |
|    n_updates            | 69840         |
|    policy_gradient_loss | -3.88e-05     |
|    value_loss           | 0.0925        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.69e+04     |
|    ep_rew_mean          | 734          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 6994         |
|    time_elapsed         | 13060        |
|    total_timesteps      | 1790464      |
| train/                  |              |
|    approx_kl            | 4.407484e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.0265      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0544       |
|    n_updates            | 69930        |
|    policy_gradient_loss | -5.66e-05    |
|    value_loss           | 0.0998       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.69e+04     |
|    ep_rew_mean          | 734          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 7004         |
|    time_elapsed         | 13079        |
|    total_timesteps      | 1793024      |
| train/                  |              |
|    approx_kl            | 1.143897e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.0351       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0606       |
|    n_updates            | 70030        |
|    policy_gradient_loss | -0.000185    |
|    value_loss           | 0.0943       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.69e+04      |
|    ep_rew_mean          | 734           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 7013          |
|    time_elapsed         | 13096         |
|    total_timesteps      | 1795328       |
| train/                  |               |
|    approx_kl            | 3.4202822e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.000382     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0424        |
|    n_updates            | 70120         |
|    policy_gradient_loss | -2.25e-05     |
|    value_loss           | 0.0975        |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 734           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 7023          |
|    time_elapsed         | 13115         |
|    total_timesteps      | 1797888       |
| train/                  |               |
|    approx_kl            | 1.3271347e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.0727       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.039         |
|    n_updates            | 70220         |
|    policy_gradient_loss | -5.64e-06     |
|    value_loss           | 0.139         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 734           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 7032          |
|    time_elapsed         | 13133         |
|    total_timesteps      | 1800192       |
| train/                  |               |
|    approx_kl            | 3.7881546e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.00346       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.045         |
|    n_updates            | 70310         |
|    policy_gradient_loss | -4.12e-05     |
|    value_loss           | 0.0936        |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 734          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 7041         |
|    time_elapsed         | 13150        |
|    total_timesteps      | 1802496      |
| train/                  |              |
|    approx_kl            | 6.973278e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.000248     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0312       |
|    n_updates            | 70400        |
|    policy_gradient_loss | -8.21e-05    |
|    value_loss           | 0.0901       |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 734           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 7050          |
|    time_elapsed         | 13167         |
|    total_timesteps      | 1804800       |
| train/                  |               |
|    approx_kl            | 1.8835999e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0169        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0494        |
|    n_updates            | 70490         |
|    policy_gradient_loss | -2.08e-05     |
|    value_loss           | 0.097         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 734           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 7059          |
|    time_elapsed         | 13184         |
|    total_timesteps      | 1807104       |
| train/                  |               |
|    approx_kl            | 3.8649887e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.328         |
|    learning_rate        | 1e-06         |
|    loss                 | 82.5          |
|    n_updates            | 70580         |
|    policy_gradient_loss | -5.62e-06     |
|    value_loss           | 172           |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 734          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 7068         |
|    time_elapsed         | 13201        |
|    total_timesteps      | 1809408      |
| train/                  |              |
|    approx_kl            | 1.329463e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.0112      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.114        |
|    n_updates            | 70670        |
|    policy_gradient_loss | -1.57e-05    |
|    value_loss           | 0.214        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 734          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 7077         |
|    time_elapsed         | 13219        |
|    total_timesteps      | 1811712      |
| train/                  |              |
|    approx_kl            | 3.790483e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.136        |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0359       |
|    n_updates            | 70760        |
|    policy_gradient_loss | -5.17e-05    |
|    value_loss           | 0.103        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 737           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 7086          |
|    time_elapsed         | 13236         |
|    total_timesteps      | 1814016       |
| train/                  |               |
|    approx_kl            | 6.7520887e-09 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0613        |
|    learning_rate        | 1e-06         |
|    loss                 | 522           |
|    n_updates            | 70850         |
|    policy_gradient_loss | -6.32e-07     |
|    value_loss           | 909           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 737           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 7095          |
|    time_elapsed         | 13253         |
|    total_timesteps      | 1816320       |
| train/                  |               |
|    approx_kl            | 1.2363307e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0725        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0506        |
|    n_updates            | 70940         |
|    policy_gradient_loss | -2.81e-05     |
|    value_loss           | 0.0886        |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 737          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 7104         |
|    time_elapsed         | 13270        |
|    total_timesteps      | 1818624      |
| train/                  |              |
|    approx_kl            | 8.896459e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.0581      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0522       |
|    n_updates            | 71030        |
|    policy_gradient_loss | -8.89e-05    |
|    value_loss           | 0.0967       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 737          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 7113         |
|    time_elapsed         | 13288        |
|    total_timesteps      | 1820928      |
| train/                  |              |
|    approx_kl            | 4.656613e-09 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.141        |
|    learning_rate        | 1e-06        |
|    loss                 | 521          |
|    n_updates            | 71120        |
|    policy_gradient_loss | -4.61e-07    |
|    value_loss           | 999          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 737          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 7122         |
|    time_elapsed         | 13305        |
|    total_timesteps      | 1823232      |
| train/                  |              |
|    approx_kl            | 1.839362e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.302        |
|    learning_rate        | 1e-06        |
|    loss                 | 75.8         |
|    n_updates            | 71210        |
|    policy_gradient_loss | 1.45e-05     |
|    value_loss           | 161          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 737           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 7131          |
|    time_elapsed         | 13322         |
|    total_timesteps      | 1825536       |
| train/                  |               |
|    approx_kl            | 4.4656917e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.00179      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.12          |
|    n_updates            | 71300         |
|    policy_gradient_loss | -5.35e-05     |
|    value_loss           | 0.231         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 737           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 7140          |
|    time_elapsed         | 13339         |
|    total_timesteps      | 1827840       |
| train/                  |               |
|    approx_kl            | 2.9872172e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.0647       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0618        |
|    n_updates            | 71390         |
|    policy_gradient_loss | -3.6e-05      |
|    value_loss           | 0.154         |
-------------------------------------------
--------------------------------------------
| rollout/                |    

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.71e+04    |
|    ep_rew_mean          | 742         |
| time/                   |             |
|    fps                  | 137         |
|    iterations           | 7149        |
|    time_elapsed         | 13357       |
|    total_timesteps      | 1830144     |
| train/                  |             |
|    approx_kl            | 4.33065e-08 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -1.84       |
|    explained_variance   | -0.324      |
|    learning_rate        | 1e-06       |
|    loss                 | 0.0414      |
|    n_updates            | 71480       |
|    policy_gradient_loss | -4.74e-06   |
|    value_loss           | 0.198       |
-----------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 742          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 7159         |
|    time_elapsed         | 13375        |
|    total_timesteps      | 1832704      |
| train/                  |              |
|    approx_kl            | 9.709038e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.466       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0782       |
|    n_updates            | 71580        |
|    policy_gradient_loss | -2.34e-05    |
|    value_loss           | 0.208        |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 742          |
| time/                   |              |
|    fps                  | 137          |
|    iterations           | 7168         |
|    time_elapsed         | 13392        |
|    total_timesteps      | 1835008      |
| train/                  |              |
|    approx_kl            | 3.760215e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.00677     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0426       |
|    n_updates            | 71670        |
|    policy_gradient_loss | -5.72e-05    |
|    value_loss           | 0.0903       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 742           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 7177          |
|    time_elapsed         | 13409         |
|    total_timesteps      | 1837312       |
| train/                  |               |
|    approx_kl            | 2.1327287e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.215        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0509        |
|    n_updates            | 71760         |
|    policy_gradient_loss | -2.05e-05     |
|    value_loss           | 0.119         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 742           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 7186          |
|    time_elapsed         | 13426         |
|    total_timesteps      | 1839616       |
| train/                  |               |
|    approx_kl            | 1.5599653e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0336        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0967        |
|    n_updates            | 71850         |
|    policy_gradient_loss | -4.09e-06     |
|    value_loss           | 0.313         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 742           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 7195          |
|    time_elapsed         | 13444         |
|    total_timesteps      | 1841920       |
| train/                  |               |
|    approx_kl            | 2.9196963e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.03          |
|    learning_rate        | 1e-06         |
|    loss                 | 0.116         |
|    n_updates            | 71940         |
|    policy_gradient_loss | -2.67e-05     |
|    value_loss           | 0.205         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 742           |
| time/                   |               |
|    fps                  | 137           |
|    iterations           | 7204          |
|    time_elapsed         | 13461         |
|    total_timesteps      | 1844224       |
| train/                  |               |
|    approx_kl            | 3.8882717e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.149        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0433        |
|    n_updates            | 72030         |
|    policy_gradient_loss | -5.23e-05     |
|    value_loss           | 0.0993        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 742           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7213          |
|    time_elapsed         | 13478         |
|    total_timesteps      | 1846528       |
| train/                  |               |
|    approx_kl            | 1.3739336e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.0463       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0487        |
|    n_updates            | 72120         |
|    policy_gradient_loss | -0.000157     |
|    value_loss           | 0.0904        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 746           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7222          |
|    time_elapsed         | 13495         |
|    total_timesteps      | 1848832       |
| train/                  |               |
|    approx_kl            | 1.3271347e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.391         |
|    learning_rate        | 1e-06         |
|    loss                 | 1.93          |
|    n_updates            | 72210         |
|    policy_gradient_loss | -4.08e-06     |
|    value_loss           | 4.64          |
-------------------------------------------
------------------------------------------
| rollout/                |      

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.71e+04    |
|    ep_rew_mean          | 746         |
| time/                   |             |
|    fps                  | 136         |
|    iterations           | 7231        |
|    time_elapsed         | 13513       |
|    total_timesteps      | 1851136     |
| train/                  |             |
|    approx_kl            | 6.64033e-07 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -1.84       |
|    explained_variance   | -0.196      |
|    learning_rate        | 1e-06       |
|    loss                 | 0.0552      |
|    n_updates            | 72300       |
|    policy_gradient_loss | -8.9e-05    |
|    value_loss           | 0.114       |
-----------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 746           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7241          |
|    time_elapsed         | 13532         |
|    total_timesteps      | 1853696       |
| train/                  |               |
|    approx_kl            | 1.4249235e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0543        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0427        |
|    n_updates            | 72400         |
|    policy_gradient_loss | -8.08e-06     |
|    value_loss           | 0.0837        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 746           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7250          |
|    time_elapsed         | 13549         |
|    total_timesteps      | 1856000       |
| train/                  |               |
|    approx_kl            | 4.5378692e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.122        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0892        |
|    n_updates            | 72490         |
|    policy_gradient_loss | -3.85e-05     |
|    value_loss           | 0.237         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 746           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7259          |
|    time_elapsed         | 13566         |
|    total_timesteps      | 1858304       |
| train/                  |               |
|    approx_kl            | 4.8428774e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.0134       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.137         |
|    n_updates            | 72580         |
|    policy_gradient_loss | -6.76e-05     |
|    value_loss           | 0.238         |
-------------------------------------------
-----------------------------------------
| rollout/                |       

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 746           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7268          |
|    time_elapsed         | 13584         |
|    total_timesteps      | 1860608       |
| train/                  |               |
|    approx_kl            | 1.0288786e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.000593     |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0421        |
|    n_updates            | 72670         |
|    policy_gradient_loss | -0.000122     |
|    value_loss           | 0.0908        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 748           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7277          |
|    time_elapsed         | 13601         |
|    total_timesteps      | 1862912       |
| train/                  |               |
|    approx_kl            | 3.2037497e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.00274       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0684        |
|    n_updates            | 72760         |
|    policy_gradient_loss | -4.92e-05     |
|    value_loss           | 0.127         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 748          |
| time/                   |              |
|    fps                  | 136          |
|    iterations           | 7286         |
|    time_elapsed         | 13618        |
|    total_timesteps      | 1865216      |
| train/                  |              |
|    approx_kl            | 5.378388e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.00778     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.07         |
|    n_updates            | 72850        |
|    policy_gradient_loss | -5.69e-05    |
|    value_loss           | 0.13         |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 748           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7295          |
|    time_elapsed         | 13635         |
|    total_timesteps      | 1867520       |
| train/                  |               |
|    approx_kl            | 1.2340024e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.337         |
|    learning_rate        | 1e-06         |
|    loss                 | 82.6          |
|    n_updates            | 72940         |
|    policy_gradient_loss | 1.15e-05      |
|    value_loss           | 178           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 748           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7304          |
|    time_elapsed         | 13652         |
|    total_timesteps      | 1869824       |
| train/                  |               |
|    approx_kl            | 3.3946708e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.00221      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.042         |
|    n_updates            | 73030         |
|    policy_gradient_loss | -4.11e-05     |
|    value_loss           | 0.0878        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 748          |
| time/                   |              |
|    fps                  | 136          |
|    iterations           | 7313         |
|    time_elapsed         | 13670        |
|    total_timesteps      | 1872128      |
| train/                  |              |
|    approx_kl            | 6.402843e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.064       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.115        |
|    n_updates            | 73120        |
|    policy_gradient_loss | -4.46e-06    |
|    value_loss           | 0.321        |
------------------------------------------
--------------------------------------------
| rollout/                |                |
|    ep

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 748           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7322          |
|    time_elapsed         | 13687         |
|    total_timesteps      | 1874432       |
| train/                  |               |
|    approx_kl            | 5.0873496e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 4.66e-05      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.1           |
|    n_updates            | 73210         |
|    policy_gradient_loss | -5.33e-05     |
|    value_loss           | 0.227         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 748          |
| time/                   |              |
|    fps                  | 136          |
|    iterations           | 7331         |
|    time_elapsed         | 13704        |
|    total_timesteps      | 1876736      |
| train/                  |              |
|    approx_kl            | 6.472692e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.261       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0573       |
|    n_updates            | 73300        |
|    policy_gradient_loss | -1.27e-05    |
|    value_loss           | 0.109        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 749           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7341          |
|    time_elapsed         | 13723         |
|    total_timesteps      | 1879296       |
| train/                  |               |
|    approx_kl            | 1.9837171e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0798        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0408        |
|    n_updates            | 73400         |
|    policy_gradient_loss | -4.39e-05     |
|    value_loss           | 0.0822        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 749           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7350          |
|    time_elapsed         | 13741         |
|    total_timesteps      | 1881600       |
| train/                  |               |
|    approx_kl            | 8.5448846e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0848        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0364        |
|    n_updates            | 73490         |
|    policy_gradient_loss | -1.46e-05     |
|    value_loss           | 0.0814        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 749           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7359          |
|    time_elapsed         | 13758         |
|    total_timesteps      | 1883904       |
| train/                  |               |
|    approx_kl            | 1.8929131e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.00101      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0375        |
|    n_updates            | 73580         |
|    policy_gradient_loss | -8.97e-06     |
|    value_loss           | 0.0964        |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 749          |
| time/                   |              |
|    fps                  | 136          |
|    iterations           | 7369         |
|    time_elapsed         | 13778        |
|    total_timesteps      | 1886464      |
| train/                  |              |
|    approx_kl            | 4.840549e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.0721      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0405       |
|    n_updates            | 73680        |
|    policy_gradient_loss | -6.23e-05    |
|    value_loss           | 0.0925       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 749           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7379          |
|    time_elapsed         | 13797         |
|    total_timesteps      | 1889024       |
| train/                  |               |
|    approx_kl            | 1.9487925e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.00018       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.177         |
|    n_updates            | 73780         |
|    policy_gradient_loss | -5.3e-05      |
|    value_loss           | 0.258         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 749           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7388          |
|    time_elapsed         | 13815         |
|    total_timesteps      | 1891328       |
| train/                  |               |
|    approx_kl            | 2.4936162e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.0164       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0817        |
|    n_updates            | 73870         |
|    policy_gradient_loss | -3.49e-05     |
|    value_loss           | 0.214         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 749          |
| time/                   |              |
|    fps                  | 136          |
|    iterations           | 7397         |
|    time_elapsed         | 13832        |
|    total_timesteps      | 1893632      |
| train/                  |              |
|    approx_kl            | 6.784685e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.000376     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0453       |
|    n_updates            | 73960        |
|    policy_gradient_loss | -4.98e-05    |
|    value_loss           | 0.0877       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.72e+04      |
|    ep_rew_mean          | 748           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7406          |
|    time_elapsed         | 13849         |
|    total_timesteps      | 1895936       |
| train/                  |               |
|    approx_kl            | 1.1175871e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0553        |
|    learning_rate        | 1e-06         |
|    loss                 | 231           |
|    n_updates            | 74050         |
|    policy_gradient_loss | 1.39e-06      |
|    value_loss           | 480           |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.72e+04     |
|    ep_rew_mean          | 748          |
| time/                   |              |
|    fps                  | 136          |
|    iterations           | 7415         |
|    time_elapsed         | 13866        |
|    total_timesteps      | 1898240      |
| train/                  |              |
|    approx_kl            | 3.655441e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.000209     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0424       |
|    n_updates            | 74140        |
|    policy_gradient_loss | -6.94e-06    |
|    value_loss           | 0.108        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.72e+04     |
|    ep_rew_mean          | 748          |
| time/                   |              |
|    fps                  | 136          |
|    iterations           | 7424         |
|    time_elapsed         | 13884        |
|    total_timesteps      | 1900544      |
| train/                  |              |
|    approx_kl            | 3.243331e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.0138      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0326       |
|    n_updates            | 74230        |
|    policy_gradient_loss | -5.01e-05    |
|    value_loss           | 0.0896       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.72e+04     |
|    ep_rew_mean          | 748          |
| time/                   |              |
|    fps                  | 136          |
|    iterations           | 7433         |
|    time_elapsed         | 13901        |
|    total_timesteps      | 1902848      |
| train/                  |              |
|    approx_kl            | 7.012859e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.00503      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0446       |
|    n_updates            | 74320        |
|    policy_gradient_loss | -6.94e-05    |
|    value_loss           | 0.0939       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.72e+04     |
|    ep_rew_mean          | 748          |
| time/                   |              |
|    fps                  | 136          |
|    iterations           | 7442         |
|    time_elapsed         | 13918        |
|    total_timesteps      | 1905152      |
| train/                  |              |
|    approx_kl            | 5.727634e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.00198      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.104        |
|    n_updates            | 74410        |
|    policy_gradient_loss | -5.53e-06    |
|    value_loss           | 0.229        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 753          |
| time/                   |              |
|    fps                  | 136          |
|    iterations           | 7451         |
|    time_elapsed         | 13935        |
|    total_timesteps      | 1907456      |
| train/                  |              |
|    approx_kl            | 7.683411e-09 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 9.95e-06     |
|    learning_rate        | 1e-06        |
|    loss                 | 274          |
|    n_updates            | 74500        |
|    policy_gradient_loss | -2.78e-07    |
|    value_loss           | 535          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 753          |
| time/                   |              |
|    fps                  | 136          |
|    iterations           | 7460         |
|    time_elapsed         | 13952        |
|    total_timesteps      | 1909760      |
| train/                  |              |
|    approx_kl            | 1.215376e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.275       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0421       |
|    n_updates            | 74590        |
|    policy_gradient_loss | -1.43e-05    |
|    value_loss           | 0.101        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.71e+04   |
|    ep_rew_mean          | 753        |
| time/                   |            |
|    fps                  | 136        |
|    iterations           | 7470       |
|    time_elapsed         | 13972      |
|    total_timesteps      | 1912320    |
| train/                  |            |
|    approx_kl            | 2.8871e-07 |
|    clip_fraction        | 0          |
|    clip_range           | 0.2        |
|    entropy_loss         | -1.84      |
|    explained_variance   | 0.0427     |
|    learning_rate        | 1e-06      |
|    loss                 | 0.043      |
|    n_updates            | 74690      |
|    policy_gradient_loss | -4.45e-05  |
|    value_loss           | 0.0832     |
----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_re

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 753          |
| time/                   |              |
|    fps                  | 136          |
|    iterations           | 7480         |
|    time_elapsed         | 13991        |
|    total_timesteps      | 1914880      |
| train/                  |              |
|    approx_kl            | 3.532041e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.0611      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.046        |
|    n_updates            | 74790        |
|    policy_gradient_loss | -2.45e-05    |
|    value_loss           | 0.0936       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 753          |
| time/                   |              |
|    fps                  | 136          |
|    iterations           | 7489         |
|    time_elapsed         | 14008        |
|    total_timesteps      | 1917184      |
| train/                  |              |
|    approx_kl            | 6.589107e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.0384       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0752       |
|    n_updates            | 74880        |
|    policy_gradient_loss | -1.26e-05    |
|    value_loss           | 0.225        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 753          |
| time/                   |              |
|    fps                  | 136          |
|    iterations           | 7498         |
|    time_elapsed         | 14025        |
|    total_timesteps      | 1919488      |
| train/                  |              |
|    approx_kl            | 2.773013e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.00712     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0964       |
|    n_updates            | 74970        |
|    policy_gradient_loss | -5.16e-05    |
|    value_loss           | 0.231        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 753           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7507          |
|    time_elapsed         | 14043         |
|    total_timesteps      | 1921792       |
| train/                  |               |
|    approx_kl            | 1.8812716e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.116        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0528        |
|    n_updates            | 75060         |
|    policy_gradient_loss | -2.71e-05     |
|    value_loss           | 0.0972        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 753           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7516          |
|    time_elapsed         | 14060         |
|    total_timesteps      | 1924096       |
| train/                  |               |
|    approx_kl            | 1.9092113e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.297         |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0293        |
|    n_updates            | 75150         |
|    policy_gradient_loss | -1.26e-05     |
|    value_loss           | 0.0935        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 753           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7525          |
|    time_elapsed         | 14077         |
|    total_timesteps      | 1926400       |
| train/                  |               |
|    approx_kl            | 3.6275014e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0444        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0399        |
|    n_updates            | 75240         |
|    policy_gradient_loss | -4.74e-05     |
|    value_loss           | 0.0865        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 753           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7534          |
|    time_elapsed         | 14094         |
|    total_timesteps      | 1928704       |
| train/                  |               |
|    approx_kl            | 5.1921234e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.211        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0612        |
|    n_updates            | 75330         |
|    policy_gradient_loss | -4.62e-06     |
|    value_loss           | 0.122         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 753          |
| time/                   |              |
|    fps                  | 136          |
|    iterations           | 7543         |
|    time_elapsed         | 14112        |
|    total_timesteps      | 1931008      |
| train/                  |              |
|    approx_kl            | 1.701992e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.202        |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0386       |
|    n_updates            | 75420        |
|    policy_gradient_loss | -2.59e-05    |
|    value_loss           | 0.0679       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.72e+04      |
|    ep_rew_mean          | 751           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7553          |
|    time_elapsed         | 14131         |
|    total_timesteps      | 1933568       |
| train/                  |               |
|    approx_kl            | 2.7311035e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.223         |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0293        |
|    n_updates            | 75520         |
|    policy_gradient_loss | -4.67e-05     |
|    value_loss           | 0.067         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.72e+04      |
|    ep_rew_mean          | 751           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7562          |
|    time_elapsed         | 14148         |
|    total_timesteps      | 1935872       |
| train/                  |               |
|    approx_kl            | 2.7101487e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0366        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0374        |
|    n_updates            | 75610         |
|    policy_gradient_loss | -3.56e-05     |
|    value_loss           | 0.0908        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.72e+04     |
|    ep_rew_mean          | 751          |
| time/                   |              |
|    fps                  | 136          |
|    iterations           | 7571         |
|    time_elapsed         | 14165        |
|    total_timesteps      | 1938176      |
| train/                  |              |
|    approx_kl            | 9.010546e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.0386      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0563       |
|    n_updates            | 75700        |
|    policy_gradient_loss | -0.000121    |
|    value_loss           | 0.109        |
------------------------------------------
--------------------------------------------
| rollout/                |                |
|    ep

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.72e+04      |
|    ep_rew_mean          | 751           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7581          |
|    time_elapsed         | 14185         |
|    total_timesteps      | 1940736       |
| train/                  |               |
|    approx_kl            | 3.2084063e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.14         |
|    learning_rate        | 1e-06         |
|    loss                 | 0.144         |
|    n_updates            | 75800         |
|    policy_gradient_loss | -4.62e-05     |
|    value_loss           | 0.28          |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.72e+04     |
|    ep_rew_mean          | 751          |
| time/                   |              |
|    fps                  | 136          |
|    iterations           | 7591         |
|    time_elapsed         | 14204        |
|    total_timesteps      | 1943296      |
| train/                  |              |
|    approx_kl            | 6.388873e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.0278      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.106        |
|    n_updates            | 75900        |
|    policy_gradient_loss | -6.53e-05    |
|    value_loss           | 0.275        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.72e+04      |
|    ep_rew_mean          | 757           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7600          |
|    time_elapsed         | 14221         |
|    total_timesteps      | 1945600       |
| train/                  |               |
|    approx_kl            | 1.7671846e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0383        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0603        |
|    n_updates            | 75990         |
|    policy_gradient_loss | -7.01e-06     |
|    value_loss           | 0.0962        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.72e+04      |
|    ep_rew_mean          | 757           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7609          |
|    time_elapsed         | 14238         |
|    total_timesteps      | 1947904       |
| train/                  |               |
|    approx_kl            | 5.4831617e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.139         |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0359        |
|    n_updates            | 76080         |
|    policy_gradient_loss | -7.28e-05     |
|    value_loss           | 0.0719        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.72e+04      |
|    ep_rew_mean          | 757           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7618          |
|    time_elapsed         | 14256         |
|    total_timesteps      | 1950208       |
| train/                  |               |
|    approx_kl            | 2.4284236e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.255        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.055         |
|    n_updates            | 76170         |
|    policy_gradient_loss | -4.47e-05     |
|    value_loss           | 0.106         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.72e+04      |
|    ep_rew_mean          | 757           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7627          |
|    time_elapsed         | 14273         |
|    total_timesteps      | 1952512       |
| train/                  |               |
|    approx_kl            | 7.2829425e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0163        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0478        |
|    n_updates            | 76260         |
|    policy_gradient_loss | -0.000141     |
|    value_loss           | 0.0967        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.72e+04     |
|    ep_rew_mean          | 757          |
| time/                   |              |
|    fps                  | 136          |
|    iterations           | 7636         |
|    time_elapsed         | 14290        |
|    total_timesteps      | 1954816      |
| train/                  |              |
|    approx_kl            | 7.706694e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.00775     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.219        |
|    n_updates            | 76350        |
|    policy_gradient_loss | -4.42e-05    |
|    value_loss           | 0.433        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.72e+04      |
|    ep_rew_mean          | 757           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7645          |
|    time_elapsed         | 14307         |
|    total_timesteps      | 1957120       |
| train/                  |               |
|    approx_kl            | 3.9301813e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.00463      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0952        |
|    n_updates            | 76440         |
|    policy_gradient_loss | -4.86e-05     |
|    value_loss           | 0.222         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.72e+04     |
|    ep_rew_mean          | 757          |
| time/                   |              |
|    fps                  | 136          |
|    iterations           | 7654         |
|    time_elapsed         | 14324        |
|    total_timesteps      | 1959424      |
| train/                  |              |
|    approx_kl            | 2.856832e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.00023      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0429       |
|    n_updates            | 76530        |
|    policy_gradient_loss | -0.000194    |
|    value_loss           | 0.114        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.72e+04     |
|    ep_rew_mean          | 757          |
| time/                   |              |
|    fps                  | 136          |
|    iterations           | 7663         |
|    time_elapsed         | 14342        |
|    total_timesteps      | 1961728      |
| train/                  |              |
|    approx_kl            | 6.342307e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.0126       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0511       |
|    n_updates            | 76620        |
|    policy_gradient_loss | -5.66e-05    |
|    value_loss           | 0.0988       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 756          |
| time/                   |              |
|    fps                  | 136          |
|    iterations           | 7672         |
|    time_elapsed         | 14359        |
|    total_timesteps      | 1964032      |
| train/                  |              |
|    approx_kl            | 2.561137e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.148        |
|    learning_rate        | 1e-06        |
|    loss                 | 2.98         |
|    n_updates            | 76710        |
|    policy_gradient_loss | -5.93e-06    |
|    value_loss           | 6.18         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 756           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7682          |
|    time_elapsed         | 14378         |
|    total_timesteps      | 1966592       |
| train/                  |               |
|    approx_kl            | 1.4977995e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.0302       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.056         |
|    n_updates            | 76810         |
|    policy_gradient_loss | -0.000132     |
|    value_loss           | 0.108         |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 756          |
| time/                   |              |
|    fps                  | 136          |
|    iterations           | 7691         |
|    time_elapsed         | 14396        |
|    total_timesteps      | 1968896      |
| train/                  |              |
|    approx_kl            | 1.785811e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.0794       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0559       |
|    n_updates            | 76900        |
|    policy_gradient_loss | -3.41e-05    |
|    value_loss           | 0.0847       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 756          |
| time/                   |              |
|    fps                  | 136          |
|    iterations           | 7700         |
|    time_elapsed         | 14414        |
|    total_timesteps      | 1971200      |
| train/                  |              |
|    approx_kl            | 1.094304e-08 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | -0.0263      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.15         |
|    n_updates            | 76990        |
|    policy_gradient_loss | -6.84e-06    |
|    value_loss           | 0.293        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 756           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7709          |
|    time_elapsed         | 14431         |
|    total_timesteps      | 1973504       |
| train/                  |               |
|    approx_kl            | 1.8905848e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0406        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.127         |
|    n_updates            | 77080         |
|    policy_gradient_loss | -5.28e-05     |
|    value_loss           | 0.218         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 756           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7718          |
|    time_elapsed         | 14448         |
|    total_timesteps      | 1975808       |
| train/                  |               |
|    approx_kl            | 1.0011718e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.385         |
|    learning_rate        | 1e-06         |
|    loss                 | 76.7          |
|    n_updates            | 77170         |
|    policy_gradient_loss | 8.04e-07      |
|    value_loss           | 117           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 756           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7727          |
|    time_elapsed         | 14465         |
|    total_timesteps      | 1978112       |
| train/                  |               |
|    approx_kl            | 1.6763806e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.437         |
|    learning_rate        | 1e-06         |
|    loss                 | 107           |
|    n_updates            | 77260         |
|    policy_gradient_loss | 1.65e-05      |
|    value_loss           | 166           |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 756           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7736          |
|    time_elapsed         | 14483         |
|    total_timesteps      | 1980416       |
| train/                  |               |
|    approx_kl            | 4.2957254e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.00176       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.045         |
|    n_updates            | 77350         |
|    policy_gradient_loss | -7.89e-05     |
|    value_loss           | 0.0854        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 756           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7745          |
|    time_elapsed         | 14500         |
|    total_timesteps      | 1982720       |
| train/                  |               |
|    approx_kl            | 6.9546513e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.123        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0621        |
|    n_updates            | 77440         |
|    policy_gradient_loss | -5.1e-05      |
|    value_loss           | 0.105         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 756          |
| time/                   |              |
|    fps                  | 136          |
|    iterations           | 7754         |
|    time_elapsed         | 14517        |
|    total_timesteps      | 1985024      |
| train/                  |              |
|    approx_kl            | 3.883615e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.00359      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0385       |
|    n_updates            | 77530        |
|    policy_gradient_loss | -3.34e-05    |
|    value_loss           | 0.0898       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 759           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7763          |
|    time_elapsed         | 14534         |
|    total_timesteps      | 1987328       |
| train/                  |               |
|    approx_kl            | 1.1525117e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.103         |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0419        |
|    n_updates            | 77620         |
|    policy_gradient_loss | -2.89e-05     |
|    value_loss           | 0.0881        |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 759           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7772          |
|    time_elapsed         | 14551         |
|    total_timesteps      | 1989632       |
| train/                  |               |
|    approx_kl            | 3.8486905e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.0954       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.047         |
|    n_updates            | 77710         |
|    policy_gradient_loss | -9.51e-05     |
|    value_loss           | 0.0945        |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.71e+04     |
|    ep_rew_mean          | 759          |
| time/                   |              |
|    fps                  | 136          |
|    iterations           | 7781         |
|    time_elapsed         | 14569        |
|    total_timesteps      | 1991936      |
| train/                  |              |
|    approx_kl            | 4.398171e-07 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.0596       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0392       |
|    n_updates            | 77800        |
|    policy_gradient_loss | -8.52e-05    |
|    value_loss           | 0.0827       |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 759           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7790          |
|    time_elapsed         | 14586         |
|    total_timesteps      | 1994240       |
| train/                  |               |
|    approx_kl            | 1.1641532e-08 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.317         |
|    learning_rate        | 1e-06         |
|    loss                 | 312           |
|    n_updates            | 77890         |
|    policy_gradient_loss | 5.79e-06      |
|    value_loss           | 652           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 759           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7799          |
|    time_elapsed         | 14603         |
|    total_timesteps      | 1996544       |
| train/                  |               |
|    approx_kl            | 4.1909516e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.00231       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.139         |
|    n_updates            | 77980         |
|    policy_gradient_loss | -5.59e-05     |
|    value_loss           | 0.244         |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.71e+04      |
|    ep_rew_mean          | 759           |
| time/                   |               |
|    fps                  | 136           |
|    iterations           | 7808          |
|    time_elapsed         | 14620         |
|    total_timesteps      | 1998848       |
| train/                  |               |
|    approx_kl            | 2.8405339e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | -0.0111       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.102         |
|    n_updates            | 78070         |
|    policy_gradient_loss | -2.22e-05     |
|    value_loss           | 0.214         |
-------------------------------------------
-------------------------------------------
| rollout/                |     

<stable_baselines3.ppo.ppo.PPO at 0x26a106d8820>

In [9]:
model.save("ppo_mlp_model_seed20")