In [1]:
!pip install gym_super_mario_bros==7.3.0 nes_py



In [2]:
# Import the game
import gym_super_mario_bros
# Import the Joypad wrapper
from nes_py.wrappers import JoypadSpace
# Import the SIMPLIFIED controls
from gym_super_mario_bros.actions import SIMPLE_MOVEMENT

In [3]:
!pip install torch==1.10.1+cu113 torchvision==0.11.2+cu113 torchaudio===0.10.1+cu113 -f https://download.pytorch.org/whl/cu113/torch_stable.html

Looking in links: https://download.pytorch.org/whl/cu113/torch_stable.html


In [4]:
# Install stable baselines 3
!pip install stable-baselines3[extra]



In [5]:
# Import Frame Stacker Wrapper and GrayScaling Wrapper
from gym.wrappers import GrayScaleObservation
# Import Vectorization Wrappers
from stable_baselines3.common.vec_env import VecFrameStack, DummyVecEnv
# Import Matplotlib to show the impact of frame stacking
from matplotlib import pyplot as plt
from stable_baselines3.common.logger import TensorBoardOutputFormat

In [6]:
# Create the 'SuperMarioBros-v0' environment and wrap it in JoypadSpace with
# the SIMPLE_MOVEMENT action list, in a single expression.
env = JoypadSpace(
    gym_super_mario_bros.make('SuperMarioBros-v0'),
    SIMPLE_MOVEMENT,
)

In [7]:
# Import os for file path management
import os 
# Import PPO for model
from stable_baselines3 import PPO
# Import Base Callback for saving models
from stable_baselines3.common.callbacks import BaseCallback

In [8]:
class TrainAndLoggingCallback(BaseCallback):
    """Periodically write a checkpoint of the model being trained.

    Every ``check_freq`` calls to ``_on_step`` the current model is saved to
    ``<save_path>/best_model_<n_calls>``. Despite the ``best_model_`` prefix,
    no performance comparison is made: each file is a plain periodic snapshot.

    Args:
        check_freq: Number of callback steps between two checkpoints. Must be
            greater than zero.
        save_path: Directory the checkpoints are written to. ``None`` disables
            saving entirely.
        verbose: Verbosity level, forwarded to ``BaseCallback``.

    Raises:
        ValueError: If ``check_freq`` is not greater than zero.
    """

    def __init__(self, check_freq, save_path, verbose=1):
        super().__init__(verbose)
        # Fail at construction time rather than with a ZeroDivisionError in the
        # middle of a training run.
        if check_freq <= 0:
            raise ValueError(
                'check_freq must be a positive number, got {!r}'.format(check_freq)
            )
        self.check_freq = check_freq
        self.save_path = save_path

    def _init_callback(self):
        """Create the checkpoint directory if a save path was given."""
        if self.save_path is not None:
            os.makedirs(self.save_path, exist_ok=True)

    def _on_step(self):
        """Save a checkpoint on every ``check_freq``-th call; always return True."""
        # save_path=None is accepted by _init_callback, so it must be tolerated
        # here as well instead of being passed to os.path.join.
        if self.save_path is not None and self.n_calls % self.check_freq == 0:
            model_path = os.path.join(self.save_path, 'best_model_{}'.format(self.n_calls))
            self.model.save(model_path)

        # This callback never asks for training to stop.
        return True

In [9]:
# Directory passed to PPO as `tensorboard_log`.
LOG_DIR = './logs/'
# Directory passed to the checkpoint callback as `save_path`.
CHECKPOINT_DIR = './train/'

In [10]:
# Checkpoint callback: saves the model into CHECKPOINT_DIR every 10,000
# callback steps.
callback = TrainAndLoggingCallback(
    save_path=CHECKPOINT_DIR,
    check_freq=10_000,
)

In [11]:
# PPO agent using the 'CnnPolicy' on the Mario environment; training metrics
# are written under LOG_DIR for TensorBoard.
model = PPO(
    'CnnPolicy',
    env,
    learning_rate=1e-6,
    n_steps=512,
    tensorboard_log=LOG_DIR,
    verbose=1,
)

Using cuda device
Wrapping the env with a `Monitor` wrapper
Wrapping the env in a DummyVecEnv.
Wrapping the env in a VecTransposeImage.


In [14]:
# Train for two million timesteps, checkpointing through `callback`.
# NOTE(review): the captured output below logs to PPO_14 and already reports
# n_updates=11750 at iteration 2, which suggests learn() had been run on this
# model object before - confirm the results with Restart Kernel -> Run All.
model.learn(
    callback=callback,
    total_timesteps=2_000_000,
)

Logging to ./logs/PPO_14
----------------------------
| time/              |     |
|    fps             | 297 |
|    iterations      | 1   |
|    time_elapsed    | 1   |
|    total_timesteps | 512 |
----------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 169          |
|    iterations           | 2            |
|    time_elapsed         | 6            |
|    total_timesteps      | 1024         |
| train/                  |              |
|    approx_kl            | 0.0015186183 |
|    clip_fraction        | 0.00527      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.357       |
|    explained_variance   | 0.889        |
|    learning_rate        | 1e-06        |
|    loss                 | 49.8         |
|    n_updates            | 11750        |
|    policy_gradient_loss | -0.0008      |
|    value_loss           | 127          |
-----------------------------------------

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 800           |
|    ep_rew_mean          | 1.52e+03      |
| time/                   |               |
|    fps                  | 124           |
|    iterations           | 11            |
|    time_elapsed         | 45            |
|    total_timesteps      | 5632          |
| train/                  |               |
|    approx_kl            | 0.00039878802 |
|    clip_fraction        | 0.00645       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.222        |
|    explained_variance   | 0.715         |
|    learning_rate        | 1e-06         |
|    loss                 | 134           |
|    n_updates            | 11840         |
|    policy_gradient_loss | -0.00107      |
|    value_loss           | 478           |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 871          |
|    ep_rew_mean          | 1.56e+03     |
| time/                   |              |
|    fps                  | 119          |
|    iterations           | 21           |
|    time_elapsed         | 89           |
|    total_timesteps      | 10752        |
| train/                  |              |
|    approx_kl            | 0.0027917204 |
|    clip_fraction        | 0.00996      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.367       |
|    explained_variance   | 0.764        |
|    learning_rate        | 1e-06        |
|    loss                 | 147          |
|    n_updates            | 11940        |
|    policy_gradient_loss | -0.00354     |
|    value_loss           | 327          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 867           |
|    ep_rew_mean          | 1.54e+03      |
| time/                   |               |
|    fps                  | 118           |
|    iterations           | 31            |
|    time_elapsed         | 133           |
|    total_timesteps      | 15872         |
| train/                  |               |
|    approx_kl            | 0.00014226418 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.265        |
|    explained_variance   | 0.836         |
|    learning_rate        | 1e-06         |
|    loss                 | 112           |
|    n_updates            | 12040         |
|    policy_gradient_loss | 9.04e-05      |
|    value_loss           | 310           |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 889           |
|    ep_rew_mean          | 1.59e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 41            |
|    time_elapsed         | 178           |
|    total_timesteps      | 20992         |
| train/                  |               |
|    approx_kl            | 0.00037063519 |
|    clip_fraction        | 0.000586      |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.349        |
|    explained_variance   | 0.508         |
|    learning_rate        | 1e-06         |
|    loss                 | 649           |
|    n_updates            | 12140         |
|    policy_gradient_loss | 0.000184      |
|    value_loss           | 785           |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 856          |
|    ep_rew_mean          | 1.56e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 51           |
|    time_elapsed         | 222          |
|    total_timesteps      | 26112        |
| train/                  |              |
|    approx_kl            | 0.0009904312 |
|    clip_fraction        | 0.00293      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.24        |
|    explained_variance   | 0.529        |
|    learning_rate        | 1e-06        |
|    loss                 | 87           |
|    n_updates            | 12240        |
|    policy_gradient_loss | -0.00102     |
|    value_loss           | 203          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 854           |
|    ep_rew_mean          | 1.55e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 60            |
|    time_elapsed         | 262           |
|    total_timesteps      | 30720         |
| train/                  |               |
|    approx_kl            | 8.2389684e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.243        |
|    explained_variance   | 0.392         |
|    learning_rate        | 1e-06         |
|    loss                 | 565           |
|    n_updates            | 12330         |
|    policy_gradient_loss | -3.23e-05     |
|    value_loss           | 798           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 858          |
|    ep_rew_mean          | 1.58e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 69           |
|    time_elapsed         | 301          |
|    total_timesteps      | 35328        |
| train/                  |              |
|    approx_kl            | 0.0006272334 |
|    clip_fraction        | 0.00117      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.3         |
|    explained_variance   | 0.844        |
|    learning_rate        | 1e-06        |
|    loss                 | 153          |
|    n_updates            | 12420        |
|    policy_gradient_loss | -0.000834    |
|    value_loss           | 335          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 851          |
|    ep_rew_mean          | 1.55e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 78           |
|    time_elapsed         | 341          |
|    total_timesteps      | 39936        |
| train/                  |              |
|    approx_kl            | 0.0008229456 |
|    clip_fraction        | 0.0111       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.226       |
|    explained_variance   | 0.76         |
|    learning_rate        | 1e-06        |
|    loss                 | 251          |
|    n_updates            | 12510        |
|    policy_gradient_loss | -0.00236     |
|    value_loss           | 722          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 853          |
|    ep_rew_mean          | 1.58e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 87           |
|    time_elapsed         | 380          |
|    total_timesteps      | 44544        |
| train/                  |              |
|    approx_kl            | 0.0004762255 |
|    clip_fraction        | 0.00117      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.243       |
|    explained_variance   | 0.817        |
|    learning_rate        | 1e-06        |
|    loss                 | 50.5         |
|    n_updates            | 12600        |
|    policy_gradient_loss | 4.34e-05     |
|    value_loss           | 163          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 876           |
|    ep_rew_mean          | 1.61e+03      |
| time/                   |               |
|    fps                  | 116           |
|    iterations           | 97            |
|    time_elapsed         | 424           |
|    total_timesteps      | 49664         |
| train/                  |               |
|    approx_kl            | 0.00019512489 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.249        |
|    explained_variance   | 0.833         |
|    learning_rate        | 1e-06         |
|    loss                 | 135           |
|    n_updates            | 12700         |
|    policy_gradient_loss | -0.000274     |
|    value_loss           | 332           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 883           |
|    ep_rew_mean          | 1.62e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 107           |
|    time_elapsed         | 468           |
|    total_timesteps      | 54784         |
| train/                  |               |
|    approx_kl            | 0.00020185485 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.359        |
|    explained_variance   | 0.879         |
|    learning_rate        | 1e-06         |
|    loss                 | 112           |
|    n_updates            | 12800         |
|    policy_gradient_loss | -0.000625     |
|    value_loss           | 320           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 902           |
|    ep_rew_mean          | 1.65e+03      |
| time/                   |               |
|    fps                  | 116           |
|    iterations           | 117           |
|    time_elapsed         | 512           |
|    total_timesteps      | 59904         |
| train/                  |               |
|    approx_kl            | 0.00051502767 |
|    clip_fraction        | 0.000977      |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.546        |
|    explained_variance   | 0.845         |
|    learning_rate        | 1e-06         |
|    loss                 | 66.1          |
|    n_updates            | 12900         |
|    policy_gradient_loss | -0.00024      |
|    value_loss           | 190           |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 910           |
|    ep_rew_mean          | 1.66e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 127           |
|    time_elapsed         | 555           |
|    total_timesteps      | 65024         |
| train/                  |               |
|    approx_kl            | 0.00033011893 |
|    clip_fraction        | 0.000195      |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.319        |
|    explained_variance   | 0.613         |
|    learning_rate        | 1e-06         |
|    loss                 | 69.9          |
|    n_updates            | 13000         |
|    policy_gradient_loss | -0.000611     |
|    value_loss           | 179           |
-------------------------------------------
----------------------------------------
| rollout/                |        

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 920           |
|    ep_rew_mean          | 1.68e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 137           |
|    time_elapsed         | 599           |
|    total_timesteps      | 70144         |
| train/                  |               |
|    approx_kl            | 0.00057105464 |
|    clip_fraction        | 0.000195      |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.411        |
|    explained_variance   | 0.636         |
|    learning_rate        | 1e-06         |
|    loss                 | 335           |
|    n_updates            | 13100         |
|    policy_gradient_loss | -0.000637     |
|    value_loss           | 1.43e+03      |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 928          |
|    ep_rew_mean          | 1.69e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 146          |
|    time_elapsed         | 637          |
|    total_timesteps      | 74752        |
| train/                  |              |
|    approx_kl            | 0.0015641863 |
|    clip_fraction        | 0.0127       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.205       |
|    explained_variance   | 0.859        |
|    learning_rate        | 1e-06        |
|    loss                 | 133          |
|    n_updates            | 13190        |
|    policy_gradient_loss | -0.00227     |
|    value_loss           | 272          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 947           |
|    ep_rew_mean          | 1.72e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 155           |
|    time_elapsed         | 677           |
|    total_timesteps      | 79360         |
| train/                  |               |
|    approx_kl            | 0.00031308807 |
|    clip_fraction        | 0.00195       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.25         |
|    explained_variance   | 0.483         |
|    learning_rate        | 1e-06         |
|    loss                 | 282           |
|    n_updates            | 13280         |
|    policy_gradient_loss | -0.00106      |
|    value_loss           | 1.04e+03      |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 941           |
|    ep_rew_mean          | 1.72e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 164           |
|    time_elapsed         | 715           |
|    total_timesteps      | 83968         |
| train/                  |               |
|    approx_kl            | 0.00024881447 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.175        |
|    explained_variance   | 0.73          |
|    learning_rate        | 1e-06         |
|    loss                 | 51.2          |
|    n_updates            | 13370         |
|    policy_gradient_loss | -5.47e-05     |
|    value_loss           | 162           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 959           |
|    ep_rew_mean          | 1.73e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 174           |
|    time_elapsed         | 759           |
|    total_timesteps      | 89088         |
| train/                  |               |
|    approx_kl            | 4.4945627e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.242        |
|    explained_variance   | 0.351         |
|    learning_rate        | 1e-06         |
|    loss                 | 243           |
|    n_updates            | 13470         |
|    policy_gradient_loss | -0.000227     |
|    value_loss           | 694           |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 947           |
|    ep_rew_mean          | 1.72e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 184           |
|    time_elapsed         | 803           |
|    total_timesteps      | 94208         |
| train/                  |               |
|    approx_kl            | 0.00022645784 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.203        |
|    explained_variance   | 0.714         |
|    learning_rate        | 1e-06         |
|    loss                 | 93            |
|    n_updates            | 13570         |
|    policy_gradient_loss | -0.000232     |
|    value_loss           | 172           |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 947           |
|    ep_rew_mean          | 1.72e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 194           |
|    time_elapsed         | 847           |
|    total_timesteps      | 99328         |
| train/                  |               |
|    approx_kl            | 0.00024098821 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.314        |
|    explained_variance   | 0.883         |
|    learning_rate        | 1e-06         |
|    loss                 | 107           |
|    n_updates            | 13670         |
|    policy_gradient_loss | -5.06e-05     |
|    value_loss           | 217           |
-------------------------------------------
------------------------------------------
| rollout/                |      

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 950         |
|    ep_rew_mean          | 1.73e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 204         |
|    time_elapsed         | 890         |
|    total_timesteps      | 104448      |
| train/                  |             |
|    approx_kl            | 0.002643066 |
|    clip_fraction        | 0.0254      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.37       |
|    explained_variance   | 0.825       |
|    learning_rate        | 1e-06       |
|    loss                 | 52.9        |
|    n_updates            | 13770       |
|    policy_gradient_loss | -0.00331    |
|    value_loss           | 167         |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 953   

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 962          |
|    ep_rew_mean          | 1.75e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 214          |
|    time_elapsed         | 934          |
|    total_timesteps      | 109568       |
| train/                  |              |
|    approx_kl            | 0.0023440965 |
|    clip_fraction        | 0.0137       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.331       |
|    explained_variance   | 0.914        |
|    learning_rate        | 1e-06        |
|    loss                 | 68           |
|    n_updates            | 13870        |
|    policy_gradient_loss | 7.11e-05     |
|    value_loss           | 143          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 976         |
|    ep_rew_mean          | 1.78e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 224         |
|    time_elapsed         | 977         |
|    total_timesteps      | 114688      |
| train/                  |             |
|    approx_kl            | 0.002494506 |
|    clip_fraction        | 0.0285      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.336      |
|    explained_variance   | 0.819       |
|    learning_rate        | 1e-06       |
|    loss                 | 35.6        |
|    n_updates            | 13970       |
|    policy_gradient_loss | -0.00376    |
|    value_loss           | 139         |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 976 

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 977          |
|    ep_rew_mean          | 1.79e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 234          |
|    time_elapsed         | 1021         |
|    total_timesteps      | 119808       |
| train/                  |              |
|    approx_kl            | 0.0021782275 |
|    clip_fraction        | 0.0219       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.463       |
|    explained_variance   | 0.518        |
|    learning_rate        | 1e-06        |
|    loss                 | 309          |
|    n_updates            | 14070        |
|    policy_gradient_loss | -0.00236     |
|    value_loss           | 697          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 990          |
|    ep_rew_mean          | 1.79e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 244          |
|    time_elapsed         | 1064         |
|    total_timesteps      | 124928       |
| train/                  |              |
|    approx_kl            | 0.0017372478 |
|    clip_fraction        | 0.00703      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.28        |
|    explained_variance   | 0.619        |
|    learning_rate        | 1e-06        |
|    loss                 | 91.4         |
|    n_updates            | 14170        |
|    policy_gradient_loss | -0.00429     |
|    value_loss           | 504          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 996           |
|    ep_rew_mean          | 1.8e+03       |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 253           |
|    time_elapsed         | 1104          |
|    total_timesteps      | 129536        |
| train/                  |               |
|    approx_kl            | 0.00038517406 |
|    clip_fraction        | 0.00332       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.245        |
|    explained_variance   | 0.487         |
|    learning_rate        | 1e-06         |
|    loss                 | 237           |
|    n_updates            | 14260         |
|    policy_gradient_loss | 0.000194      |
|    value_loss           | 695           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 995          |
|    ep_rew_mean          | 1.79e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 263          |
|    time_elapsed         | 1147         |
|    total_timesteps      | 134656       |
| train/                  |              |
|    approx_kl            | 0.0016695416 |
|    clip_fraction        | 0.0271       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.181       |
|    explained_variance   | 0.863        |
|    learning_rate        | 1e-06        |
|    loss                 | 19.2         |
|    n_updates            | 14360        |
|    policy_gradient_loss | -0.00317     |
|    value_loss           | 51.5         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1e+03         |
|    ep_rew_mean          | 1.8e+03       |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 273           |
|    time_elapsed         | 1191          |
|    total_timesteps      | 139776        |
| train/                  |               |
|    approx_kl            | 0.00018063176 |
|    clip_fraction        | 0.000586      |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.286        |
|    explained_variance   | 0.919         |
|    learning_rate        | 1e-06         |
|    loss                 | 62.6          |
|    n_updates            | 14460         |
|    policy_gradient_loss | -0.000442     |
|    value_loss           | 176           |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.02e+03     |
|    ep_rew_mean          | 1.82e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 283          |
|    time_elapsed         | 1234         |
|    total_timesteps      | 144896       |
| train/                  |              |
|    approx_kl            | 0.0011550533 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.374       |
|    explained_variance   | 0.831        |
|    learning_rate        | 1e-06        |
|    loss                 | 88.9         |
|    n_updates            | 14560        |
|    policy_gradient_loss | 0.00051      |
|    value_loss           | 217          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.01e+03     |
|    ep_rew_mean          | 1.81e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 292          |
|    time_elapsed         | 1274         |
|    total_timesteps      | 149504       |
| train/                  |              |
|    approx_kl            | 0.0015592556 |
|    clip_fraction        | 0.00762      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.329       |
|    explained_variance   | 0.771        |
|    learning_rate        | 1e-06        |
|    loss                 | 189          |
|    n_updates            | 14650        |
|    policy_gradient_loss | -0.0012      |
|    value_loss           | 286          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.01e+03     |
|    ep_rew_mean          | 1.8e+03      |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 302          |
|    time_elapsed         | 1317         |
|    total_timesteps      | 154624       |
| train/                  |              |
|    approx_kl            | 0.0018317084 |
|    clip_fraction        | 0.0115       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.333       |
|    explained_variance   | 0.718        |
|    learning_rate        | 1e-06        |
|    loss                 | 80.4         |
|    n_updates            | 14750        |
|    policy_gradient_loss | -0.0015      |
|    value_loss           | 203          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.02e+03    |
|    ep_rew_mean          | 1.81e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 312         |
|    time_elapsed         | 1361        |
|    total_timesteps      | 159744      |
| train/                  |             |
|    approx_kl            | 0.001353431 |
|    clip_fraction        | 0.000977    |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.424      |
|    explained_variance   | 0.815       |
|    learning_rate        | 1e-06       |
|    loss                 | 122         |
|    n_updates            | 14850       |
|    policy_gradient_loss | -0.00105    |
|    value_loss           | 347         |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.02

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.01e+03     |
|    ep_rew_mean          | 1.81e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 322          |
|    time_elapsed         | 1404         |
|    total_timesteps      | 164864       |
| train/                  |              |
|    approx_kl            | 0.0004537094 |
|    clip_fraction        | 0.000391     |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.276       |
|    explained_variance   | 0.885        |
|    learning_rate        | 1e-06        |
|    loss                 | 140          |
|    n_updates            | 14950        |
|    policy_gradient_loss | -0.002       |
|    value_loss           | 212          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.02e+03     |
|    ep_rew_mean          | 1.81e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 332          |
|    time_elapsed         | 1449         |
|    total_timesteps      | 169984       |
| train/                  |              |
|    approx_kl            | 0.0004041911 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.254       |
|    explained_variance   | 0.812        |
|    learning_rate        | 1e-06        |
|    loss                 | 230          |
|    n_updates            | 15050        |
|    policy_gradient_loss | -0.00131     |
|    value_loss           | 530          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.03e+03    |
|    ep_rew_mean          | 1.83e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 342         |
|    time_elapsed         | 1492        |
|    total_timesteps      | 175104      |
| train/                  |             |
|    approx_kl            | 0.003319243 |
|    clip_fraction        | 0.0137      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.579      |
|    explained_variance   | 0.916       |
|    learning_rate        | 1e-06       |
|    loss                 | 97.4        |
|    n_updates            | 15150       |
|    policy_gradient_loss | -0.00335    |
|    value_loss           | 313         |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.03

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.02e+03     |
|    ep_rew_mean          | 1.8e+03      |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 352          |
|    time_elapsed         | 1536         |
|    total_timesteps      | 180224       |
| train/                  |              |
|    approx_kl            | 0.0002152666 |
|    clip_fraction        | 0.000195     |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.329       |
|    explained_variance   | 0.709        |
|    learning_rate        | 1e-06        |
|    loss                 | 144          |
|    n_updates            | 15250        |
|    policy_gradient_loss | -0.000607    |
|    value_loss           | 306          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.04e+03     |
|    ep_rew_mean          | 1.83e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 362          |
|    time_elapsed         | 1579         |
|    total_timesteps      | 185344       |
| train/                  |              |
|    approx_kl            | 0.0007404509 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.61        |
|    explained_variance   | 0.768        |
|    learning_rate        | 1e-06        |
|    loss                 | 592          |
|    n_updates            | 15350        |
|    policy_gradient_loss | 0.000125     |
|    value_loss           | 1.14e+03     |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.04e+03      |
|    ep_rew_mean          | 1.82e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 372           |
|    time_elapsed         | 1623          |
|    total_timesteps      | 190464        |
| train/                  |               |
|    approx_kl            | 0.00043882744 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.379        |
|    explained_variance   | 0.88          |
|    learning_rate        | 1e-06         |
|    loss                 | 110           |
|    n_updates            | 15450         |
|    policy_gradient_loss | -0.00131      |
|    value_loss           | 350           |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.04e+03     |
|    ep_rew_mean          | 1.83e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 382          |
|    time_elapsed         | 1666         |
|    total_timesteps      | 195584       |
| train/                  |              |
|    approx_kl            | 0.0006267637 |
|    clip_fraction        | 0.00332      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.337       |
|    explained_variance   | 0.684        |
|    learning_rate        | 1e-06        |
|    loss                 | 154          |
|    n_updates            | 15550        |
|    policy_gradient_loss | -0.00233     |
|    value_loss           | 515          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.06e+03     |
|    ep_rew_mean          | 1.85e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 392          |
|    time_elapsed         | 1710         |
|    total_timesteps      | 200704       |
| train/                  |              |
|    approx_kl            | 0.0010326746 |
|    clip_fraction        | 0.0131       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.281       |
|    explained_variance   | 0.568        |
|    learning_rate        | 1e-06        |
|    loss                 | 436          |
|    n_updates            | 15650        |
|    policy_gradient_loss | -0.00241     |
|    value_loss           | 887          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.06e+03     |
|    ep_rew_mean          | 1.85e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 402          |
|    time_elapsed         | 1753         |
|    total_timesteps      | 205824       |
| train/                  |              |
|    approx_kl            | 0.0010031081 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.531       |
|    explained_variance   | 0.952        |
|    learning_rate        | 1e-06        |
|    loss                 | 64.4         |
|    n_updates            | 15750        |
|    policy_gradient_loss | -6.07e-05    |
|    value_loss           | 213          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.06e+03    |
|    ep_rew_mean          | 1.86e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 412         |
|    time_elapsed         | 1797        |
|    total_timesteps      | 210944      |
| train/                  |             |
|    approx_kl            | 0.001040995 |
|    clip_fraction        | 0.00254     |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.463      |
|    explained_variance   | 0.828       |
|    learning_rate        | 1e-06       |
|    loss                 | 38.1        |
|    n_updates            | 15850       |
|    policy_gradient_loss | -0.00109    |
|    value_loss           | 146         |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.06

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.06e+03     |
|    ep_rew_mean          | 1.86e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 422          |
|    time_elapsed         | 1841         |
|    total_timesteps      | 216064       |
| train/                  |              |
|    approx_kl            | 0.0025880085 |
|    clip_fraction        | 0.0229       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.514       |
|    explained_variance   | 0.894        |
|    learning_rate        | 1e-06        |
|    loss                 | 133          |
|    n_updates            | 15950        |
|    policy_gradient_loss | -0.00373     |
|    value_loss           | 296          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.07e+03     |
|    ep_rew_mean          | 1.87e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 432          |
|    time_elapsed         | 1885         |
|    total_timesteps      | 221184       |
| train/                  |              |
|    approx_kl            | 0.0021674177 |
|    clip_fraction        | 0.00859      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.299       |
|    explained_variance   | 0.715        |
|    learning_rate        | 1e-06        |
|    loss                 | 97.9         |
|    n_updates            | 16050        |
|    policy_gradient_loss | -0.00112     |
|    value_loss           | 246          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.07e+03      |
|    ep_rew_mean          | 1.86e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 441           |
|    time_elapsed         | 1923          |
|    total_timesteps      | 225792        |
| train/                  |               |
|    approx_kl            | 0.00064052315 |
|    clip_fraction        | 0.00488       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.324        |
|    explained_variance   | 0.518         |
|    learning_rate        | 1e-06         |
|    loss                 | 526           |
|    n_updates            | 16140         |
|    policy_gradient_loss | -0.000619     |
|    value_loss           | 889           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.07e+03      |
|    ep_rew_mean          | 1.88e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 451           |
|    time_elapsed         | 1967          |
|    total_timesteps      | 230912        |
| train/                  |               |
|    approx_kl            | 0.00091918453 |
|    clip_fraction        | 0.00508       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.456        |
|    explained_variance   | 0.936         |
|    learning_rate        | 1e-06         |
|    loss                 | 18.4          |
|    n_updates            | 16240         |
|    policy_gradient_loss | -0.00311      |
|    value_loss           | 83.1          |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.08e+03     |
|    ep_rew_mean          | 1.89e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 460          |
|    time_elapsed         | 2006         |
|    total_timesteps      | 235520       |
| train/                  |              |
|    approx_kl            | 0.0026995619 |
|    clip_fraction        | 0.00352      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.611       |
|    explained_variance   | 0.792        |
|    learning_rate        | 1e-06        |
|    loss                 | 115          |
|    n_updates            | 16330        |
|    policy_gradient_loss | 0.00166      |
|    value_loss           | 375          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.09e+03      |
|    ep_rew_mean          | 1.9e+03       |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 470           |
|    time_elapsed         | 2050          |
|    total_timesteps      | 240640        |
| train/                  |               |
|    approx_kl            | 0.00078088336 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.5          |
|    explained_variance   | 0.863         |
|    learning_rate        | 1e-06         |
|    loss                 | 60            |
|    n_updates            | 16430         |
|    policy_gradient_loss | -0.000652     |
|    value_loss           | 190           |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.12e+03     |
|    ep_rew_mean          | 1.94e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 479          |
|    time_elapsed         | 2088         |
|    total_timesteps      | 245248       |
| train/                  |              |
|    approx_kl            | 0.0011624023 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.309       |
|    explained_variance   | 0.907        |
|    learning_rate        | 1e-06        |
|    loss                 | 47.2         |
|    n_updates            | 16520        |
|    policy_gradient_loss | -0.000822    |
|    value_loss           | 106          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.12e+03     |
|    ep_rew_mean          | 1.96e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 488          |
|    time_elapsed         | 2128         |
|    total_timesteps      | 249856       |
| train/                  |              |
|    approx_kl            | 0.0019660797 |
|    clip_fraction        | 0.018        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.235       |
|    explained_variance   | 0.861        |
|    learning_rate        | 1e-06        |
|    loss                 | 106          |
|    n_updates            | 16610        |
|    policy_gradient_loss | -0.00163     |
|    value_loss           | 142          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.13e+03      |
|    ep_rew_mean          | 1.96e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 498           |
|    time_elapsed         | 2171          |
|    total_timesteps      | 254976        |
| train/                  |               |
|    approx_kl            | 0.00068190624 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.427        |
|    explained_variance   | 0.889         |
|    learning_rate        | 1e-06         |
|    loss                 | 178           |
|    n_updates            | 16710         |
|    policy_gradient_loss | 0.00115       |
|    value_loss           | 453           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.14e+03     |
|    ep_rew_mean          | 1.96e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 507          |
|    time_elapsed         | 2211         |
|    total_timesteps      | 259584       |
| train/                  |              |
|    approx_kl            | 0.0013726904 |
|    clip_fraction        | 0.00801      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.313       |
|    explained_variance   | 0.806        |
|    learning_rate        | 1e-06        |
|    loss                 | 332          |
|    n_updates            | 16800        |
|    policy_gradient_loss | -0.00279     |
|    value_loss           | 440          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.14e+03      |
|    ep_rew_mean          | 1.95e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 516           |
|    time_elapsed         | 2249          |
|    total_timesteps      | 264192        |
| train/                  |               |
|    approx_kl            | 0.00060381705 |
|    clip_fraction        | 0.000977      |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.347        |
|    explained_variance   | 0.727         |
|    learning_rate        | 1e-06         |
|    loss                 | 303           |
|    n_updates            | 16890         |
|    policy_gradient_loss | -0.00103      |
|    value_loss           | 367           |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.15e+03     |
|    ep_rew_mean          | 1.97e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 525          |
|    time_elapsed         | 2289         |
|    total_timesteps      | 268800       |
| train/                  |              |
|    approx_kl            | 0.0003286266 |
|    clip_fraction        | 0.000195     |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.324       |
|    explained_variance   | 0.826        |
|    learning_rate        | 1e-06        |
|    loss                 | 66           |
|    n_updates            | 16980        |
|    policy_gradient_loss | -0.000741    |
|    value_loss           | 148          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.16e+03    |
|    ep_rew_mean          | 1.99e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 535         |
|    time_elapsed         | 2332        |
|    total_timesteps      | 273920      |
| train/                  |             |
|    approx_kl            | 0.002544405 |
|    clip_fraction        | 0.00547     |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.682      |
|    explained_variance   | 0.732       |
|    learning_rate        | 1e-06       |
|    loss                 | 337         |
|    n_updates            | 17080       |
|    policy_gradient_loss | -0.00192    |
|    value_loss           | 490         |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.16

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.17e+03      |
|    ep_rew_mean          | 1.99e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 545           |
|    time_elapsed         | 2376          |
|    total_timesteps      | 279040        |
| train/                  |               |
|    approx_kl            | 0.00036696822 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.546        |
|    explained_variance   | 0.263         |
|    learning_rate        | 1e-06         |
|    loss                 | 146           |
|    n_updates            | 17180         |
|    policy_gradient_loss | 0.00077       |
|    value_loss           | 801           |
-------------------------------------------
------------------------------------------
| rollout/                |      

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.18e+03    |
|    ep_rew_mean          | 1.99e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 555         |
|    time_elapsed         | 2419        |
|    total_timesteps      | 284160      |
| train/                  |             |
|    approx_kl            | 0.001717022 |
|    clip_fraction        | 0.00684     |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.485      |
|    explained_variance   | 0.889       |
|    learning_rate        | 1e-06       |
|    loss                 | 90.8        |
|    n_updates            | 17280       |
|    policy_gradient_loss | -0.00159    |
|    value_loss           | 182         |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.18

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.19e+03      |
|    ep_rew_mean          | 2.01e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 565           |
|    time_elapsed         | 2463          |
|    total_timesteps      | 289280        |
| train/                  |               |
|    approx_kl            | 0.00095690985 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.684        |
|    explained_variance   | 0.345         |
|    learning_rate        | 1e-06         |
|    loss                 | 240           |
|    n_updates            | 17380         |
|    policy_gradient_loss | -0.000294     |
|    value_loss           | 1.24e+03      |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.02e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 575          |
|    time_elapsed         | 2506         |
|    total_timesteps      | 294400       |
| train/                  |              |
|    approx_kl            | 0.0010996391 |
|    clip_fraction        | 0.0041       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.371       |
|    explained_variance   | 0.895        |
|    learning_rate        | 1e-06        |
|    loss                 | 185          |
|    n_updates            | 17480        |
|    policy_gradient_loss | -0.00219     |
|    value_loss           | 383          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.2e+03     |
|    ep_rew_mean          | 2.02e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 585         |
|    time_elapsed         | 2550        |
|    total_timesteps      | 299520      |
| train/                  |             |
|    approx_kl            | 0.001911553 |
|    clip_fraction        | 0.0221      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.573      |
|    explained_variance   | 0.909       |
|    learning_rate        | 1e-06       |
|    loss                 | 238         |
|    n_updates            | 17580       |
|    policy_gradient_loss | -0.00189    |
|    value_loss           | 295         |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.19e+

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.19e+03     |
|    ep_rew_mean          | 2.01e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 595          |
|    time_elapsed         | 2593         |
|    total_timesteps      | 304640       |
| train/                  |              |
|    approx_kl            | 0.0006421354 |
|    clip_fraction        | 0.0135       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.418       |
|    explained_variance   | 0.679        |
|    learning_rate        | 1e-06        |
|    loss                 | 183          |
|    n_updates            | 17680        |
|    policy_gradient_loss | -0.00199     |
|    value_loss           | 777          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.19e+03      |
|    ep_rew_mean          | 2.01e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 605           |
|    time_elapsed         | 2637          |
|    total_timesteps      | 309760        |
| train/                  |               |
|    approx_kl            | 0.00057302404 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.65         |
|    explained_variance   | -1.4          |
|    learning_rate        | 1e-06         |
|    loss                 | 0.188         |
|    n_updates            | 17780         |
|    policy_gradient_loss | -0.0007       |
|    value_loss           | 0.681         |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.19e+03     |
|    ep_rew_mean          | 2.01e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 614          |
|    time_elapsed         | 2676         |
|    total_timesteps      | 314368       |
| train/                  |              |
|    approx_kl            | 0.0010268793 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.59        |
|    explained_variance   | -0.231       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.209        |
|    n_updates            | 17870        |
|    policy_gradient_loss | -0.00276     |
|    value_loss           | 0.415        |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

--------------------------------------------
| rollout/                |                |
|    ep_len_mean          | 1.31e+03       |
|    ep_rew_mean          | 2.04e+03       |
| time/                   |                |
|    fps                  | 117            |
|    iterations           | 624            |
|    time_elapsed         | 2721           |
|    total_timesteps      | 319488         |
| train/                  |                |
|    approx_kl            | 0.000113867805 |
|    clip_fraction        | 0.00117        |
|    clip_range           | 0.2            |
|    entropy_loss         | -0.0521        |
|    explained_variance   | 0.326          |
|    learning_rate        | 1e-06          |
|    loss                 | 532            |
|    n_updates            | 17970          |
|    policy_gradient_loss | 0.000521       |
|    value_loss           | 1.25e+03       |
--------------------------------------------
-------------------------------------------
| rollout/ 

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.3e+03       |
|    ep_rew_mean          | 2.01e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 633           |
|    time_elapsed         | 2759          |
|    total_timesteps      | 324096        |
| train/                  |               |
|    approx_kl            | 4.4476823e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.152        |
|    explained_variance   | 0.851         |
|    learning_rate        | 1e-06         |
|    loss                 | 46.5          |
|    n_updates            | 18060         |
|    policy_gradient_loss | 0.000242      |
|    value_loss           | 118           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.31e+03      |
|    ep_rew_mean          | 2.02e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 642           |
|    time_elapsed         | 2799          |
|    total_timesteps      | 328704        |
| train/                  |               |
|    approx_kl            | 0.00012911984 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.19         |
|    explained_variance   | 0.667         |
|    learning_rate        | 1e-06         |
|    loss                 | 58.6          |
|    n_updates            | 18150         |
|    policy_gradient_loss | 0.0009        |
|    value_loss           | 159           |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.3e+03       |
|    ep_rew_mean          | 2.01e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 651           |
|    time_elapsed         | 2837          |
|    total_timesteps      | 333312        |
| train/                  |               |
|    approx_kl            | 0.00044084596 |
|    clip_fraction        | 0.000586      |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.193        |
|    explained_variance   | 0.663         |
|    learning_rate        | 1e-06         |
|    loss                 | 30.8          |
|    n_updates            | 18240         |
|    policy_gradient_loss | -0.000913     |
|    value_loss           | 125           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.32e+03    |
|    ep_rew_mean          | 2.03e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 660         |
|    time_elapsed         | 2876        |
|    total_timesteps      | 337920      |
| train/                  |             |
|    approx_kl            | 0.002300444 |
|    clip_fraction        | 0.0121      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.344      |
|    explained_variance   | 0.826       |
|    learning_rate        | 1e-06       |
|    loss                 | 223         |
|    n_updates            | 18330       |
|    policy_gradient_loss | -0.00266    |
|    value_loss           | 447         |
-----------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.3e+03      |
|    ep_rew_mean          | 2e+03        |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 670          |
|    time_elapsed         | 2920         |
|    total_timesteps      | 343040       |
| train/                  |              |
|    approx_kl            | 0.0014315619 |
|    clip_fraction        | 0.00352      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.256       |
|    explained_variance   | 0.716        |
|    learning_rate        | 1e-06        |
|    loss                 | 169          |
|    n_updates            | 18430        |
|    policy_gradient_loss | -0.000528    |
|    value_loss           | 451          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.28e+03      |
|    ep_rew_mean          | 1.98e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 680           |
|    time_elapsed         | 2963          |
|    total_timesteps      | 348160        |
| train/                  |               |
|    approx_kl            | 0.00047546008 |
|    clip_fraction        | 0.000586      |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.303        |
|    explained_variance   | 0.857         |
|    learning_rate        | 1e-06         |
|    loss                 | 48.4          |
|    n_updates            | 18530         |
|    policy_gradient_loss | -0.000645     |
|    value_loss           | 226           |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.28e+03      |
|    ep_rew_mean          | 1.96e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 690           |
|    time_elapsed         | 3008          |
|    total_timesteps      | 353280        |
| train/                  |               |
|    approx_kl            | 0.00012685312 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.324        |
|    explained_variance   | 0.733         |
|    learning_rate        | 1e-06         |
|    loss                 | 266           |
|    n_updates            | 18630         |
|    policy_gradient_loss | 0.000157      |
|    value_loss           | 569           |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.32e+03     |
|    ep_rew_mean          | 2.01e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 699          |
|    time_elapsed         | 3047         |
|    total_timesteps      | 357888       |
| train/                  |              |
|    approx_kl            | 0.0011930059 |
|    clip_fraction        | 0.0373       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.307       |
|    explained_variance   | 0.635        |
|    learning_rate        | 1e-06        |
|    loss                 | 229          |
|    n_updates            | 18720        |
|    policy_gradient_loss | -0.00204     |
|    value_loss           | 860          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.31e+03      |
|    ep_rew_mean          | 2.01e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 709           |
|    time_elapsed         | 3091          |
|    total_timesteps      | 363008        |
| train/                  |               |
|    approx_kl            | 0.00020218536 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.269        |
|    explained_variance   | 0.903         |
|    learning_rate        | 1e-06         |
|    loss                 | 42.7          |
|    n_updates            | 18820         |
|    policy_gradient_loss | 0.000243      |
|    value_loss           | 163           |
-------------------------------------------
-----------------------------------------
| rollout/                |       

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.31e+03      |
|    ep_rew_mean          | 1.99e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 719           |
|    time_elapsed         | 3134          |
|    total_timesteps      | 368128        |
| train/                  |               |
|    approx_kl            | 0.00023852859 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.269        |
|    explained_variance   | 0.715         |
|    learning_rate        | 1e-06         |
|    loss                 | 36.4          |
|    n_updates            | 18920         |
|    policy_gradient_loss | -0.00081      |
|    value_loss           | 158           |
-------------------------------------------
----------------------------------------
| rollout/                |        

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.29e+03     |
|    ep_rew_mean          | 1.97e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 729          |
|    time_elapsed         | 3178         |
|    total_timesteps      | 373248       |
| train/                  |              |
|    approx_kl            | 0.0016189474 |
|    clip_fraction        | 0.0143       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.277       |
|    explained_variance   | 0.676        |
|    learning_rate        | 1e-06        |
|    loss                 | 596          |
|    n_updates            | 19020        |
|    policy_gradient_loss | -0.00191     |
|    value_loss           | 948          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.3e+03      |
|    ep_rew_mean          | 1.96e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 739          |
|    time_elapsed         | 3221         |
|    total_timesteps      | 378368       |
| train/                  |              |
|    approx_kl            | 0.0014350832 |
|    clip_fraction        | 0.000977     |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.501       |
|    explained_variance   | 0.645        |
|    learning_rate        | 1e-06        |
|    loss                 | 108          |
|    n_updates            | 19120        |
|    policy_gradient_loss | -1.22e-05    |
|    value_loss           | 203          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.3e+03      |
|    ep_rew_mean          | 1.96e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 749          |
|    time_elapsed         | 3266         |
|    total_timesteps      | 383488       |
| train/                  |              |
|    approx_kl            | 0.0017417495 |
|    clip_fraction        | 0.00273      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.691       |
|    explained_variance   | 0.642        |
|    learning_rate        | 1e-06        |
|    loss                 | 352          |
|    n_updates            | 19220        |
|    policy_gradient_loss | 0.000521     |
|    value_loss           | 767          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.3e+03      |
|    ep_rew_mean          | 1.96e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 759          |
|    time_elapsed         | 3309         |
|    total_timesteps      | 388608       |
| train/                  |              |
|    approx_kl            | 0.0009967957 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.34        |
|    explained_variance   | -1.9         |
|    learning_rate        | 1e-06        |
|    loss                 | 0.291        |
|    n_updates            | 19320        |
|    policy_gradient_loss | -0.000686    |
|    value_loss           | 1.15         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.39e+03    |
|    ep_rew_mean          | 1.98e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 769         |
|    time_elapsed         | 3353        |
|    total_timesteps      | 393728      |
| train/                  |             |
|    approx_kl            | 0.001000181 |
|    clip_fraction        | 0.00176     |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.562      |
|    explained_variance   | 0.906       |
|    learning_rate        | 1e-06       |
|    loss                 | 89.7        |
|    n_updates            | 19420       |
|    policy_gradient_loss | -0.00134    |
|    value_loss           | 212         |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.39e+

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.39e+03      |
|    ep_rew_mean          | 2e+03         |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 779           |
|    time_elapsed         | 3397          |
|    total_timesteps      | 398848        |
| train/                  |               |
|    approx_kl            | 0.00063534826 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.444        |
|    explained_variance   | 0.746         |
|    learning_rate        | 1e-06         |
|    loss                 | 59.3          |
|    n_updates            | 19520         |
|    policy_gradient_loss | 0.00217       |
|    value_loss           | 229           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.4e+03       |
|    ep_rew_mean          | 2.01e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 788           |
|    time_elapsed         | 3436          |
|    total_timesteps      | 403456        |
| train/                  |               |
|    approx_kl            | 0.00012223842 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.291        |
|    explained_variance   | 0.804         |
|    learning_rate        | 1e-06         |
|    loss                 | 263           |
|    n_updates            | 19610         |
|    policy_gradient_loss | -8.18e-05     |
|    value_loss           | 432           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.39e+03     |
|    ep_rew_mean          | 1.99e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 797          |
|    time_elapsed         | 3474         |
|    total_timesteps      | 408064       |
| train/                  |              |
|    approx_kl            | 0.0006784543 |
|    clip_fraction        | 0.000195     |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.503       |
|    explained_variance   | 0.47         |
|    learning_rate        | 1e-06        |
|    loss                 | 375          |
|    n_updates            | 19700        |
|    policy_gradient_loss | 0.000226     |
|    value_loss           | 765          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.36e+03      |
|    ep_rew_mean          | 1.96e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 807           |
|    time_elapsed         | 3519          |
|    total_timesteps      | 413184        |
| train/                  |               |
|    approx_kl            | 0.00025960582 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.303        |
|    explained_variance   | 0.94          |
|    learning_rate        | 1e-06         |
|    loss                 | 46.1          |
|    n_updates            | 19800         |
|    policy_gradient_loss | 0.000224      |
|    value_loss           | 86.9          |
-------------------------------------------
----------------------------------------
| rollout/                |        

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.36e+03     |
|    ep_rew_mean          | 1.96e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 817          |
|    time_elapsed         | 3561         |
|    total_timesteps      | 418304       |
| train/                  |              |
|    approx_kl            | 0.0038362588 |
|    clip_fraction        | 0.0115       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.438       |
|    explained_variance   | 0.866        |
|    learning_rate        | 1e-06        |
|    loss                 | 68.8         |
|    n_updates            | 19900        |
|    policy_gradient_loss | -0.00296     |
|    value_loss           | 174          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.34e+03     |
|    ep_rew_mean          | 1.93e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 827          |
|    time_elapsed         | 3606         |
|    total_timesteps      | 423424       |
| train/                  |              |
|    approx_kl            | 0.0028227223 |
|    clip_fraction        | 0.0271       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.416       |
|    explained_variance   | 0.742        |
|    learning_rate        | 1e-06        |
|    loss                 | 318          |
|    n_updates            | 20000        |
|    policy_gradient_loss | -0.00243     |
|    value_loss           | 646          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.32e+03     |
|    ep_rew_mean          | 1.92e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 837          |
|    time_elapsed         | 3649         |
|    total_timesteps      | 428544       |
| train/                  |              |
|    approx_kl            | 0.0023718043 |
|    clip_fraction        | 0.0184       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.392       |
|    explained_variance   | 0.674        |
|    learning_rate        | 1e-06        |
|    loss                 | 530          |
|    n_updates            | 20100        |
|    policy_gradient_loss | -0.00227     |
|    value_loss           | 836          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.32e+03      |
|    ep_rew_mean          | 1.9e+03       |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 847           |
|    time_elapsed         | 3693          |
|    total_timesteps      | 433664        |
| train/                  |               |
|    approx_kl            | 0.00033797172 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.386        |
|    explained_variance   | 0.799         |
|    learning_rate        | 1e-06         |
|    loss                 | 98.2          |
|    n_updates            | 20200         |
|    policy_gradient_loss | -0.000138     |
|    value_loss           | 180           |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.2e+03       |
|    ep_rew_mean          | 1.87e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 857           |
|    time_elapsed         | 3737          |
|    total_timesteps      | 438784        |
| train/                  |               |
|    approx_kl            | 0.00021330535 |
|    clip_fraction        | 0.000195      |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.345        |
|    explained_variance   | 0.736         |
|    learning_rate        | 1e-06         |
|    loss                 | 70.7          |
|    n_updates            | 20300         |
|    policy_gradient_loss | -0.000538     |
|    value_loss           | 150           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.21e+03     |
|    ep_rew_mean          | 1.9e+03      |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 866          |
|    time_elapsed         | 3776         |
|    total_timesteps      | 443392       |
| train/                  |              |
|    approx_kl            | 0.0011839375 |
|    clip_fraction        | 0.00566      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.302       |
|    explained_variance   | 0.811        |
|    learning_rate        | 1e-06        |
|    loss                 | 86.6         |
|    n_updates            | 20390        |
|    policy_gradient_loss | -0.00154     |
|    value_loss           | 158          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.22e+03    |
|    ep_rew_mean          | 1.92e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 876         |
|    time_elapsed         | 3819        |
|    total_timesteps      | 448512      |
| train/                  |             |
|    approx_kl            | 0.000433426 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.29       |
|    explained_variance   | 0.481       |
|    learning_rate        | 1e-06       |
|    loss                 | 381         |
|    n_updates            | 20490       |
|    policy_gradient_loss | -0.0002     |
|    value_loss           | 720         |
-----------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.22e+03     |
|    ep_rew_mean          | 1.92e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 886          |
|    time_elapsed         | 3863         |
|    total_timesteps      | 453632       |
| train/                  |              |
|    approx_kl            | 0.0010102141 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.271       |
|    explained_variance   | 0.697        |
|    learning_rate        | 1e-06        |
|    loss                 | 316          |
|    n_updates            | 20590        |
|    policy_gradient_loss | -7.25e-05    |
|    value_loss           | 463          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.21e+03     |
|    ep_rew_mean          | 1.9e+03      |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 896          |
|    time_elapsed         | 3907         |
|    total_timesteps      | 458752       |
| train/                  |              |
|    approx_kl            | 0.0024730936 |
|    clip_fraction        | 0.0143       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.325       |
|    explained_variance   | 0.847        |
|    learning_rate        | 1e-06        |
|    loss                 | 96.9         |
|    n_updates            | 20690        |
|    policy_gradient_loss | -0.00111     |
|    value_loss           | 189          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.21e+03      |
|    ep_rew_mean          | 1.91e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 906           |
|    time_elapsed         | 3950          |
|    total_timesteps      | 463872        |
| train/                  |               |
|    approx_kl            | 0.00028584606 |
|    clip_fraction        | 0.00156       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.297        |
|    explained_variance   | 0.867         |
|    learning_rate        | 1e-06         |
|    loss                 | 76.8          |
|    n_updates            | 20790         |
|    policy_gradient_loss | -0.000429     |
|    value_loss           | 177           |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.23e+03      |
|    ep_rew_mean          | 1.94e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 916           |
|    time_elapsed         | 3994          |
|    total_timesteps      | 468992        |
| train/                  |               |
|    approx_kl            | 4.6025845e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.292        |
|    explained_variance   | 0.942         |
|    learning_rate        | 1e-06         |
|    loss                 | 30.2          |
|    n_updates            | 20890         |
|    policy_gradient_loss | 9.51e-05      |
|    value_loss           | 67.7          |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.22e+03     |
|    ep_rew_mean          | 1.93e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 926          |
|    time_elapsed         | 4037         |
|    total_timesteps      | 474112       |
| train/                  |              |
|    approx_kl            | 0.0015863072 |
|    clip_fraction        | 0.000781     |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.354       |
|    explained_variance   | 0.749        |
|    learning_rate        | 1e-06        |
|    loss                 | 186          |
|    n_updates            | 20990        |
|    policy_gradient_loss | -0.00142     |
|    value_loss           | 327          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.19e+03      |
|    ep_rew_mean          | 1.89e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 936           |
|    time_elapsed         | 4081          |
|    total_timesteps      | 479232        |
| train/                  |               |
|    approx_kl            | 0.00051769754 |
|    clip_fraction        | 0.00117       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.259        |
|    explained_variance   | 0.931         |
|    learning_rate        | 1e-06         |
|    loss                 | 37.6          |
|    n_updates            | 21090         |
|    policy_gradient_loss | -0.00067      |
|    value_loss           | 109           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.16e+03      |
|    ep_rew_mean          | 1.88e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 946           |
|    time_elapsed         | 4124          |
|    total_timesteps      | 484352        |
| train/                  |               |
|    approx_kl            | 0.00037928682 |
|    clip_fraction        | 0.00273       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.234        |
|    explained_variance   | 0.453         |
|    learning_rate        | 1e-06         |
|    loss                 | 534           |
|    n_updates            | 21190         |
|    policy_gradient_loss | 0.000118      |
|    value_loss           | 656           |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.15e+03      |
|    ep_rew_mean          | 1.87e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 955           |
|    time_elapsed         | 4163          |
|    total_timesteps      | 488960        |
| train/                  |               |
|    approx_kl            | 0.00069922337 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.241        |
|    explained_variance   | 0.783         |
|    learning_rate        | 1e-06         |
|    loss                 | 62.6          |
|    n_updates            | 21280         |
|    policy_gradient_loss | -0.000657     |
|    value_loss           | 178           |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.15e+03     |
|    ep_rew_mean          | 1.88e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 965          |
|    time_elapsed         | 4207         |
|    total_timesteps      | 494080       |
| train/                  |              |
|    approx_kl            | 0.0023031044 |
|    clip_fraction        | 0.00664      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.458       |
|    explained_variance   | 0.624        |
|    learning_rate        | 1e-06        |
|    loss                 | 274          |
|    n_updates            | 21380        |
|    policy_gradient_loss | -0.00334     |
|    value_loss           | 615          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.07e+03     |
|    ep_rew_mean          | 1.88e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 975          |
|    time_elapsed         | 4251         |
|    total_timesteps      | 499200       |
| train/                  |              |
|    approx_kl            | 0.0012978179 |
|    clip_fraction        | 0.000195     |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.389       |
|    explained_variance   | 0.879        |
|    learning_rate        | 1e-06        |
|    loss                 | 39           |
|    n_updates            | 21480        |
|    policy_gradient_loss | -0.00101     |
|    value_loss           | 123          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.08e+03      |
|    ep_rew_mean          | 1.88e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 985           |
|    time_elapsed         | 4295          |
|    total_timesteps      | 504320        |
| train/                  |               |
|    approx_kl            | 0.00059093663 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.377        |
|    explained_variance   | 0.856         |
|    learning_rate        | 1e-06         |
|    loss                 | 78.7          |
|    n_updates            | 21580         |
|    policy_gradient_loss | 8.69e-06      |
|    value_loss           | 183           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.07e+03      |
|    ep_rew_mean          | 1.88e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 994           |
|    time_elapsed         | 4334          |
|    total_timesteps      | 508928        |
| train/                  |               |
|    approx_kl            | 0.00062480394 |
|    clip_fraction        | 0.00117       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.517        |
|    explained_variance   | 0.445         |
|    learning_rate        | 1e-06         |
|    loss                 | 477           |
|    n_updates            | 21670         |
|    policy_gradient_loss | 0.000355      |
|    value_loss           | 1.01e+03      |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.06e+03     |
|    ep_rew_mean          | 1.88e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1004         |
|    time_elapsed         | 4377         |
|    total_timesteps      | 514048       |
| train/                  |              |
|    approx_kl            | 0.0022620321 |
|    clip_fraction        | 0.0398       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.32        |
|    explained_variance   | 0.227        |
|    learning_rate        | 1e-06        |
|    loss                 | 543          |
|    n_updates            | 21770        |
|    policy_gradient_loss | -0.00479     |
|    value_loss           | 1e+03        |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.06e+03     |
|    ep_rew_mean          | 1.88e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1014         |
|    time_elapsed         | 4421         |
|    total_timesteps      | 519168       |
| train/                  |              |
|    approx_kl            | 0.0004578462 |
|    clip_fraction        | 0.00234      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.174       |
|    explained_variance   | 0.872        |
|    learning_rate        | 1e-06        |
|    loss                 | 131          |
|    n_updates            | 21870        |
|    policy_gradient_loss | -0.000962    |
|    value_loss           | 332          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.05e+03     |
|    ep_rew_mean          | 1.89e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1024         |
|    time_elapsed         | 4464         |
|    total_timesteps      | 524288       |
| train/                  |              |
|    approx_kl            | 0.0006242321 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.476       |
|    explained_variance   | 0.926        |
|    learning_rate        | 1e-06        |
|    loss                 | 114          |
|    n_updates            | 21970        |
|    policy_gradient_loss | -3.47e-05    |
|    value_loss           | 173          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.06e+03      |
|    ep_rew_mean          | 1.91e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 1033          |
|    time_elapsed         | 4504          |
|    total_timesteps      | 528896        |
| train/                  |               |
|    approx_kl            | 0.00086412905 |
|    clip_fraction        | 0.00469       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.299        |
|    explained_variance   | 0.772         |
|    learning_rate        | 1e-06         |
|    loss                 | 94            |
|    n_updates            | 22060         |
|    policy_gradient_loss | -0.000506     |
|    value_loss           | 273           |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.07e+03     |
|    ep_rew_mean          | 1.93e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1043         |
|    time_elapsed         | 4547         |
|    total_timesteps      | 534016       |
| train/                  |              |
|    approx_kl            | 0.0019018269 |
|    clip_fraction        | 0.0104       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.375       |
|    explained_variance   | 0.348        |
|    learning_rate        | 1e-06        |
|    loss                 | 285          |
|    n_updates            | 22160        |
|    policy_gradient_loss | -0.000778    |
|    value_loss           | 901          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.05e+03     |
|    ep_rew_mean          | 1.91e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1053         |
|    time_elapsed         | 4592         |
|    total_timesteps      | 539136       |
| train/                  |              |
|    approx_kl            | 0.0011600758 |
|    clip_fraction        | 0.00391      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.286       |
|    explained_variance   | 0.923        |
|    learning_rate        | 1e-06        |
|    loss                 | 55.8         |
|    n_updates            | 22260        |
|    policy_gradient_loss | -0.00106     |
|    value_loss           | 157          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.04e+03     |
|    ep_rew_mean          | 1.89e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1063         |
|    time_elapsed         | 4635         |
|    total_timesteps      | 544256       |
| train/                  |              |
|    approx_kl            | 0.0009656553 |
|    clip_fraction        | 0.00117      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.35        |
|    explained_variance   | 0.895        |
|    learning_rate        | 1e-06        |
|    loss                 | 54.3         |
|    n_updates            | 22360        |
|    policy_gradient_loss | -0.00134     |
|    value_loss           | 150          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.03e+03    |
|    ep_rew_mean          | 1.88e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 1072        |
|    time_elapsed         | 4675        |
|    total_timesteps      | 548864      |
| train/                  |             |
|    approx_kl            | 0.003496549 |
|    clip_fraction        | 0.0354      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.705      |
|    explained_variance   | 0.587       |
|    learning_rate        | 1e-06       |
|    loss                 | 474         |
|    n_updates            | 22450       |
|    policy_gradient_loss | -0.00123    |
|    value_loss           | 1.2e+03     |
-----------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.04e+03     |
|    ep_rew_mean          | 1.89e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1082         |
|    time_elapsed         | 4718         |
|    total_timesteps      | 553984       |
| train/                  |              |
|    approx_kl            | 0.0011087416 |
|    clip_fraction        | 0.0162       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.323       |
|    explained_variance   | 0.922        |
|    learning_rate        | 1e-06        |
|    loss                 | 58           |
|    n_updates            | 22550        |
|    policy_gradient_loss | -0.00323     |
|    value_loss           | 143          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.05e+03     |
|    ep_rew_mean          | 1.9e+03      |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1092         |
|    time_elapsed         | 4762         |
|    total_timesteps      | 559104       |
| train/                  |              |
|    approx_kl            | 0.0028082184 |
|    clip_fraction        | 0.00898      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.322       |
|    explained_variance   | 0.773        |
|    learning_rate        | 1e-06        |
|    loss                 | 36.8         |
|    n_updates            | 22650        |
|    policy_gradient_loss | -0.00151     |
|    value_loss           | 121          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.05e+03      |
|    ep_rew_mean          | 1.9e+03       |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 1102          |
|    time_elapsed         | 4805          |
|    total_timesteps      | 564224        |
| train/                  |               |
|    approx_kl            | 0.00036366738 |
|    clip_fraction        | 0.00137       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.249        |
|    explained_variance   | 0.806         |
|    learning_rate        | 1e-06         |
|    loss                 | 83.5          |
|    n_updates            | 22750         |
|    policy_gradient_loss | -0.000633     |
|    value_loss           | 220           |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.06e+03      |
|    ep_rew_mean          | 1.93e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 1112          |
|    time_elapsed         | 4849          |
|    total_timesteps      | 569344        |
| train/                  |               |
|    approx_kl            | 0.00073178764 |
|    clip_fraction        | 0.00234       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.258        |
|    explained_variance   | 0.592         |
|    learning_rate        | 1e-06         |
|    loss                 | 128           |
|    n_updates            | 22850         |
|    policy_gradient_loss | -0.000532     |
|    value_loss           | 351           |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.03e+03     |
|    ep_rew_mean          | 1.89e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1122         |
|    time_elapsed         | 4892         |
|    total_timesteps      | 574464       |
| train/                  |              |
|    approx_kl            | 0.0014749365 |
|    clip_fraction        | 0.0125       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.376       |
|    explained_variance   | 0.876        |
|    learning_rate        | 1e-06        |
|    loss                 | 32.1         |
|    n_updates            | 22950        |
|    policy_gradient_loss | -0.00271     |
|    value_loss           | 92.2         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.05e+03     |
|    ep_rew_mean          | 1.92e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1132         |
|    time_elapsed         | 4936         |
|    total_timesteps      | 579584       |
| train/                  |              |
|    approx_kl            | 0.0038531567 |
|    clip_fraction        | 0.035        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.446       |
|    explained_variance   | 0.847        |
|    learning_rate        | 1e-06        |
|    loss                 | 60.3         |
|    n_updates            | 23050        |
|    policy_gradient_loss | -0.00479     |
|    value_loss           | 153          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.07e+03      |
|    ep_rew_mean          | 1.93e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 1142          |
|    time_elapsed         | 4979          |
|    total_timesteps      | 584704        |
| train/                  |               |
|    approx_kl            | 0.00024642702 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.43         |
|    explained_variance   | 0.821         |
|    learning_rate        | 1e-06         |
|    loss                 | 242           |
|    n_updates            | 23150         |
|    policy_gradient_loss | -0.000171     |
|    value_loss           | 399           |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.08e+03      |
|    ep_rew_mean          | 1.95e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 1152          |
|    time_elapsed         | 5024          |
|    total_timesteps      | 589824        |
| train/                  |               |
|    approx_kl            | 0.00014504662 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.31         |
|    explained_variance   | 0.838         |
|    learning_rate        | 1e-06         |
|    loss                 | 104           |
|    n_updates            | 23250         |
|    policy_gradient_loss | -0.00013      |
|    value_loss           | 274           |
-------------------------------------------
-----------------------------------------
| rollout/                |       

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.1e+03      |
|    ep_rew_mean          | 1.99e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1162         |
|    time_elapsed         | 5067         |
|    total_timesteps      | 594944       |
| train/                  |              |
|    approx_kl            | 0.0016850499 |
|    clip_fraction        | 0.0404       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.534       |
|    explained_variance   | 0.611        |
|    learning_rate        | 1e-06        |
|    loss                 | 865          |
|    n_updates            | 23350        |
|    policy_gradient_loss | -0.00168     |
|    value_loss           | 1.22e+03     |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.12e+03     |
|    ep_rew_mean          | 2.01e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1172         |
|    time_elapsed         | 5111         |
|    total_timesteps      | 600064       |
| train/                  |              |
|    approx_kl            | 0.0010034413 |
|    clip_fraction        | 0.00527      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.414       |
|    explained_variance   | 0.384        |
|    learning_rate        | 1e-06        |
|    loss                 | 81.2         |
|    n_updates            | 23450        |
|    policy_gradient_loss | -0.00253     |
|    value_loss           | 710          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.12e+03     |
|    ep_rew_mean          | 2e+03        |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1182         |
|    time_elapsed         | 5154         |
|    total_timesteps      | 605184       |
| train/                  |              |
|    approx_kl            | 0.0011102812 |
|    clip_fraction        | 0.0129       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.367       |
|    explained_variance   | 0.624        |
|    learning_rate        | 1e-06        |
|    loss                 | 160          |
|    n_updates            | 23550        |
|    policy_gradient_loss | 0.000953     |
|    value_loss           | 693          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.11e+03     |
|    ep_rew_mean          | 2e+03        |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1192         |
|    time_elapsed         | 5198         |
|    total_timesteps      | 610304       |
| train/                  |              |
|    approx_kl            | 0.0019176503 |
|    clip_fraction        | 0.0043       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.398       |
|    explained_variance   | 0.242        |
|    learning_rate        | 1e-06        |
|    loss                 | 443          |
|    n_updates            | 23650        |
|    policy_gradient_loss | -0.00108     |
|    value_loss           | 928          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.11e+03     |
|    ep_rew_mean          | 2e+03        |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1202         |
|    time_elapsed         | 5241         |
|    total_timesteps      | 615424       |
| train/                  |              |
|    approx_kl            | 0.0012200775 |
|    clip_fraction        | 0.00371      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.506       |
|    explained_variance   | 0.803        |
|    learning_rate        | 1e-06        |
|    loss                 | 204          |
|    n_updates            | 23750        |
|    policy_gradient_loss | -0.00191     |
|    value_loss           | 341          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.13e+03      |
|    ep_rew_mean          | 2.03e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 1212          |
|    time_elapsed         | 5286          |
|    total_timesteps      | 620544        |
| train/                  |               |
|    approx_kl            | 0.00067327695 |
|    clip_fraction        | 0.000977      |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.53         |
|    explained_variance   | 0.904         |
|    learning_rate        | 1e-06         |
|    loss                 | 58            |
|    n_updates            | 23850         |
|    policy_gradient_loss | -2.71e-05     |
|    value_loss           | 110           |
-------------------------------------------
------------------------------------------
| rollout/                |      

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.13e+03    |
|    ep_rew_mean          | 2.01e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 1222        |
|    time_elapsed         | 5329        |
|    total_timesteps      | 625664      |
| train/                  |             |
|    approx_kl            | 0.005594299 |
|    clip_fraction        | 0.0684      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.481      |
|    explained_variance   | 0.864       |
|    learning_rate        | 1e-06       |
|    loss                 | 58.6        |
|    n_updates            | 23950       |
|    policy_gradient_loss | -0.00425    |
|    value_loss           | 150         |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.13e+

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.14e+03     |
|    ep_rew_mean          | 2.03e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1232         |
|    time_elapsed         | 5373         |
|    total_timesteps      | 630784       |
| train/                  |              |
|    approx_kl            | 0.0001806434 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.289       |
|    explained_variance   | 0.871        |
|    learning_rate        | 1e-06        |
|    loss                 | 33.3         |
|    n_updates            | 24050        |
|    policy_gradient_loss | -0.000219    |
|    value_loss           | 149          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.14e+03      |
|    ep_rew_mean          | 2.04e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 1241          |
|    time_elapsed         | 5412          |
|    total_timesteps      | 635392        |
| train/                  |               |
|    approx_kl            | 0.00020176673 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.323        |
|    explained_variance   | 0.707         |
|    learning_rate        | 1e-06         |
|    loss                 | 185           |
|    n_updates            | 24140         |
|    policy_gradient_loss | -0.000504     |
|    value_loss           | 586           |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.14e+03      |
|    ep_rew_mean          | 2.04e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 1251          |
|    time_elapsed         | 5456          |
|    total_timesteps      | 640512        |
| train/                  |               |
|    approx_kl            | 4.8211543e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.305        |
|    explained_variance   | 0.493         |
|    learning_rate        | 1e-06         |
|    loss                 | 575           |
|    n_updates            | 24240         |
|    policy_gradient_loss | 0.000353      |
|    value_loss           | 779           |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.13e+03     |
|    ep_rew_mean          | 2.02e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1260         |
|    time_elapsed         | 5495         |
|    total_timesteps      | 645120       |
| train/                  |              |
|    approx_kl            | 0.0012441722 |
|    clip_fraction        | 0.00879      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.274       |
|    explained_variance   | 0.822        |
|    learning_rate        | 1e-06        |
|    loss                 | 110          |
|    n_updates            | 24330        |
|    policy_gradient_loss | -0.000279    |
|    value_loss           | 232          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.15e+03    |
|    ep_rew_mean          | 2.05e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 1270        |
|    time_elapsed         | 5539        |
|    total_timesteps      | 650240      |
| train/                  |             |
|    approx_kl            | 0.002609468 |
|    clip_fraction        | 0.0367      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.448      |
|    explained_variance   | 0.691       |
|    learning_rate        | 1e-06       |
|    loss                 | 83.2        |
|    n_updates            | 24430       |
|    policy_gradient_loss | -0.00387    |
|    value_loss           | 474         |
-----------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.15e+03     |
|    ep_rew_mean          | 2.07e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1280         |
|    time_elapsed         | 5582         |
|    total_timesteps      | 655360       |
| train/                  |              |
|    approx_kl            | 0.0042303465 |
|    clip_fraction        | 0.0102       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.731       |
|    explained_variance   | 0.942        |
|    learning_rate        | 1e-06        |
|    loss                 | 94.7         |
|    n_updates            | 24530        |
|    policy_gradient_loss | -0.00387     |
|    value_loss           | 150          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.17e+03     |
|    ep_rew_mean          | 2.1e+03      |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1290         |
|    time_elapsed         | 5626         |
|    total_timesteps      | 660480       |
| train/                  |              |
|    approx_kl            | 0.0009440661 |
|    clip_fraction        | 0.00156      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.382       |
|    explained_variance   | 0.809        |
|    learning_rate        | 1e-06        |
|    loss                 | 59.9         |
|    n_updates            | 24630        |
|    policy_gradient_loss | 0.000533     |
|    value_loss           | 183          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.13e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1300         |
|    time_elapsed         | 5670         |
|    total_timesteps      | 665600       |
| train/                  |              |
|    approx_kl            | 0.0013211521 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.339       |
|    explained_variance   | 0.848        |
|    learning_rate        | 1e-06        |
|    loss                 | 104          |
|    n_updates            | 24730        |
|    policy_gradient_loss | -0.00065     |
|    value_loss           | 237          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.21e+03     |
|    ep_rew_mean          | 2.14e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1310         |
|    time_elapsed         | 5714         |
|    total_timesteps      | 670720       |
| train/                  |              |
|    approx_kl            | 0.0022094348 |
|    clip_fraction        | 0.00605      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.454       |
|    explained_variance   | 0.9          |
|    learning_rate        | 1e-06        |
|    loss                 | 108          |
|    n_updates            | 24830        |
|    policy_gradient_loss | -0.00265     |
|    value_loss           | 225          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.17e+03     |
|    ep_rew_mean          | 2.1e+03      |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1320         |
|    time_elapsed         | 5757         |
|    total_timesteps      | 675840       |
| train/                  |              |
|    approx_kl            | 0.0011914321 |
|    clip_fraction        | 0.00996      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.234       |
|    explained_variance   | 0.844        |
|    learning_rate        | 1e-06        |
|    loss                 | 80.4         |
|    n_updates            | 24930        |
|    policy_gradient_loss | -0.000913    |
|    value_loss           | 215          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.19e+03    |
|    ep_rew_mean          | 2.12e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 1330        |
|    time_elapsed         | 5801        |
|    total_timesteps      | 680960      |
| train/                  |             |
|    approx_kl            | 0.008056819 |
|    clip_fraction        | 0.0402      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.47       |
|    explained_variance   | 0.953       |
|    learning_rate        | 1e-06       |
|    loss                 | 22.1        |
|    n_updates            | 25030       |
|    policy_gradient_loss | -0.00587    |
|    value_loss           | 95          |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.19

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.19e+03     |
|    ep_rew_mean          | 2.12e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1340         |
|    time_elapsed         | 5844         |
|    total_timesteps      | 686080       |
| train/                  |              |
|    approx_kl            | 0.0016997596 |
|    clip_fraction        | 0.0197       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.353       |
|    explained_variance   | 0.602        |
|    learning_rate        | 1e-06        |
|    loss                 | 279          |
|    n_updates            | 25130        |
|    policy_gradient_loss | 0.000352     |
|    value_loss           | 811          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.12e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1350         |
|    time_elapsed         | 5888         |
|    total_timesteps      | 691200       |
| train/                  |              |
|    approx_kl            | 0.0053161294 |
|    clip_fraction        | 0.0209       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.764       |
|    explained_variance   | 0.944        |
|    learning_rate        | 1e-06        |
|    loss                 | 199          |
|    n_updates            | 25230        |
|    policy_gradient_loss | 0.00254      |
|    value_loss           | 220          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.12e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1360         |
|    time_elapsed         | 5931         |
|    total_timesteps      | 696320       |
| train/                  |              |
|    approx_kl            | 0.0004790289 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.423       |
|    explained_variance   | 0.814        |
|    learning_rate        | 1e-06        |
|    loss                 | 23.9         |
|    n_updates            | 25330        |
|    policy_gradient_loss | 0.000299     |
|    value_loss           | 104          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.19e+03      |
|    ep_rew_mean          | 2.12e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 1370          |
|    time_elapsed         | 5975          |
|    total_timesteps      | 701440        |
| train/                  |               |
|    approx_kl            | 0.00094675634 |
|    clip_fraction        | 0.00137       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.326        |
|    explained_variance   | 0.875         |
|    learning_rate        | 1e-06         |
|    loss                 | 42.8          |
|    n_updates            | 25430         |
|    policy_gradient_loss | -0.000925     |
|    value_loss           | 99.3          |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.2e+03       |
|    ep_rew_mean          | 2.13e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 1380          |
|    time_elapsed         | 6018          |
|    total_timesteps      | 706560        |
| train/                  |               |
|    approx_kl            | 0.00043649483 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.339        |
|    explained_variance   | 0.655         |
|    learning_rate        | 1e-06         |
|    loss                 | 98.5          |
|    n_updates            | 25530         |
|    policy_gradient_loss | 0.000236      |
|    value_loss           | 456           |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.2e+03      |
|    ep_rew_mean          | 2.12e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1389         |
|    time_elapsed         | 6058         |
|    total_timesteps      | 711168       |
| train/                  |              |
|    approx_kl            | 0.0011828783 |
|    clip_fraction        | 0.00879      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.251       |
|    explained_variance   | 0.454        |
|    learning_rate        | 1e-06        |
|    loss                 | 288          |
|    n_updates            | 25620        |
|    policy_gradient_loss | -0.00234     |
|    value_loss           | 842          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.17e+03      |
|    ep_rew_mean          | 2.07e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 1399          |
|    time_elapsed         | 6101          |
|    total_timesteps      | 716288        |
| train/                  |               |
|    approx_kl            | 0.00075129967 |
|    clip_fraction        | 0.00625       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.247        |
|    explained_variance   | 0.918         |
|    learning_rate        | 1e-06         |
|    loss                 | 132           |
|    n_updates            | 25720         |
|    policy_gradient_loss | -0.000704     |
|    value_loss           | 200           |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.17e+03      |
|    ep_rew_mean          | 2.07e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 1409          |
|    time_elapsed         | 6145          |
|    total_timesteps      | 721408        |
| train/                  |               |
|    approx_kl            | 0.00064484077 |
|    clip_fraction        | 0.00488       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.451        |
|    explained_variance   | 0.552         |
|    learning_rate        | 1e-06         |
|    loss                 | 144           |
|    n_updates            | 25820         |
|    policy_gradient_loss | -0.00139      |
|    value_loss           | 539           |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.17e+03     |
|    ep_rew_mean          | 2.06e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1419         |
|    time_elapsed         | 6189         |
|    total_timesteps      | 726528       |
| train/                  |              |
|    approx_kl            | 0.0062315576 |
|    clip_fraction        | 0.0225       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.819       |
|    explained_variance   | 0.726        |
|    learning_rate        | 1e-06        |
|    loss                 | 127          |
|    n_updates            | 25920        |
|    policy_gradient_loss | -0.00241     |
|    value_loss           | 299          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.14e+03    |
|    ep_rew_mean          | 2.03e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 1429        |
|    time_elapsed         | 6233        |
|    total_timesteps      | 731648      |
| train/                  |             |
|    approx_kl            | 0.004278279 |
|    clip_fraction        | 0.0473      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.505      |
|    explained_variance   | 0.814       |
|    learning_rate        | 1e-06       |
|    loss                 | 31.3        |
|    n_updates            | 26020       |
|    policy_gradient_loss | -0.00531    |
|    value_loss           | 96.5        |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.14

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.14e+03     |
|    ep_rew_mean          | 2.02e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1439         |
|    time_elapsed         | 6276         |
|    total_timesteps      | 736768       |
| train/                  |              |
|    approx_kl            | 0.0032706398 |
|    clip_fraction        | 0.0182       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.406       |
|    explained_variance   | 0.188        |
|    learning_rate        | 1e-06        |
|    loss                 | 810          |
|    n_updates            | 26120        |
|    policy_gradient_loss | -0.00265     |
|    value_loss           | 880          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.13e+03    |
|    ep_rew_mean          | 2e+03       |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 1449        |
|    time_elapsed         | 6320        |
|    total_timesteps      | 741888      |
| train/                  |             |
|    approx_kl            | 0.005046799 |
|    clip_fraction        | 0.0383      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.5        |
|    explained_variance   | 0.613       |
|    learning_rate        | 1e-06       |
|    loss                 | 370         |
|    n_updates            | 26220       |
|    policy_gradient_loss | -0.00266    |
|    value_loss           | 1e+03       |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.13

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.13e+03     |
|    ep_rew_mean          | 2.01e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1459         |
|    time_elapsed         | 6363         |
|    total_timesteps      | 747008       |
| train/                  |              |
|    approx_kl            | 0.0020704274 |
|    clip_fraction        | 0.0297       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.435       |
|    explained_variance   | 0.518        |
|    learning_rate        | 1e-06        |
|    loss                 | 388          |
|    n_updates            | 26320        |
|    policy_gradient_loss | -0.000426    |
|    value_loss           | 1.03e+03     |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.14e+03    |
|    ep_rew_mean          | 2.02e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 1469        |
|    time_elapsed         | 6408        |
|    total_timesteps      | 752128      |
| train/                  |             |
|    approx_kl            | 0.004548206 |
|    clip_fraction        | 0.0498      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.62       |
|    explained_variance   | 0.785       |
|    learning_rate        | 1e-06       |
|    loss                 | 171         |
|    n_updates            | 26420       |
|    policy_gradient_loss | -0.0055     |
|    value_loss           | 315         |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.14

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.17e+03     |
|    ep_rew_mean          | 2.05e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1479         |
|    time_elapsed         | 6452         |
|    total_timesteps      | 757248       |
| train/                  |              |
|    approx_kl            | 0.0015010483 |
|    clip_fraction        | 0.0129       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.308       |
|    explained_variance   | 0.888        |
|    learning_rate        | 1e-06        |
|    loss                 | 87.3         |
|    n_updates            | 26520        |
|    policy_gradient_loss | -0.00177     |
|    value_loss           | 162          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.19e+03     |
|    ep_rew_mean          | 2.07e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1489         |
|    time_elapsed         | 6496         |
|    total_timesteps      | 762368       |
| train/                  |              |
|    approx_kl            | 0.0039347913 |
|    clip_fraction        | 0.0326       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.359       |
|    explained_variance   | 0.824        |
|    learning_rate        | 1e-06        |
|    loss                 | 33.4         |
|    n_updates            | 26620        |
|    policy_gradient_loss | -0.0043      |
|    value_loss           | 163          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.17e+03      |
|    ep_rew_mean          | 2.02e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 1499          |
|    time_elapsed         | 6539          |
|    total_timesteps      | 767488        |
| train/                  |               |
|    approx_kl            | 0.00068990584 |
|    clip_fraction        | 0.00215       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.359        |
|    explained_variance   | 0.893         |
|    learning_rate        | 1e-06         |
|    loss                 | 189           |
|    n_updates            | 26720         |
|    policy_gradient_loss | 0.00282       |
|    value_loss           | 298           |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.18e+03     |
|    ep_rew_mean          | 2.03e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1509         |
|    time_elapsed         | 6583         |
|    total_timesteps      | 772608       |
| train/                  |              |
|    approx_kl            | 0.0011296372 |
|    clip_fraction        | 0.00703      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.324       |
|    explained_variance   | 0.748        |
|    learning_rate        | 1e-06        |
|    loss                 | 88.3         |
|    n_updates            | 26820        |
|    policy_gradient_loss | -0.000496    |
|    value_loss           | 178          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.17e+03    |
|    ep_rew_mean          | 2.03e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 1519        |
|    time_elapsed         | 6626        |
|    total_timesteps      | 777728      |
| train/                  |             |
|    approx_kl            | 0.005074365 |
|    clip_fraction        | 0.0184      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.603      |
|    explained_variance   | 0.68        |
|    learning_rate        | 1e-06       |
|    loss                 | 177         |
|    n_updates            | 26920       |
|    policy_gradient_loss | -0.00741    |
|    value_loss           | 731         |
-----------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.14e+03    |
|    ep_rew_mean          | 2.01e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 1529        |
|    time_elapsed         | 6670        |
|    total_timesteps      | 782848      |
| train/                  |             |
|    approx_kl            | 0.000987839 |
|    clip_fraction        | 0.00352     |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.373      |
|    explained_variance   | 0.798       |
|    learning_rate        | 1e-06       |
|    loss                 | 76.3        |
|    n_updates            | 27020       |
|    policy_gradient_loss | -0.00134    |
|    value_loss           | 198         |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.14

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.14e+03      |
|    ep_rew_mean          | 2e+03         |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 1539          |
|    time_elapsed         | 6714          |
|    total_timesteps      | 787968        |
| train/                  |               |
|    approx_kl            | 0.00069089327 |
|    clip_fraction        | 0.00234       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.636        |
|    explained_variance   | 0.681         |
|    learning_rate        | 1e-06         |
|    loss                 | 68.9          |
|    n_updates            | 27120         |
|    policy_gradient_loss | -0.00169      |
|    value_loss           | 309           |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.15e+03      |
|    ep_rew_mean          | 2.02e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 1549          |
|    time_elapsed         | 6758          |
|    total_timesteps      | 793088        |
| train/                  |               |
|    approx_kl            | 0.00028770964 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.416        |
|    explained_variance   | 0.709         |
|    learning_rate        | 1e-06         |
|    loss                 | 90            |
|    n_updates            | 27220         |
|    policy_gradient_loss | -0.000896     |
|    value_loss           | 645           |
-------------------------------------------
-----------------------------------------
| rollout/                |       

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.15e+03     |
|    ep_rew_mean          | 2.02e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1559         |
|    time_elapsed         | 6801         |
|    total_timesteps      | 798208       |
| train/                  |              |
|    approx_kl            | 0.0023799168 |
|    clip_fraction        | 0.0264       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.251       |
|    explained_variance   | 0.739        |
|    learning_rate        | 1e-06        |
|    loss                 | 863          |
|    n_updates            | 27320        |
|    policy_gradient_loss | -0.00153     |
|    value_loss           | 769          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.14e+03     |
|    ep_rew_mean          | 2.01e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1569         |
|    time_elapsed         | 6845         |
|    total_timesteps      | 803328       |
| train/                  |              |
|    approx_kl            | 0.0020330893 |
|    clip_fraction        | 0.015        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.644       |
|    explained_variance   | 0.932        |
|    learning_rate        | 1e-06        |
|    loss                 | 27.8         |
|    n_updates            | 27420        |
|    policy_gradient_loss | -0.00155     |
|    value_loss           | 95.8         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.14e+03     |
|    ep_rew_mean          | 2.01e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1579         |
|    time_elapsed         | 6888         |
|    total_timesteps      | 808448       |
| train/                  |              |
|    approx_kl            | 0.0048275893 |
|    clip_fraction        | 0.0314       |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.08        |
|    explained_variance   | 0.685        |
|    learning_rate        | 1e-06        |
|    loss                 | 519          |
|    n_updates            | 27520        |
|    policy_gradient_loss | -0.000148    |
|    value_loss           | 1.31e+03     |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.12e+03     |
|    ep_rew_mean          | 1.98e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1589         |
|    time_elapsed         | 6932         |
|    total_timesteps      | 813568       |
| train/                  |              |
|    approx_kl            | 0.0012870036 |
|    clip_fraction        | 0.000586     |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.559       |
|    explained_variance   | 0.711        |
|    learning_rate        | 1e-06        |
|    loss                 | 323          |
|    n_updates            | 27620        |
|    policy_gradient_loss | -0.000586    |
|    value_loss           | 457          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.12e+03     |
|    ep_rew_mean          | 1.98e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1599         |
|    time_elapsed         | 6976         |
|    total_timesteps      | 818688       |
| train/                  |              |
|    approx_kl            | 0.0006284462 |
|    clip_fraction        | 0.000781     |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.361       |
|    explained_variance   | 0.542        |
|    learning_rate        | 1e-06        |
|    loss                 | 320          |
|    n_updates            | 27720        |
|    policy_gradient_loss | 0.00408      |
|    value_loss           | 758          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.12e+03     |
|    ep_rew_mean          | 1.97e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1609         |
|    time_elapsed         | 7019         |
|    total_timesteps      | 823808       |
| train/                  |              |
|    approx_kl            | 0.0012821858 |
|    clip_fraction        | 0.0117       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.502       |
|    explained_variance   | 0.93         |
|    learning_rate        | 1e-06        |
|    loss                 | 65.6         |
|    n_updates            | 27820        |
|    policy_gradient_loss | -0.00207     |
|    value_loss           | 142          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.14e+03      |
|    ep_rew_mean          | 1.98e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 1619          |
|    time_elapsed         | 7063          |
|    total_timesteps      | 828928        |
| train/                  |               |
|    approx_kl            | 0.00042148598 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.343        |
|    explained_variance   | 0.834         |
|    learning_rate        | 1e-06         |
|    loss                 | 153           |
|    n_updates            | 27920         |
|    policy_gradient_loss | -0.00104      |
|    value_loss           | 245           |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.13e+03     |
|    ep_rew_mean          | 1.99e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1629         |
|    time_elapsed         | 7106         |
|    total_timesteps      | 834048       |
| train/                  |              |
|    approx_kl            | 0.0016989195 |
|    clip_fraction        | 0.0043       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.348       |
|    explained_variance   | 0.846        |
|    learning_rate        | 1e-06        |
|    loss                 | 50.6         |
|    n_updates            | 28020        |
|    policy_gradient_loss | -0.000578    |
|    value_loss           | 129          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.14e+03      |
|    ep_rew_mean          | 2e+03         |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 1639          |
|    time_elapsed         | 7151          |
|    total_timesteps      | 839168        |
| train/                  |               |
|    approx_kl            | 0.00031637133 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.341        |
|    explained_variance   | 0.743         |
|    learning_rate        | 1e-06         |
|    loss                 | 276           |
|    n_updates            | 28120         |
|    policy_gradient_loss | -0.000287     |
|    value_loss           | 458           |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.15e+03     |
|    ep_rew_mean          | 2.02e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1649         |
|    time_elapsed         | 7194         |
|    total_timesteps      | 844288       |
| train/                  |              |
|    approx_kl            | 0.0031545726 |
|    clip_fraction        | 0.00273      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.743       |
|    explained_variance   | 0.75         |
|    learning_rate        | 1e-06        |
|    loss                 | 386          |
|    n_updates            | 28220        |
|    policy_gradient_loss | -0.000321    |
|    value_loss           | 739          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.14e+03     |
|    ep_rew_mean          | 2.01e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1659         |
|    time_elapsed         | 7238         |
|    total_timesteps      | 849408       |
| train/                  |              |
|    approx_kl            | 0.0019172318 |
|    clip_fraction        | 0.00762      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.296       |
|    explained_variance   | 0.873        |
|    learning_rate        | 1e-06        |
|    loss                 | 111          |
|    n_updates            | 28320        |
|    policy_gradient_loss | -0.00153     |
|    value_loss           | 192          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.15e+03     |
|    ep_rew_mean          | 2.01e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1669         |
|    time_elapsed         | 7282         |
|    total_timesteps      | 854528       |
| train/                  |              |
|    approx_kl            | 0.0012512153 |
|    clip_fraction        | 0.00352      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.22        |
|    explained_variance   | 0.808        |
|    learning_rate        | 1e-06        |
|    loss                 | 39.8         |
|    n_updates            | 28420        |
|    policy_gradient_loss | -0.00112     |
|    value_loss           | 101          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.14e+03      |
|    ep_rew_mean          | 1.99e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 1679          |
|    time_elapsed         | 7326          |
|    total_timesteps      | 859648        |
| train/                  |               |
|    approx_kl            | 0.00016459695 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.18         |
|    explained_variance   | 0.737         |
|    learning_rate        | 1e-06         |
|    loss                 | 290           |
|    n_updates            | 28520         |
|    policy_gradient_loss | 4.94e-05      |
|    value_loss           | 569           |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.15e+03     |
|    ep_rew_mean          | 2e+03        |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1689         |
|    time_elapsed         | 7369         |
|    total_timesteps      | 864768       |
| train/                  |              |
|    approx_kl            | 0.0002018928 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.219       |
|    explained_variance   | 0.869        |
|    learning_rate        | 1e-06        |
|    loss                 | 79.8         |
|    n_updates            | 28620        |
|    policy_gradient_loss | -0.000927    |
|    value_loss           | 138          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.09e+03      |
|    ep_rew_mean          | 1.93e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 1699          |
|    time_elapsed         | 7413          |
|    total_timesteps      | 869888        |
| train/                  |               |
|    approx_kl            | 0.00055260747 |
|    clip_fraction        | 0.00527       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.182        |
|    explained_variance   | 0.344         |
|    learning_rate        | 1e-06         |
|    loss                 | 361           |
|    n_updates            | 28720         |
|    policy_gradient_loss | -0.000415     |
|    value_loss           | 842           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.09e+03     |
|    ep_rew_mean          | 1.95e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1709         |
|    time_elapsed         | 7457         |
|    total_timesteps      | 875008       |
| train/                  |              |
|    approx_kl            | 0.0009212557 |
|    clip_fraction        | 0.00625      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.186       |
|    explained_variance   | 0.528        |
|    learning_rate        | 1e-06        |
|    loss                 | 428          |
|    n_updates            | 28820        |
|    policy_gradient_loss | -0.00253     |
|    value_loss           | 764          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.08e+03     |
|    ep_rew_mean          | 1.93e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1719         |
|    time_elapsed         | 7501         |
|    total_timesteps      | 880128       |
| train/                  |              |
|    approx_kl            | 0.0030185767 |
|    clip_fraction        | 0.0139       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.486       |
|    explained_variance   | 0.963        |
|    learning_rate        | 1e-06        |
|    loss                 | 76.2         |
|    n_updates            | 28920        |
|    policy_gradient_loss | -0.00296     |
|    value_loss           | 132          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.09e+03    |
|    ep_rew_mean          | 1.93e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 1729        |
|    time_elapsed         | 7544        |
|    total_timesteps      | 885248      |
| train/                  |             |
|    approx_kl            | 0.001250602 |
|    clip_fraction        | 0.0129      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.216      |
|    explained_variance   | 0.504       |
|    learning_rate        | 1e-06       |
|    loss                 | 454         |
|    n_updates            | 29020       |
|    policy_gradient_loss | -0.000826   |
|    value_loss           | 764         |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.08

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.08e+03     |
|    ep_rew_mean          | 1.93e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1739         |
|    time_elapsed         | 7588         |
|    total_timesteps      | 890368       |
| train/                  |              |
|    approx_kl            | 0.0019900957 |
|    clip_fraction        | 0.0111       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.359       |
|    explained_variance   | 0.851        |
|    learning_rate        | 1e-06        |
|    loss                 | 53.1         |
|    n_updates            | 29120        |
|    policy_gradient_loss | -0.000675    |
|    value_loss           | 205          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.1e+03      |
|    ep_rew_mean          | 1.95e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1749         |
|    time_elapsed         | 7631         |
|    total_timesteps      | 895488       |
| train/                  |              |
|    approx_kl            | 0.0016345431 |
|    clip_fraction        | 0.00391      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.396       |
|    explained_variance   | 0.901        |
|    learning_rate        | 1e-06        |
|    loss                 | 50           |
|    n_updates            | 29220        |
|    policy_gradient_loss | -0.0017      |
|    value_loss           | 114          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.1e+03      |
|    ep_rew_mean          | 1.96e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1759         |
|    time_elapsed         | 7675         |
|    total_timesteps      | 900608       |
| train/                  |              |
|    approx_kl            | 0.0028774955 |
|    clip_fraction        | 0.0191       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.444       |
|    explained_variance   | 0.852        |
|    learning_rate        | 1e-06        |
|    loss                 | 109          |
|    n_updates            | 29320        |
|    policy_gradient_loss | -0.00153     |
|    value_loss           | 201          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.12e+03     |
|    ep_rew_mean          | 1.97e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1769         |
|    time_elapsed         | 7718         |
|    total_timesteps      | 905728       |
| train/                  |              |
|    approx_kl            | 9.419385e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.279       |
|    explained_variance   | 0.934        |
|    learning_rate        | 1e-06        |
|    loss                 | 62.1         |
|    n_updates            | 29420        |
|    policy_gradient_loss | -0.000248    |
|    value_loss           | 139          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.11e+03     |
|    ep_rew_mean          | 1.97e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1779         |
|    time_elapsed         | 7763         |
|    total_timesteps      | 910848       |
| train/                  |              |
|    approx_kl            | 0.0016049944 |
|    clip_fraction        | 0.0043       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.485       |
|    explained_variance   | 0.953        |
|    learning_rate        | 1e-06        |
|    loss                 | 68.4         |
|    n_updates            | 29520        |
|    policy_gradient_loss | -0.0024      |
|    value_loss           | 147          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.11e+03     |
|    ep_rew_mean          | 1.96e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1789         |
|    time_elapsed         | 7806         |
|    total_timesteps      | 915968       |
| train/                  |              |
|    approx_kl            | 0.0007443484 |
|    clip_fraction        | 0.017        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.484       |
|    explained_variance   | 0.747        |
|    learning_rate        | 1e-06        |
|    loss                 | 156          |
|    n_updates            | 29620        |
|    policy_gradient_loss | -0.00141     |
|    value_loss           | 626          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

--------------------------------------------
| rollout/                |                |
|    ep_len_mean          | 1.11e+03       |
|    ep_rew_mean          | 1.95e+03       |
| time/                   |                |
|    fps                  | 117            |
|    iterations           | 1799           |
|    time_elapsed         | 7850           |
|    total_timesteps      | 921088         |
| train/                  |                |
|    approx_kl            | 0.000117898686 |
|    clip_fraction        | 0.0129         |
|    clip_range           | 0.2            |
|    entropy_loss         | -0.324         |
|    explained_variance   | 0.55           |
|    learning_rate        | 1e-06          |
|    loss                 | 286            |
|    n_updates            | 29720          |
|    policy_gradient_loss | 0.000313       |
|    value_loss           | 776            |
--------------------------------------------
------------------------------------------
| rollout/  

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.12e+03      |
|    ep_rew_mean          | 1.97e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 1808          |
|    time_elapsed         | 7888          |
|    total_timesteps      | 925696        |
| train/                  |               |
|    approx_kl            | 0.00025658717 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.388        |
|    explained_variance   | 0.906         |
|    learning_rate        | 1e-06         |
|    loss                 | 110           |
|    n_updates            | 29810         |
|    policy_gradient_loss | 0.000673      |
|    value_loss           | 177           |
-------------------------------------------
-----------------------------------------
| rollout/                |       

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.13e+03      |
|    ep_rew_mean          | 1.98e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 1818          |
|    time_elapsed         | 7933          |
|    total_timesteps      | 930816        |
| train/                  |               |
|    approx_kl            | 0.00079214305 |
|    clip_fraction        | 0.000977      |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.34         |
|    explained_variance   | 0.878         |
|    learning_rate        | 1e-06         |
|    loss                 | 88.6          |
|    n_updates            | 29910         |
|    policy_gradient_loss | -0.0041       |
|    value_loss           | 164           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.12e+03     |
|    ep_rew_mean          | 1.98e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1828         |
|    time_elapsed         | 7976         |
|    total_timesteps      | 935936       |
| train/                  |              |
|    approx_kl            | 0.0019603148 |
|    clip_fraction        | 0.0146       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.211       |
|    explained_variance   | 0.503        |
|    learning_rate        | 1e-06        |
|    loss                 | 315          |
|    n_updates            | 30010        |
|    policy_gradient_loss | -0.00364     |
|    value_loss           | 769          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.12e+03      |
|    ep_rew_mean          | 1.98e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 1838          |
|    time_elapsed         | 8020          |
|    total_timesteps      | 941056        |
| train/                  |               |
|    approx_kl            | 0.00091321405 |
|    clip_fraction        | 0.00254       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.254        |
|    explained_variance   | 0.81          |
|    learning_rate        | 1e-06         |
|    loss                 | 86.6          |
|    n_updates            | 30110         |
|    policy_gradient_loss | -0.00217      |
|    value_loss           | 180           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.11e+03     |
|    ep_rew_mean          | 1.98e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1847         |
|    time_elapsed         | 8059         |
|    total_timesteps      | 945664       |
| train/                  |              |
|    approx_kl            | 0.0033009362 |
|    clip_fraction        | 0.0172       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.758       |
|    explained_variance   | 0.842        |
|    learning_rate        | 1e-06        |
|    loss                 | 83           |
|    n_updates            | 30200        |
|    policy_gradient_loss | -0.000127    |
|    value_loss           | 329          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.11e+03     |
|    ep_rew_mean          | 1.96e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1857         |
|    time_elapsed         | 8103         |
|    total_timesteps      | 950784       |
| train/                  |              |
|    approx_kl            | 0.0011467295 |
|    clip_fraction        | 0.000586     |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.454       |
|    explained_variance   | 0.944        |
|    learning_rate        | 1e-06        |
|    loss                 | 54.6         |
|    n_updates            | 30300        |
|    policy_gradient_loss | -0.000494    |
|    value_loss           | 213          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.08e+03     |
|    ep_rew_mean          | 1.93e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1867         |
|    time_elapsed         | 8146         |
|    total_timesteps      | 955904       |
| train/                  |              |
|    approx_kl            | 0.0017795286 |
|    clip_fraction        | 0.00937      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.336       |
|    explained_variance   | 0.828        |
|    learning_rate        | 1e-06        |
|    loss                 | 73.1         |
|    n_updates            | 30400        |
|    policy_gradient_loss | -0.00106     |
|    value_loss           | 180          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.09e+03     |
|    ep_rew_mean          | 1.94e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1877         |
|    time_elapsed         | 8190         |
|    total_timesteps      | 961024       |
| train/                  |              |
|    approx_kl            | 0.0016480386 |
|    clip_fraction        | 0.0305       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.351       |
|    explained_variance   | 0.843        |
|    learning_rate        | 1e-06        |
|    loss                 | 91.5         |
|    n_updates            | 30500        |
|    policy_gradient_loss | -0.000511    |
|    value_loss           | 191          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.09e+03     |
|    ep_rew_mean          | 1.95e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1887         |
|    time_elapsed         | 8234         |
|    total_timesteps      | 966144       |
| train/                  |              |
|    approx_kl            | 0.0012228881 |
|    clip_fraction        | 0.00391      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.327       |
|    explained_variance   | 0.583        |
|    learning_rate        | 1e-06        |
|    loss                 | 211          |
|    n_updates            | 30600        |
|    policy_gradient_loss | 0.00116      |
|    value_loss           | 516          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.07e+03      |
|    ep_rew_mean          | 1.94e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 1897          |
|    time_elapsed         | 8278          |
|    total_timesteps      | 971264        |
| train/                  |               |
|    approx_kl            | 0.00041913625 |
|    clip_fraction        | 0.00293       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.193        |
|    explained_variance   | 0.767         |
|    learning_rate        | 1e-06         |
|    loss                 | 53.1          |
|    n_updates            | 30700         |
|    policy_gradient_loss | 0.000208      |
|    value_loss           | 154           |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.07e+03     |
|    ep_rew_mean          | 1.94e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1907         |
|    time_elapsed         | 8321         |
|    total_timesteps      | 976384       |
| train/                  |              |
|    approx_kl            | 0.0011955647 |
|    clip_fraction        | 0.00957      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.233       |
|    explained_variance   | 0.922        |
|    learning_rate        | 1e-06        |
|    loss                 | 45.1         |
|    n_updates            | 30800        |
|    policy_gradient_loss | -0.00254     |
|    value_loss           | 128          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.09e+03     |
|    ep_rew_mean          | 1.97e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1917         |
|    time_elapsed         | 8365         |
|    total_timesteps      | 981504       |
| train/                  |              |
|    approx_kl            | 0.0013634171 |
|    clip_fraction        | 0.00859      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.314       |
|    explained_variance   | 0.583        |
|    learning_rate        | 1e-06        |
|    loss                 | 611          |
|    n_updates            | 30900        |
|    policy_gradient_loss | -0.00155     |
|    value_loss           | 901          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.11e+03    |
|    ep_rew_mean          | 2.01e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 1927        |
|    time_elapsed         | 8408        |
|    total_timesteps      | 986624      |
| train/                  |             |
|    approx_kl            | 0.002506988 |
|    clip_fraction        | 0.0139      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.486      |
|    explained_variance   | 0.805       |
|    learning_rate        | 1e-06       |
|    loss                 | 62.1        |
|    n_updates            | 31000       |
|    policy_gradient_loss | -0.00173    |
|    value_loss           | 146         |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.11

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.11e+03      |
|    ep_rew_mean          | 2.01e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 1937          |
|    time_elapsed         | 8452          |
|    total_timesteps      | 991744        |
| train/                  |               |
|    approx_kl            | 0.00047454948 |
|    clip_fraction        | 0.00762       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.412        |
|    explained_variance   | 0.787         |
|    learning_rate        | 1e-06         |
|    loss                 | 120           |
|    n_updates            | 31100         |
|    policy_gradient_loss | 4.5e-05       |
|    value_loss           | 270           |
-------------------------------------------
------------------------------------------
| rollout/                |      

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.11e+03    |
|    ep_rew_mean          | 2.04e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 1947        |
|    time_elapsed         | 8495        |
|    total_timesteps      | 996864      |
| train/                  |             |
|    approx_kl            | 0.005502876 |
|    clip_fraction        | 0.0424      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.404      |
|    explained_variance   | 0.471       |
|    learning_rate        | 1e-06       |
|    loss                 | 465         |
|    n_updates            | 31200       |
|    policy_gradient_loss | -0.0117     |
|    value_loss           | 761         |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.11

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.13e+03    |
|    ep_rew_mean          | 2.06e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 1957        |
|    time_elapsed         | 8539        |
|    total_timesteps      | 1001984     |
| train/                  |             |
|    approx_kl            | 0.001118244 |
|    clip_fraction        | 0.0104      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.397      |
|    explained_variance   | 0.479       |
|    learning_rate        | 1e-06       |
|    loss                 | 316         |
|    n_updates            | 31300       |
|    policy_gradient_loss | -0.00533    |
|    value_loss           | 814         |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.13

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.12e+03     |
|    ep_rew_mean          | 2.05e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1967         |
|    time_elapsed         | 8582         |
|    total_timesteps      | 1007104      |
| train/                  |              |
|    approx_kl            | 0.0014838703 |
|    clip_fraction        | 0.0176       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.238       |
|    explained_variance   | 0.709        |
|    learning_rate        | 1e-06        |
|    loss                 | 55           |
|    n_updates            | 31400        |
|    policy_gradient_loss | -0.00169     |
|    value_loss           | 126          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.12e+03    |
|    ep_rew_mean          | 2.06e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 1977        |
|    time_elapsed         | 8626        |
|    total_timesteps      | 1012224     |
| train/                  |             |
|    approx_kl            | 0.004417921 |
|    clip_fraction        | 0.0252      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.281      |
|    explained_variance   | 0.897       |
|    learning_rate        | 1e-06       |
|    loss                 | 42          |
|    n_updates            | 31500       |
|    policy_gradient_loss | -0.00424    |
|    value_loss           | 119         |
-----------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.11e+03     |
|    ep_rew_mean          | 2.05e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 1987         |
|    time_elapsed         | 8670         |
|    total_timesteps      | 1017344      |
| train/                  |              |
|    approx_kl            | 0.0047096885 |
|    clip_fraction        | 0.00332      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.931       |
|    explained_variance   | 0.772        |
|    learning_rate        | 1e-06        |
|    loss                 | 43.9         |
|    n_updates            | 31600        |
|    policy_gradient_loss | -0.000621    |
|    value_loss           | 148          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.14e+03      |
|    ep_rew_mean          | 2.07e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 1997          |
|    time_elapsed         | 8714          |
|    total_timesteps      | 1022464       |
| train/                  |               |
|    approx_kl            | 0.00012185937 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.257        |
|    explained_variance   | 0.224         |
|    learning_rate        | 1e-06         |
|    loss                 | 631           |
|    n_updates            | 31700         |
|    policy_gradient_loss | 0.00131       |
|    value_loss           | 877           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.14e+03     |
|    ep_rew_mean          | 2.09e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2006         |
|    time_elapsed         | 8753         |
|    total_timesteps      | 1027072      |
| train/                  |              |
|    approx_kl            | 0.0004683527 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.329       |
|    explained_variance   | 0.823        |
|    learning_rate        | 1e-06        |
|    loss                 | 65.2         |
|    n_updates            | 31790        |
|    policy_gradient_loss | 6.14e-05     |
|    value_loss           | 180          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.12e+03     |
|    ep_rew_mean          | 2.06e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2016         |
|    time_elapsed         | 8798         |
|    total_timesteps      | 1032192      |
| train/                  |              |
|    approx_kl            | 0.0022715323 |
|    clip_fraction        | 0.0262       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.286       |
|    explained_variance   | 0.577        |
|    learning_rate        | 1e-06        |
|    loss                 | 209          |
|    n_updates            | 31890        |
|    policy_gradient_loss | -0.00274     |
|    value_loss           | 859          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.12e+03      |
|    ep_rew_mean          | 2.06e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 2025          |
|    time_elapsed         | 8836          |
|    total_timesteps      | 1036800       |
| train/                  |               |
|    approx_kl            | 0.00027643505 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.304        |
|    explained_variance   | 0.745         |
|    learning_rate        | 1e-06         |
|    loss                 | 170           |
|    n_updates            | 31980         |
|    policy_gradient_loss | -0.000867     |
|    value_loss           | 170           |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.11e+03      |
|    ep_rew_mean          | 2.04e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 2035          |
|    time_elapsed         | 8881          |
|    total_timesteps      | 1041920       |
| train/                  |               |
|    approx_kl            | 0.00016203371 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.225        |
|    explained_variance   | 0.9           |
|    learning_rate        | 1e-06         |
|    loss                 | 49.8          |
|    n_updates            | 32080         |
|    policy_gradient_loss | -0.000243     |
|    value_loss           | 194           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.11e+03     |
|    ep_rew_mean          | 2.05e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2045         |
|    time_elapsed         | 8924         |
|    total_timesteps      | 1047040      |
| train/                  |              |
|    approx_kl            | 0.0038389433 |
|    clip_fraction        | 0.00742      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.647       |
|    explained_variance   | 0.893        |
|    learning_rate        | 1e-06        |
|    loss                 | 114          |
|    n_updates            | 32180        |
|    policy_gradient_loss | -0.00133     |
|    value_loss           | 452          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.09e+03    |
|    ep_rew_mean          | 2.02e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 2055        |
|    time_elapsed         | 8968        |
|    total_timesteps      | 1052160     |
| train/                  |             |
|    approx_kl            | 0.007550785 |
|    clip_fraction        | 0.0422      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.704      |
|    explained_variance   | 0.925       |
|    learning_rate        | 1e-06       |
|    loss                 | 38.8        |
|    n_updates            | 32280       |
|    policy_gradient_loss | -0.00191    |
|    value_loss           | 200         |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.1e+0

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.1e+03      |
|    ep_rew_mean          | 2.03e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2065         |
|    time_elapsed         | 9011         |
|    total_timesteps      | 1057280      |
| train/                  |              |
|    approx_kl            | 0.0018741749 |
|    clip_fraction        | 0.00996      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.336       |
|    explained_variance   | 0.704        |
|    learning_rate        | 1e-06        |
|    loss                 | 109          |
|    n_updates            | 32380        |
|    policy_gradient_loss | 0.000935     |
|    value_loss           | 559          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.11e+03     |
|    ep_rew_mean          | 2.04e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2075         |
|    time_elapsed         | 9055         |
|    total_timesteps      | 1062400      |
| train/                  |              |
|    approx_kl            | 0.0046231598 |
|    clip_fraction        | 0.0324       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.391       |
|    explained_variance   | 0.929        |
|    learning_rate        | 1e-06        |
|    loss                 | 93.4         |
|    n_updates            | 32480        |
|    policy_gradient_loss | -0.00579     |
|    value_loss           | 240          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.1e+03      |
|    ep_rew_mean          | 2.04e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2085         |
|    time_elapsed         | 9098         |
|    total_timesteps      | 1067520      |
| train/                  |              |
|    approx_kl            | 0.0011712655 |
|    clip_fraction        | 0.00449      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.194       |
|    explained_variance   | 0.766        |
|    learning_rate        | 1e-06        |
|    loss                 | 218          |
|    n_updates            | 32580        |
|    policy_gradient_loss | -0.00156     |
|    value_loss           | 517          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.09e+03     |
|    ep_rew_mean          | 2.02e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2095         |
|    time_elapsed         | 9142         |
|    total_timesteps      | 1072640      |
| train/                  |              |
|    approx_kl            | 0.0010995886 |
|    clip_fraction        | 0.00332      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.272       |
|    explained_variance   | 0.572        |
|    learning_rate        | 1e-06        |
|    loss                 | 65.2         |
|    n_updates            | 32680        |
|    policy_gradient_loss | -6.27e-06    |
|    value_loss           | 206          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.08e+03     |
|    ep_rew_mean          | 2.01e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2105         |
|    time_elapsed         | 9186         |
|    total_timesteps      | 1077760      |
| train/                  |              |
|    approx_kl            | 0.0004467842 |
|    clip_fraction        | 0.00313      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.278       |
|    explained_variance   | 0.828        |
|    learning_rate        | 1e-06        |
|    loss                 | 73.4         |
|    n_updates            | 32780        |
|    policy_gradient_loss | -0.000182    |
|    value_loss           | 173          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.11e+03    |
|    ep_rew_mean          | 2.04e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 2115        |
|    time_elapsed         | 9230        |
|    total_timesteps      | 1082880     |
| train/                  |             |
|    approx_kl            | 0.003630721 |
|    clip_fraction        | 0.0256      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.688      |
|    explained_variance   | 0.975       |
|    learning_rate        | 1e-06       |
|    loss                 | 26.2        |
|    n_updates            | 32880       |
|    policy_gradient_loss | -0.00355    |
|    value_loss           | 106         |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.11e+

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.12e+03    |
|    ep_rew_mean          | 2.03e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 2125        |
|    time_elapsed         | 9273        |
|    total_timesteps      | 1088000     |
| train/                  |             |
|    approx_kl            | 0.004030745 |
|    clip_fraction        | 0.034       |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.367      |
|    explained_variance   | 0.722       |
|    learning_rate        | 1e-06       |
|    loss                 | 386         |
|    n_updates            | 32980       |
|    policy_gradient_loss | -0.00398    |
|    value_loss           | 513         |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.12e+

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.1e+03     |
|    ep_rew_mean          | 2e+03       |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 2135        |
|    time_elapsed         | 9317        |
|    total_timesteps      | 1093120     |
| train/                  |             |
|    approx_kl            | 0.007229965 |
|    clip_fraction        | 0.0836      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.528      |
|    explained_variance   | 0.28        |
|    learning_rate        | 1e-06       |
|    loss                 | 412         |
|    n_updates            | 33080       |
|    policy_gradient_loss | -0.000349   |
|    value_loss           | 873         |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.09

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.09e+03     |
|    ep_rew_mean          | 1.98e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2145         |
|    time_elapsed         | 9361         |
|    total_timesteps      | 1098240      |
| train/                  |              |
|    approx_kl            | 0.0002645069 |
|    clip_fraction        | 0.000195     |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.364       |
|    explained_variance   | 0.789        |
|    learning_rate        | 1e-06        |
|    loss                 | 40.5         |
|    n_updates            | 33180        |
|    policy_gradient_loss | -0.00136     |
|    value_loss           | 133          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.08e+03      |
|    ep_rew_mean          | 1.96e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 2155          |
|    time_elapsed         | 9405          |
|    total_timesteps      | 1103360       |
| train/                  |               |
|    approx_kl            | 0.00057803956 |
|    clip_fraction        | 0.000586      |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.337        |
|    explained_variance   | 0.473         |
|    learning_rate        | 1e-06         |
|    loss                 | 720           |
|    n_updates            | 33280         |
|    policy_gradient_loss | -0.000461     |
|    value_loss           | 999           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.06e+03     |
|    ep_rew_mean          | 1.91e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2165         |
|    time_elapsed         | 9448         |
|    total_timesteps      | 1108480      |
| train/                  |              |
|    approx_kl            | 0.0027035763 |
|    clip_fraction        | 0.0254       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.575       |
|    explained_variance   | 0.716        |
|    learning_rate        | 1e-06        |
|    loss                 | 177          |
|    n_updates            | 33380        |
|    policy_gradient_loss | -0.000709    |
|    value_loss           | 386          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.05e+03      |
|    ep_rew_mean          | 1.88e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 2175          |
|    time_elapsed         | 9492          |
|    total_timesteps      | 1113600       |
| train/                  |               |
|    approx_kl            | 0.00028819242 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.32         |
|    explained_variance   | 0.786         |
|    learning_rate        | 1e-06         |
|    loss                 | 416           |
|    n_updates            | 33480         |
|    policy_gradient_loss | -0.00041      |
|    value_loss           | 462           |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 993          |
|    ep_rew_mean          | 1.82e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2185         |
|    time_elapsed         | 9536         |
|    total_timesteps      | 1118720      |
| train/                  |              |
|    approx_kl            | 0.0012255214 |
|    clip_fraction        | 0.00742      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.291       |
|    explained_variance   | 0.814        |
|    learning_rate        | 1e-06        |
|    loss                 | 52.8         |
|    n_updates            | 33580        |
|    policy_gradient_loss | -0.0015      |
|    value_loss           | 131          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 995          |
|    ep_rew_mean          | 1.82e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2195         |
|    time_elapsed         | 9579         |
|    total_timesteps      | 1123840      |
| train/                  |              |
|    approx_kl            | 0.0019219305 |
|    clip_fraction        | 0.0332       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.283       |
|    explained_variance   | 0.544        |
|    learning_rate        | 1e-06        |
|    loss                 | 342          |
|    n_updates            | 33680        |
|    policy_gradient_loss | -0.00237     |
|    value_loss           | 837          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1e+03        |
|    ep_rew_mean          | 1.82e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2205         |
|    time_elapsed         | 9623         |
|    total_timesteps      | 1128960      |
| train/                  |              |
|    approx_kl            | 0.0024364693 |
|    clip_fraction        | 0.0209       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.219       |
|    explained_variance   | 0.658        |
|    learning_rate        | 1e-06        |
|    loss                 | 119          |
|    n_updates            | 33780        |
|    policy_gradient_loss | -0.00173     |
|    value_loss           | 753          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1e+03         |
|    ep_rew_mean          | 1.82e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 2215          |
|    time_elapsed         | 9667          |
|    total_timesteps      | 1134080       |
| train/                  |               |
|    approx_kl            | 0.00088321103 |
|    clip_fraction        | 0.00234       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.332        |
|    explained_variance   | 0.925         |
|    learning_rate        | 1e-06         |
|    loss                 | 39.9          |
|    n_updates            | 33880         |
|    policy_gradient_loss | 0.000346      |
|    value_loss           | 129           |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.01e+03      |
|    ep_rew_mean          | 1.83e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 2225          |
|    time_elapsed         | 9711          |
|    total_timesteps      | 1139200       |
| train/                  |               |
|    approx_kl            | 0.00021333713 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.177        |
|    explained_variance   | 0.683         |
|    learning_rate        | 1e-06         |
|    loss                 | 239           |
|    n_updates            | 33980         |
|    policy_gradient_loss | 0.000594      |
|    value_loss           | 520           |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.01e+03      |
|    ep_rew_mean          | 1.82e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 2235          |
|    time_elapsed         | 9754          |
|    total_timesteps      | 1144320       |
| train/                  |               |
|    approx_kl            | 0.00025983818 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.207        |
|    explained_variance   | 0.86          |
|    learning_rate        | 1e-06         |
|    loss                 | 119           |
|    n_updates            | 34080         |
|    policy_gradient_loss | -0.000661     |
|    value_loss           | 244           |
-------------------------------------------
-----------------------------------------
| rollout/                |       

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.01e+03    |
|    ep_rew_mean          | 1.82e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 2245        |
|    time_elapsed         | 9798        |
|    total_timesteps      | 1149440     |
| train/                  |             |
|    approx_kl            | 0.001394995 |
|    clip_fraction        | 0.0285      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.234      |
|    explained_variance   | 0.668       |
|    learning_rate        | 1e-06       |
|    loss                 | 352         |
|    n_updates            | 34180       |
|    policy_gradient_loss | -0.00402    |
|    value_loss           | 834         |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.01

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.02e+03     |
|    ep_rew_mean          | 1.85e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2255         |
|    time_elapsed         | 9841         |
|    total_timesteps      | 1154560      |
| train/                  |              |
|    approx_kl            | 0.0005144718 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.276       |
|    explained_variance   | 0.855        |
|    learning_rate        | 1e-06        |
|    loss                 | 27.8         |
|    n_updates            | 34280        |
|    policy_gradient_loss | 0.000676     |
|    value_loss           | 68.7         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.02e+03      |
|    ep_rew_mean          | 1.85e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 2265          |
|    time_elapsed         | 9885          |
|    total_timesteps      | 1159680       |
| train/                  |               |
|    approx_kl            | 0.00036583818 |
|    clip_fraction        | 0.00117       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.234        |
|    explained_variance   | 0.359         |
|    learning_rate        | 1e-06         |
|    loss                 | 144           |
|    n_updates            | 34380         |
|    policy_gradient_loss | 0.000423      |
|    value_loss           | 764           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.01e+03    |
|    ep_rew_mean          | 1.85e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 2275        |
|    time_elapsed         | 9928        |
|    total_timesteps      | 1164800     |
| train/                  |             |
|    approx_kl            | 0.002979248 |
|    clip_fraction        | 0.0082      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.323      |
|    explained_variance   | 0.745       |
|    learning_rate        | 1e-06       |
|    loss                 | 96.9        |
|    n_updates            | 34480       |
|    policy_gradient_loss | -0.000877   |
|    value_loss           | 252         |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.01

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.02e+03     |
|    ep_rew_mean          | 1.86e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2285         |
|    time_elapsed         | 9972         |
|    total_timesteps      | 1169920      |
| train/                  |              |
|    approx_kl            | 0.0004828826 |
|    clip_fraction        | 0.00117      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.26        |
|    explained_variance   | 0.869        |
|    learning_rate        | 1e-06        |
|    loss                 | 109          |
|    n_updates            | 34580        |
|    policy_gradient_loss | -0.000662    |
|    value_loss           | 212          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.01e+03     |
|    ep_rew_mean          | 1.87e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2295         |
|    time_elapsed         | 10016        |
|    total_timesteps      | 1175040      |
| train/                  |              |
|    approx_kl            | 0.0011750832 |
|    clip_fraction        | 0.00723      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.334       |
|    explained_variance   | 0.366        |
|    learning_rate        | 1e-06        |
|    loss                 | 160          |
|    n_updates            | 34680        |
|    policy_gradient_loss | 0.00314      |
|    value_loss           | 472          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.02e+03     |
|    ep_rew_mean          | 1.88e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2305         |
|    time_elapsed         | 10060        |
|    total_timesteps      | 1180160      |
| train/                  |              |
|    approx_kl            | 0.0010916241 |
|    clip_fraction        | 0.0305       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.347       |
|    explained_variance   | 0.583        |
|    learning_rate        | 1e-06        |
|    loss                 | 218          |
|    n_updates            | 34780        |
|    policy_gradient_loss | -0.00109     |
|    value_loss           | 664          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.01e+03     |
|    ep_rew_mean          | 1.88e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2315         |
|    time_elapsed         | 10103        |
|    total_timesteps      | 1185280      |
| train/                  |              |
|    approx_kl            | 0.0035296236 |
|    clip_fraction        | 0.0184       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.335       |
|    explained_variance   | 0.893        |
|    learning_rate        | 1e-06        |
|    loss                 | 44           |
|    n_updates            | 34880        |
|    policy_gradient_loss | -0.00117     |
|    value_loss           | 95.8         |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.01e+03      |
|    ep_rew_mean          | 1.89e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 2325          |
|    time_elapsed         | 10147         |
|    total_timesteps      | 1190400       |
| train/                  |               |
|    approx_kl            | 0.00022751256 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.274        |
|    explained_variance   | 0.825         |
|    learning_rate        | 1e-06         |
|    loss                 | 75.1          |
|    n_updates            | 34980         |
|    policy_gradient_loss | -0.000775     |
|    value_loss           | 155           |
-------------------------------------------
-----------------------------------------
| rollout/                |       

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.02e+03     |
|    ep_rew_mean          | 1.89e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2335         |
|    time_elapsed         | 10191        |
|    total_timesteps      | 1195520      |
| train/                  |              |
|    approx_kl            | 0.0017346682 |
|    clip_fraction        | 0.00937      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.321       |
|    explained_variance   | 0.831        |
|    learning_rate        | 1e-06        |
|    loss                 | 68.5         |
|    n_updates            | 35080        |
|    policy_gradient_loss | 0.00267      |
|    value_loss           | 383          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.01e+03     |
|    ep_rew_mean          | 1.89e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2345         |
|    time_elapsed         | 10235        |
|    total_timesteps      | 1200640      |
| train/                  |              |
|    approx_kl            | 0.0018553342 |
|    clip_fraction        | 0.00137      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.293       |
|    explained_variance   | 0.936        |
|    learning_rate        | 1e-06        |
|    loss                 | 54.7         |
|    n_updates            | 35180        |
|    policy_gradient_loss | -0.000534    |
|    value_loss           | 95.3         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.02e+03     |
|    ep_rew_mean          | 1.92e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2355         |
|    time_elapsed         | 10278        |
|    total_timesteps      | 1205760      |
| train/                  |              |
|    approx_kl            | 0.0036658053 |
|    clip_fraction        | 0.0209       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.317       |
|    explained_variance   | 0.874        |
|    learning_rate        | 1e-06        |
|    loss                 | 40.2         |
|    n_updates            | 35280        |
|    policy_gradient_loss | 0.000274     |
|    value_loss           | 121          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.04e+03     |
|    ep_rew_mean          | 1.94e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2365         |
|    time_elapsed         | 10322        |
|    total_timesteps      | 1210880      |
| train/                  |              |
|    approx_kl            | 0.0013900844 |
|    clip_fraction        | 0.00391      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.423       |
|    explained_variance   | 0.95         |
|    learning_rate        | 1e-06        |
|    loss                 | 75.4         |
|    n_updates            | 35380        |
|    policy_gradient_loss | -0.00188     |
|    value_loss           | 185          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.04e+03      |
|    ep_rew_mean          | 1.95e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 2375          |
|    time_elapsed         | 10365         |
|    total_timesteps      | 1216000       |
| train/                  |               |
|    approx_kl            | 0.00036753097 |
|    clip_fraction        | 0.00176       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.226        |
|    explained_variance   | 0.839         |
|    learning_rate        | 1e-06         |
|    loss                 | 42.4          |
|    n_updates            | 35480         |
|    policy_gradient_loss | -0.00304      |
|    value_loss           | 162           |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.06e+03      |
|    ep_rew_mean          | 1.99e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 2385          |
|    time_elapsed         | 10409         |
|    total_timesteps      | 1221120       |
| train/                  |               |
|    approx_kl            | 0.00048065942 |
|    clip_fraction        | 0.000195      |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.338        |
|    explained_variance   | 0.862         |
|    learning_rate        | 1e-06         |
|    loss                 | 60.8          |
|    n_updates            | 35580         |
|    policy_gradient_loss | -0.000381     |
|    value_loss           | 130           |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.07e+03     |
|    ep_rew_mean          | 2e+03        |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2395         |
|    time_elapsed         | 10453        |
|    total_timesteps      | 1226240      |
| train/                  |              |
|    approx_kl            | 0.0018055897 |
|    clip_fraction        | 0.0187       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.378       |
|    explained_variance   | 0.945        |
|    learning_rate        | 1e-06        |
|    loss                 | 45.3         |
|    n_updates            | 35680        |
|    policy_gradient_loss | -0.00315     |
|    value_loss           | 129          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.08e+03     |
|    ep_rew_mean          | 2.01e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2405         |
|    time_elapsed         | 10497        |
|    total_timesteps      | 1231360      |
| train/                  |              |
|    approx_kl            | 0.0003240509 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.534       |
|    explained_variance   | 0.948        |
|    learning_rate        | 1e-06        |
|    loss                 | 112          |
|    n_updates            | 35780        |
|    policy_gradient_loss | 0.00116      |
|    value_loss           | 247          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.07e+03     |
|    ep_rew_mean          | 2.02e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2415         |
|    time_elapsed         | 10542        |
|    total_timesteps      | 1236480      |
| train/                  |              |
|    approx_kl            | 0.0013802841 |
|    clip_fraction        | 0.0186       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.525       |
|    explained_variance   | 0.983        |
|    learning_rate        | 1e-06        |
|    loss                 | 64.7         |
|    n_updates            | 35880        |
|    policy_gradient_loss | -0.00247     |
|    value_loss           | 98.5         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.08e+03     |
|    ep_rew_mean          | 2.03e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2425         |
|    time_elapsed         | 10586        |
|    total_timesteps      | 1241600      |
| train/                  |              |
|    approx_kl            | 0.0020784163 |
|    clip_fraction        | 0.0145       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.442       |
|    explained_variance   | 0.758        |
|    learning_rate        | 1e-06        |
|    loss                 | 39.4         |
|    n_updates            | 35980        |
|    policy_gradient_loss | -0.000255    |
|    value_loss           | 270          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.08e+03      |
|    ep_rew_mean          | 2.03e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 2435          |
|    time_elapsed         | 10629         |
|    total_timesteps      | 1246720       |
| train/                  |               |
|    approx_kl            | 0.00043860613 |
|    clip_fraction        | 0.00234       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.199        |
|    explained_variance   | 0.796         |
|    learning_rate        | 1e-06         |
|    loss                 | 30.1          |
|    n_updates            | 36080         |
|    policy_gradient_loss | 0.000436      |
|    value_loss           | 114           |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.09e+03     |
|    ep_rew_mean          | 2.04e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2444         |
|    time_elapsed         | 10669        |
|    total_timesteps      | 1251328      |
| train/                  |              |
|    approx_kl            | 0.0022559115 |
|    clip_fraction        | 0.017        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.523       |
|    explained_variance   | 0.865        |
|    learning_rate        | 1e-06        |
|    loss                 | 270          |
|    n_updates            | 36170        |
|    policy_gradient_loss | 0.00132      |
|    value_loss           | 557          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.1e+03       |
|    ep_rew_mean          | 2.05e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 2454          |
|    time_elapsed         | 10712         |
|    total_timesteps      | 1256448       |
| train/                  |               |
|    approx_kl            | 0.00092759635 |
|    clip_fraction        | 0.00215       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.242        |
|    explained_variance   | 0.49          |
|    learning_rate        | 1e-06         |
|    loss                 | 230           |
|    n_updates            | 36270         |
|    policy_gradient_loss | 0.00224       |
|    value_loss           | 838           |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.1e+03      |
|    ep_rew_mean          | 2.06e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2464         |
|    time_elapsed         | 10756        |
|    total_timesteps      | 1261568      |
| train/                  |              |
|    approx_kl            | 0.0018954884 |
|    clip_fraction        | 0.0314       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.257       |
|    explained_variance   | 0.845        |
|    learning_rate        | 1e-06        |
|    loss                 | 31.6         |
|    n_updates            | 36370        |
|    policy_gradient_loss | -0.00237     |
|    value_loss           | 198          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.08e+03    |
|    ep_rew_mean          | 2.03e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 2474        |
|    time_elapsed         | 10799       |
|    total_timesteps      | 1266688     |
| train/                  |             |
|    approx_kl            | 0.006634164 |
|    clip_fraction        | 0.0801      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.461      |
|    explained_variance   | 0.505       |
|    learning_rate        | 1e-06       |
|    loss                 | 208         |
|    n_updates            | 36470       |
|    policy_gradient_loss | -0.00567    |
|    value_loss           | 784         |
-----------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.09e+03     |
|    ep_rew_mean          | 2.04e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2483         |
|    time_elapsed         | 10839        |
|    total_timesteps      | 1271296      |
| train/                  |              |
|    approx_kl            | 0.0060276985 |
|    clip_fraction        | 0.0354       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.489       |
|    explained_variance   | 0.635        |
|    learning_rate        | 1e-06        |
|    loss                 | 29.6         |
|    n_updates            | 36560        |
|    policy_gradient_loss | 0.00535      |
|    value_loss           | 155          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.09e+03    |
|    ep_rew_mean          | 2.03e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 2493        |
|    time_elapsed         | 10882       |
|    total_timesteps      | 1276416     |
| train/                  |             |
|    approx_kl            | 0.002349001 |
|    clip_fraction        | 0.016       |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.458      |
|    explained_variance   | 0.878       |
|    learning_rate        | 1e-06       |
|    loss                 | 44          |
|    n_updates            | 36660       |
|    policy_gradient_loss | -0.00258    |
|    value_loss           | 122         |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.09e+

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.09e+03    |
|    ep_rew_mean          | 2.04e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 2503        |
|    time_elapsed         | 10926       |
|    total_timesteps      | 1281536     |
| train/                  |             |
|    approx_kl            | 0.003194089 |
|    clip_fraction        | 0.0248      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.298      |
|    explained_variance   | 0.714       |
|    learning_rate        | 1e-06       |
|    loss                 | 35.1        |
|    n_updates            | 36760       |
|    policy_gradient_loss | -0.00223    |
|    value_loss           | 125         |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.09

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.09e+03     |
|    ep_rew_mean          | 2.03e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2513         |
|    time_elapsed         | 10970        |
|    total_timesteps      | 1286656      |
| train/                  |              |
|    approx_kl            | 0.0019867015 |
|    clip_fraction        | 0.0125       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.213       |
|    explained_variance   | 0.816        |
|    learning_rate        | 1e-06        |
|    loss                 | 61.2         |
|    n_updates            | 36860        |
|    policy_gradient_loss | -0.00254     |
|    value_loss           | 151          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.09e+03     |
|    ep_rew_mean          | 2.03e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2523         |
|    time_elapsed         | 11014        |
|    total_timesteps      | 1291776      |
| train/                  |              |
|    approx_kl            | 0.0008036508 |
|    clip_fraction        | 0.0127       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.22        |
|    explained_variance   | 0.668        |
|    learning_rate        | 1e-06        |
|    loss                 | 239          |
|    n_updates            | 36960        |
|    policy_gradient_loss | -0.00194     |
|    value_loss           | 686          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.09e+03      |
|    ep_rew_mean          | 2.02e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 2533          |
|    time_elapsed         | 11057         |
|    total_timesteps      | 1296896       |
| train/                  |               |
|    approx_kl            | 0.00096359977 |
|    clip_fraction        | 0.0154        |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.313        |
|    explained_variance   | 0.885         |
|    learning_rate        | 1e-06         |
|    loss                 | 55.6          |
|    n_updates            | 37060         |
|    policy_gradient_loss | -0.00142      |
|    value_loss           | 139           |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.09e+03      |
|    ep_rew_mean          | 2.02e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 2543          |
|    time_elapsed         | 11102         |
|    total_timesteps      | 1302016       |
| train/                  |               |
|    approx_kl            | 0.00029957446 |
|    clip_fraction        | 0.00254       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.136        |
|    explained_variance   | 0.853         |
|    learning_rate        | 1e-06         |
|    loss                 | 19.8          |
|    n_updates            | 37160         |
|    policy_gradient_loss | -0.00244      |
|    value_loss           | 112           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.07e+03     |
|    ep_rew_mean          | 1.99e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2553         |
|    time_elapsed         | 11145        |
|    total_timesteps      | 1307136      |
| train/                  |              |
|    approx_kl            | 0.0013863088 |
|    clip_fraction        | 0.0041       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.296       |
|    explained_variance   | 0.602        |
|    learning_rate        | 1e-06        |
|    loss                 | 42.1         |
|    n_updates            | 37260        |
|    policy_gradient_loss | 0.00328      |
|    value_loss           | 122          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.06e+03      |
|    ep_rew_mean          | 1.96e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 2563          |
|    time_elapsed         | 11189         |
|    total_timesteps      | 1312256       |
| train/                  |               |
|    approx_kl            | 0.00018334226 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.155        |
|    explained_variance   | 0.795         |
|    learning_rate        | 1e-06         |
|    loss                 | 301           |
|    n_updates            | 37360         |
|    policy_gradient_loss | -0.000566     |
|    value_loss           | 448           |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.06e+03      |
|    ep_rew_mean          | 1.96e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 2572          |
|    time_elapsed         | 11228         |
|    total_timesteps      | 1316864       |
| train/                  |               |
|    approx_kl            | 0.00093215203 |
|    clip_fraction        | 0.00742       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.25         |
|    explained_variance   | 0.593         |
|    learning_rate        | 1e-06         |
|    loss                 | 67.8          |
|    n_updates            | 37450         |
|    policy_gradient_loss | 0.00052       |
|    value_loss           | 311           |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.03e+03     |
|    ep_rew_mean          | 1.91e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2582         |
|    time_elapsed         | 11272        |
|    total_timesteps      | 1321984      |
| train/                  |              |
|    approx_kl            | 0.0071206964 |
|    clip_fraction        | 0.0367       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.335       |
|    explained_variance   | 0.502        |
|    learning_rate        | 1e-06        |
|    loss                 | 686          |
|    n_updates            | 37550        |
|    policy_gradient_loss | -0.00445     |
|    value_loss           | 613          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.03e+03     |
|    ep_rew_mean          | 1.92e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2592         |
|    time_elapsed         | 11315        |
|    total_timesteps      | 1327104      |
| train/                  |              |
|    approx_kl            | 0.0021849223 |
|    clip_fraction        | 0.00586      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.331       |
|    explained_variance   | 0.182        |
|    learning_rate        | 1e-06        |
|    loss                 | 366          |
|    n_updates            | 37650        |
|    policy_gradient_loss | -0.00158     |
|    value_loss           | 1.01e+03     |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.03e+03     |
|    ep_rew_mean          | 1.91e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2602         |
|    time_elapsed         | 11360        |
|    total_timesteps      | 1332224      |
| train/                  |              |
|    approx_kl            | 0.0016844128 |
|    clip_fraction        | 0.0121       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.386       |
|    explained_variance   | 0.753        |
|    learning_rate        | 1e-06        |
|    loss                 | 61.5         |
|    n_updates            | 37750        |
|    policy_gradient_loss | -0.00154     |
|    value_loss           | 159          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.04e+03     |
|    ep_rew_mean          | 1.93e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2612         |
|    time_elapsed         | 11403        |
|    total_timesteps      | 1337344      |
| train/                  |              |
|    approx_kl            | 0.0013311454 |
|    clip_fraction        | 0.00176      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.495       |
|    explained_variance   | 0.959        |
|    learning_rate        | 1e-06        |
|    loss                 | 43.6         |
|    n_updates            | 37850        |
|    policy_gradient_loss | -0.00107     |
|    value_loss           | 143          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.04e+03     |
|    ep_rew_mean          | 1.94e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2622         |
|    time_elapsed         | 11447        |
|    total_timesteps      | 1342464      |
| train/                  |              |
|    approx_kl            | 0.0025690016 |
|    clip_fraction        | 0.0152       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.551       |
|    explained_variance   | 0.949        |
|    learning_rate        | 1e-06        |
|    loss                 | 41.6         |
|    n_updates            | 37950        |
|    policy_gradient_loss | -0.0016      |
|    value_loss           | 212          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.04e+03    |
|    ep_rew_mean          | 1.94e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 2632        |
|    time_elapsed         | 11490       |
|    total_timesteps      | 1347584     |
| train/                  |             |
|    approx_kl            | 0.004060209 |
|    clip_fraction        | 0.0437      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.345      |
|    explained_variance   | 0.767       |
|    learning_rate        | 1e-06       |
|    loss                 | 22.6        |
|    n_updates            | 38050       |
|    policy_gradient_loss | -0.00546    |
|    value_loss           | 76          |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.04

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.04e+03    |
|    ep_rew_mean          | 1.95e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 2642        |
|    time_elapsed         | 11534       |
|    total_timesteps      | 1352704     |
| train/                  |             |
|    approx_kl            | 0.001224932 |
|    clip_fraction        | 0.00723     |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.295      |
|    explained_variance   | 0.905       |
|    learning_rate        | 1e-06       |
|    loss                 | 57.6        |
|    n_updates            | 38150       |
|    policy_gradient_loss | -0.00165    |
|    value_loss           | 118         |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.04e+

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.02e+03      |
|    ep_rew_mean          | 1.93e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 2652          |
|    time_elapsed         | 11578         |
|    total_timesteps      | 1357824       |
| train/                  |               |
|    approx_kl            | 8.8326284e-05 |
|    clip_fraction        | 0.000195      |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.273        |
|    explained_variance   | 0.708         |
|    learning_rate        | 1e-06         |
|    loss                 | 333           |
|    n_updates            | 38250         |
|    policy_gradient_loss | -0.000407     |
|    value_loss           | 516           |
-------------------------------------------
-----------------------------------------
| rollout/                |       

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.02e+03     |
|    ep_rew_mean          | 1.93e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2662         |
|    time_elapsed         | 11622        |
|    total_timesteps      | 1362944      |
| train/                  |              |
|    approx_kl            | 0.0023940974 |
|    clip_fraction        | 0.0109       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.371       |
|    explained_variance   | 0.911        |
|    learning_rate        | 1e-06        |
|    loss                 | 32.3         |
|    n_updates            | 38350        |
|    policy_gradient_loss | -0.000588    |
|    value_loss           | 100          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.03e+03     |
|    ep_rew_mean          | 1.94e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2672         |
|    time_elapsed         | 11665        |
|    total_timesteps      | 1368064      |
| train/                  |              |
|    approx_kl            | 0.0013191405 |
|    clip_fraction        | 0.00781      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.336       |
|    explained_variance   | 0.853        |
|    learning_rate        | 1e-06        |
|    loss                 | 31.7         |
|    n_updates            | 38450        |
|    policy_gradient_loss | -0.00216     |
|    value_loss           | 101          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.04e+03     |
|    ep_rew_mean          | 1.95e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2682         |
|    time_elapsed         | 11720        |
|    total_timesteps      | 1373184      |
| train/                  |              |
|    approx_kl            | 0.0021791363 |
|    clip_fraction        | 0.027        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.189       |
|    explained_variance   | 0.581        |
|    learning_rate        | 1e-06        |
|    loss                 | 331          |
|    n_updates            | 38550        |
|    policy_gradient_loss | 0.00354      |
|    value_loss           | 1.02e+03     |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.03e+03      |
|    ep_rew_mean          | 1.95e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 2692          |
|    time_elapsed         | 11763         |
|    total_timesteps      | 1378304       |
| train/                  |               |
|    approx_kl            | 0.00013541232 |
|    clip_fraction        | 0.00117       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.3          |
|    explained_variance   | 0.633         |
|    learning_rate        | 1e-06         |
|    loss                 | 457           |
|    n_updates            | 38650         |
|    policy_gradient_loss | -0.000982     |
|    value_loss           | 579           |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.03e+03     |
|    ep_rew_mean          | 1.94e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2702         |
|    time_elapsed         | 11808        |
|    total_timesteps      | 1383424      |
| train/                  |              |
|    approx_kl            | 0.0021065187 |
|    clip_fraction        | 0.00352      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.652       |
|    explained_variance   | 0.937        |
|    learning_rate        | 1e-06        |
|    loss                 | 43.2         |
|    n_updates            | 38750        |
|    policy_gradient_loss | -0.00173     |
|    value_loss           | 245          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.04e+03     |
|    ep_rew_mean          | 1.95e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2712         |
|    time_elapsed         | 11851        |
|    total_timesteps      | 1388544      |
| train/                  |              |
|    approx_kl            | 0.0017286221 |
|    clip_fraction        | 0.0121       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.274       |
|    explained_variance   | 0.865        |
|    learning_rate        | 1e-06        |
|    loss                 | 82.2         |
|    n_updates            | 38850        |
|    policy_gradient_loss | -0.0019      |
|    value_loss           | 179          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.04e+03      |
|    ep_rew_mean          | 1.95e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 2721          |
|    time_elapsed         | 11891         |
|    total_timesteps      | 1393152       |
| train/                  |               |
|    approx_kl            | 0.00064465625 |
|    clip_fraction        | 0.000977      |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.177        |
|    explained_variance   | 0.943         |
|    learning_rate        | 1e-06         |
|    loss                 | 37.9          |
|    n_updates            | 38940         |
|    policy_gradient_loss | -0.000559     |
|    value_loss           | 125           |
-------------------------------------------
-----------------------------------------
| rollout/                |       

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.03e+03    |
|    ep_rew_mean          | 1.94e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 2731        |
|    time_elapsed         | 11934       |
|    total_timesteps      | 1398272     |
| train/                  |             |
|    approx_kl            | 0.003845484 |
|    clip_fraction        | 0.0139      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.511      |
|    explained_variance   | 0.718       |
|    learning_rate        | 1e-06       |
|    loss                 | 251         |
|    n_updates            | 39040       |
|    policy_gradient_loss | -0.00375    |
|    value_loss           | 883         |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.03e+

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.04e+03     |
|    ep_rew_mean          | 1.96e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2741         |
|    time_elapsed         | 11978        |
|    total_timesteps      | 1403392      |
| train/                  |              |
|    approx_kl            | 0.0004932068 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.219       |
|    explained_variance   | 0.835        |
|    learning_rate        | 1e-06        |
|    loss                 | 52.1         |
|    n_updates            | 39140        |
|    policy_gradient_loss | 0.000414     |
|    value_loss           | 193          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.05e+03    |
|    ep_rew_mean          | 1.99e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 2751        |
|    time_elapsed         | 12021       |
|    total_timesteps      | 1408512     |
| train/                  |             |
|    approx_kl            | 0.001445764 |
|    clip_fraction        | 0.0117      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.429      |
|    explained_variance   | 0.8         |
|    learning_rate        | 1e-06       |
|    loss                 | 24.4        |
|    n_updates            | 39240       |
|    policy_gradient_loss | 0.000339    |
|    value_loss           | 84.9        |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.05

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.06e+03      |
|    ep_rew_mean          | 2e+03         |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 2761          |
|    time_elapsed         | 12066         |
|    total_timesteps      | 1413632       |
| train/                  |               |
|    approx_kl            | 0.00025689905 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.391        |
|    explained_variance   | 0.908         |
|    learning_rate        | 1e-06         |
|    loss                 | 27            |
|    n_updates            | 39340         |
|    policy_gradient_loss | 6.6e-06       |
|    value_loss           | 131           |
-------------------------------------------
------------------------------------------
| rollout/                |      

----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.07e+03   |
|    ep_rew_mean          | 2e+03      |
| time/                   |            |
|    fps                  | 117        |
|    iterations           | 2771       |
|    time_elapsed         | 12110      |
|    total_timesteps      | 1418752    |
| train/                  |            |
|    approx_kl            | 0.00514765 |
|    clip_fraction        | 0.0463     |
|    clip_range           | 0.2        |
|    entropy_loss         | -0.386     |
|    explained_variance   | 0.877      |
|    learning_rate        | 1e-06      |
|    loss                 | 57         |
|    n_updates            | 39440      |
|    policy_gradient_loss | -0.000456  |
|    value_loss           | 121        |
----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.07e+03     |
|    ep_re

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.07e+03      |
|    ep_rew_mean          | 1.99e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 2781          |
|    time_elapsed         | 12153         |
|    total_timesteps      | 1423872       |
| train/                  |               |
|    approx_kl            | 0.00073056633 |
|    clip_fraction        | 0.00898       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.22         |
|    explained_variance   | 0.856         |
|    learning_rate        | 1e-06         |
|    loss                 | 72.7          |
|    n_updates            | 39540         |
|    policy_gradient_loss | -2.06e-05     |
|    value_loss           | 181           |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.08e+03     |
|    ep_rew_mean          | 2.02e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2791         |
|    time_elapsed         | 12197        |
|    total_timesteps      | 1428992      |
| train/                  |              |
|    approx_kl            | 0.0049013607 |
|    clip_fraction        | 0.04         |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.336       |
|    explained_variance   | 0.835        |
|    learning_rate        | 1e-06        |
|    loss                 | 78.7         |
|    n_updates            | 39640        |
|    policy_gradient_loss | -0.00561     |
|    value_loss           | 263          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.1e+03       |
|    ep_rew_mean          | 2.05e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 2801          |
|    time_elapsed         | 12240         |
|    total_timesteps      | 1434112       |
| train/                  |               |
|    approx_kl            | 0.00047390803 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.267        |
|    explained_variance   | 0.618         |
|    learning_rate        | 1e-06         |
|    loss                 | 250           |
|    n_updates            | 39740         |
|    policy_gradient_loss | 0.000749      |
|    value_loss           | 548           |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.1e+03       |
|    ep_rew_mean          | 2.04e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 2811          |
|    time_elapsed         | 12285         |
|    total_timesteps      | 1439232       |
| train/                  |               |
|    approx_kl            | 0.00025755877 |
|    clip_fraction        | 0.00273       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.18         |
|    explained_variance   | 0.946         |
|    learning_rate        | 1e-06         |
|    loss                 | 30.3          |
|    n_updates            | 39840         |
|    policy_gradient_loss | -0.000176     |
|    value_loss           | 74.4          |
-------------------------------------------
-----------------------------------------
| rollout/                |       

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.1e+03      |
|    ep_rew_mean          | 2.04e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2821         |
|    time_elapsed         | 12328        |
|    total_timesteps      | 1444352      |
| train/                  |              |
|    approx_kl            | 0.0021583922 |
|    clip_fraction        | 0.0129       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.241       |
|    explained_variance   | 0.86         |
|    learning_rate        | 1e-06        |
|    loss                 | 41.7         |
|    n_updates            | 39940        |
|    policy_gradient_loss | 3.08e-05     |
|    value_loss           | 107          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.09e+03    |
|    ep_rew_mean          | 2.01e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 2831        |
|    time_elapsed         | 12372       |
|    total_timesteps      | 1449472     |
| train/                  |             |
|    approx_kl            | 0.008294082 |
|    clip_fraction        | 0.0561      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.383      |
|    explained_variance   | 0.735       |
|    learning_rate        | 1e-06       |
|    loss                 | 39.3        |
|    n_updates            | 40040       |
|    policy_gradient_loss | 0.00679     |
|    value_loss           | 141         |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.09e+

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.09e+03     |
|    ep_rew_mean          | 2.01e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2841         |
|    time_elapsed         | 12415        |
|    total_timesteps      | 1454592      |
| train/                  |              |
|    approx_kl            | 0.0023835078 |
|    clip_fraction        | 0.0191       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.39        |
|    explained_variance   | 0.794        |
|    learning_rate        | 1e-06        |
|    loss                 | 39.4         |
|    n_updates            | 40140        |
|    policy_gradient_loss | -0.00087     |
|    value_loss           | 128          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.09e+03     |
|    ep_rew_mean          | 2.01e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2851         |
|    time_elapsed         | 12459        |
|    total_timesteps      | 1459712      |
| train/                  |              |
|    approx_kl            | 0.0069015985 |
|    clip_fraction        | 0.0713       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.523       |
|    explained_variance   | 0.954        |
|    learning_rate        | 1e-06        |
|    loss                 | 63.7         |
|    n_updates            | 40240        |
|    policy_gradient_loss | -0.00712     |
|    value_loss           | 197          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.1e+03      |
|    ep_rew_mean          | 2.01e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2861         |
|    time_elapsed         | 12503        |
|    total_timesteps      | 1464832      |
| train/                  |              |
|    approx_kl            | 0.0024598266 |
|    clip_fraction        | 0.0328       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.422       |
|    explained_variance   | 0.758        |
|    learning_rate        | 1e-06        |
|    loss                 | 40.9         |
|    n_updates            | 40340        |
|    policy_gradient_loss | -0.00097     |
|    value_loss           | 89.2         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.08e+03      |
|    ep_rew_mean          | 1.98e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 2871          |
|    time_elapsed         | 12547         |
|    total_timesteps      | 1469952       |
| train/                  |               |
|    approx_kl            | 0.00016477297 |
|    clip_fraction        | 0.000195      |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.235        |
|    explained_variance   | 0.625         |
|    learning_rate        | 1e-06         |
|    loss                 | 138           |
|    n_updates            | 40440         |
|    policy_gradient_loss | -0.000699     |
|    value_loss           | 653           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.07e+03      |
|    ep_rew_mean          | 1.97e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 2881          |
|    time_elapsed         | 12590         |
|    total_timesteps      | 1475072       |
| train/                  |               |
|    approx_kl            | 0.00039297924 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.297        |
|    explained_variance   | 0.903         |
|    learning_rate        | 1e-06         |
|    loss                 | 60.1          |
|    n_updates            | 40540         |
|    policy_gradient_loss | -0.000915     |
|    value_loss           | 156           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.07e+03     |
|    ep_rew_mean          | 1.98e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2891         |
|    time_elapsed         | 12635        |
|    total_timesteps      | 1480192      |
| train/                  |              |
|    approx_kl            | 0.0028428824 |
|    clip_fraction        | 0.0242       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.367       |
|    explained_variance   | 0.74         |
|    learning_rate        | 1e-06        |
|    loss                 | 127          |
|    n_updates            | 40640        |
|    policy_gradient_loss | -0.000296    |
|    value_loss           | 273          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.1e+03      |
|    ep_rew_mean          | 2.01e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2901         |
|    time_elapsed         | 12679        |
|    total_timesteps      | 1485312      |
| train/                  |              |
|    approx_kl            | 0.0016223253 |
|    clip_fraction        | 0.00859      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.238       |
|    explained_variance   | 0.663        |
|    learning_rate        | 1e-06        |
|    loss                 | 169          |
|    n_updates            | 40740        |
|    policy_gradient_loss | 0.00147      |
|    value_loss           | 468          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.11e+03     |
|    ep_rew_mean          | 2.03e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2911         |
|    time_elapsed         | 12723        |
|    total_timesteps      | 1490432      |
| train/                  |              |
|    approx_kl            | 0.0018397456 |
|    clip_fraction        | 0.0158       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.427       |
|    explained_variance   | 0.85         |
|    learning_rate        | 1e-06        |
|    loss                 | 40.9         |
|    n_updates            | 40840        |
|    policy_gradient_loss | -0.00163     |
|    value_loss           | 105          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.12e+03     |
|    ep_rew_mean          | 2.05e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2921         |
|    time_elapsed         | 12766        |
|    total_timesteps      | 1495552      |
| train/                  |              |
|    approx_kl            | 0.0015642224 |
|    clip_fraction        | 0.0217       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.41        |
|    explained_variance   | 0.904        |
|    learning_rate        | 1e-06        |
|    loss                 | 48.5         |
|    n_updates            | 40940        |
|    policy_gradient_loss | 0.000266     |
|    value_loss           | 249          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.1e+03       |
|    ep_rew_mean          | 2.02e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 2931          |
|    time_elapsed         | 12810         |
|    total_timesteps      | 1500672       |
| train/                  |               |
|    approx_kl            | 0.00027885544 |
|    clip_fraction        | 0.000977      |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.285        |
|    explained_variance   | 0.756         |
|    learning_rate        | 1e-06         |
|    loss                 | 139           |
|    n_updates            | 41040         |
|    policy_gradient_loss | -0.000927     |
|    value_loss           | 463           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.09e+03      |
|    ep_rew_mean          | 1.99e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 2941          |
|    time_elapsed         | 12854         |
|    total_timesteps      | 1505792       |
| train/                  |               |
|    approx_kl            | 0.00018841168 |
|    clip_fraction        | 0.000977      |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.189        |
|    explained_variance   | 0.826         |
|    learning_rate        | 1e-06         |
|    loss                 | 103           |
|    n_updates            | 41140         |
|    policy_gradient_loss | -0.000403     |
|    value_loss           | 486           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.07e+03      |
|    ep_rew_mean          | 1.96e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 2950          |
|    time_elapsed         | 12894         |
|    total_timesteps      | 1510400       |
| train/                  |               |
|    approx_kl            | 0.00075112015 |
|    clip_fraction        | 0.00469       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.444        |
|    explained_variance   | 0.816         |
|    learning_rate        | 1e-06         |
|    loss                 | 45.3          |
|    n_updates            | 41230         |
|    policy_gradient_loss | -2.68e-05     |
|    value_loss           | 110           |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.07e+03     |
|    ep_rew_mean          | 1.96e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2960         |
|    time_elapsed         | 12937        |
|    total_timesteps      | 1515520      |
| train/                  |              |
|    approx_kl            | 0.0016818632 |
|    clip_fraction        | 0.00273      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.629       |
|    explained_variance   | 0.935        |
|    learning_rate        | 1e-06        |
|    loss                 | 72.6         |
|    n_updates            | 41330        |
|    policy_gradient_loss | -0.000554    |
|    value_loss           | 240          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.06e+03    |
|    ep_rew_mean          | 1.95e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 2970        |
|    time_elapsed         | 12981       |
|    total_timesteps      | 1520640     |
| train/                  |             |
|    approx_kl            | 0.000504239 |
|    clip_fraction        | 0.00195     |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.168      |
|    explained_variance   | 0.849       |
|    learning_rate        | 1e-06       |
|    loss                 | 89.2        |
|    n_updates            | 41430       |
|    policy_gradient_loss | -3.03e-05   |
|    value_loss           | 257         |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.06

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.05e+03     |
|    ep_rew_mean          | 1.93e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2980         |
|    time_elapsed         | 13024        |
|    total_timesteps      | 1525760      |
| train/                  |              |
|    approx_kl            | 0.0016451516 |
|    clip_fraction        | 0.00918      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.255       |
|    explained_variance   | 0.697        |
|    learning_rate        | 1e-06        |
|    loss                 | 34.9         |
|    n_updates            | 41530        |
|    policy_gradient_loss | -0.00326     |
|    value_loss           | 182          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.06e+03     |
|    ep_rew_mean          | 1.95e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 2990         |
|    time_elapsed         | 13068        |
|    total_timesteps      | 1530880      |
| train/                  |              |
|    approx_kl            | 0.0022498933 |
|    clip_fraction        | 0.016        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.801       |
|    explained_variance   | 0.877        |
|    learning_rate        | 1e-06        |
|    loss                 | 174          |
|    n_updates            | 41630        |
|    policy_gradient_loss | -0.000565    |
|    value_loss           | 468          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.05e+03     |
|    ep_rew_mean          | 1.95e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3000         |
|    time_elapsed         | 13111        |
|    total_timesteps      | 1536000      |
| train/                  |              |
|    approx_kl            | 0.0004557653 |
|    clip_fraction        | 0.000977     |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.244       |
|    explained_variance   | 0.921        |
|    learning_rate        | 1e-06        |
|    loss                 | 33.9         |
|    n_updates            | 41730        |
|    policy_gradient_loss | -0.000581    |
|    value_loss           | 91.7         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.05e+03     |
|    ep_rew_mean          | 1.94e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3010         |
|    time_elapsed         | 13156        |
|    total_timesteps      | 1541120      |
| train/                  |              |
|    approx_kl            | 0.0017393623 |
|    clip_fraction        | 0.00625      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.747       |
|    explained_variance   | 0.684        |
|    learning_rate        | 1e-06        |
|    loss                 | 189          |
|    n_updates            | 41830        |
|    policy_gradient_loss | 0.00264      |
|    value_loss           | 929          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.06e+03     |
|    ep_rew_mean          | 1.96e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3020         |
|    time_elapsed         | 13199        |
|    total_timesteps      | 1546240      |
| train/                  |              |
|    approx_kl            | 0.0012518371 |
|    clip_fraction        | 0.0229       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.405       |
|    explained_variance   | 0.854        |
|    learning_rate        | 1e-06        |
|    loss                 | 168          |
|    n_updates            | 41930        |
|    policy_gradient_loss | 0.00136      |
|    value_loss           | 385          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.06e+03     |
|    ep_rew_mean          | 1.95e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3030         |
|    time_elapsed         | 13243        |
|    total_timesteps      | 1551360      |
| train/                  |              |
|    approx_kl            | 0.0017622672 |
|    clip_fraction        | 0.00586      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.503       |
|    explained_variance   | 0.807        |
|    learning_rate        | 1e-06        |
|    loss                 | 237          |
|    n_updates            | 42030        |
|    policy_gradient_loss | -0.000643    |
|    value_loss           | 419          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.06e+03      |
|    ep_rew_mean          | 1.95e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 3040          |
|    time_elapsed         | 13286         |
|    total_timesteps      | 1556480       |
| train/                  |               |
|    approx_kl            | 0.00064274843 |
|    clip_fraction        | 0.00645       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.239        |
|    explained_variance   | 0.868         |
|    learning_rate        | 1e-06         |
|    loss                 | 53.5          |
|    n_updates            | 42130         |
|    policy_gradient_loss | -0.000104     |
|    value_loss           | 124           |
-------------------------------------------
-----------------------------------------
| rollout/                |       

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.04e+03     |
|    ep_rew_mean          | 1.93e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3050         |
|    time_elapsed         | 13330        |
|    total_timesteps      | 1561600      |
| train/                  |              |
|    approx_kl            | 0.0010777141 |
|    clip_fraction        | 0.0217       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.251       |
|    explained_variance   | 0.636        |
|    learning_rate        | 1e-06        |
|    loss                 | 167          |
|    n_updates            | 42230        |
|    policy_gradient_loss | -0.00163     |
|    value_loss           | 486          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.04e+03    |
|    ep_rew_mean          | 1.92e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 3060        |
|    time_elapsed         | 13374       |
|    total_timesteps      | 1566720     |
| train/                  |             |
|    approx_kl            | 0.004363852 |
|    clip_fraction        | 0.0393      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.48       |
|    explained_variance   | 0.878       |
|    learning_rate        | 1e-06       |
|    loss                 | 153         |
|    n_updates            | 42330       |
|    policy_gradient_loss | -0.00261    |
|    value_loss           | 251         |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.04

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.04e+03     |
|    ep_rew_mean          | 1.93e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3070         |
|    time_elapsed         | 13418        |
|    total_timesteps      | 1571840      |
| train/                  |              |
|    approx_kl            | 0.0061951913 |
|    clip_fraction        | 0.0434       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.512       |
|    explained_variance   | 0.47         |
|    learning_rate        | 1e-06        |
|    loss                 | 289          |
|    n_updates            | 42430        |
|    policy_gradient_loss | 0.00182      |
|    value_loss           | 534          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.06e+03    |
|    ep_rew_mean          | 1.95e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 3080        |
|    time_elapsed         | 13461       |
|    total_timesteps      | 1576960     |
| train/                  |             |
|    approx_kl            | 0.005542862 |
|    clip_fraction        | 0.0223      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.386      |
|    explained_variance   | 0.839       |
|    learning_rate        | 1e-06       |
|    loss                 | 96.1        |
|    n_updates            | 42530       |
|    policy_gradient_loss | -0.00564    |
|    value_loss           | 230         |
-----------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.06e+03    |
|    ep_rew_mean          | 1.96e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 3090        |
|    time_elapsed         | 13505       |
|    total_timesteps      | 1582080     |
| train/                  |             |
|    approx_kl            | 0.004229419 |
|    clip_fraction        | 0.0377      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.328      |
|    explained_variance   | 0.921       |
|    learning_rate        | 1e-06       |
|    loss                 | 32          |
|    n_updates            | 42630       |
|    policy_gradient_loss | -0.00129    |
|    value_loss           | 74.8        |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.06

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.06e+03    |
|    ep_rew_mean          | 1.95e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 3100        |
|    time_elapsed         | 13549       |
|    total_timesteps      | 1587200     |
| train/                  |             |
|    approx_kl            | 0.001086723 |
|    clip_fraction        | 0.017       |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.272      |
|    explained_variance   | 0.851       |
|    learning_rate        | 1e-06       |
|    loss                 | 4.86        |
|    n_updates            | 42730       |
|    policy_gradient_loss | -0.000259   |
|    value_loss           | 32.9        |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.05

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.02e+03     |
|    ep_rew_mean          | 1.9e+03      |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3110         |
|    time_elapsed         | 13593        |
|    total_timesteps      | 1592320      |
| train/                  |              |
|    approx_kl            | 0.0014642125 |
|    clip_fraction        | 0.0129       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.344       |
|    explained_variance   | 0.752        |
|    learning_rate        | 1e-06        |
|    loss                 | 41.9         |
|    n_updates            | 42830        |
|    policy_gradient_loss | -0.000839    |
|    value_loss           | 128          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.01e+03     |
|    ep_rew_mean          | 1.88e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3120         |
|    time_elapsed         | 13636        |
|    total_timesteps      | 1597440      |
| train/                  |              |
|    approx_kl            | 0.0012454478 |
|    clip_fraction        | 0.0152       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.458       |
|    explained_variance   | 0.931        |
|    learning_rate        | 1e-06        |
|    loss                 | 194          |
|    n_updates            | 42930        |
|    policy_gradient_loss | -0.00291     |
|    value_loss           | 256          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.02e+03    |
|    ep_rew_mean          | 1.91e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 3130        |
|    time_elapsed         | 13681       |
|    total_timesteps      | 1602560     |
| train/                  |             |
|    approx_kl            | 0.002249391 |
|    clip_fraction        | 0.00781     |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.36       |
|    explained_variance   | 0.899       |
|    learning_rate        | 1e-06       |
|    loss                 | 64.6        |
|    n_updates            | 43030       |
|    policy_gradient_loss | -0.00121    |
|    value_loss           | 138         |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.02

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.02e+03      |
|    ep_rew_mean          | 1.92e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 3140          |
|    time_elapsed         | 13724         |
|    total_timesteps      | 1607680       |
| train/                  |               |
|    approx_kl            | 0.00085656054 |
|    clip_fraction        | 0.000391      |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.446        |
|    explained_variance   | 0.891         |
|    learning_rate        | 1e-06         |
|    loss                 | 64.8          |
|    n_updates            | 43130         |
|    policy_gradient_loss | 0.000104      |
|    value_loss           | 180           |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.03e+03      |
|    ep_rew_mean          | 1.93e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 3150          |
|    time_elapsed         | 13768         |
|    total_timesteps      | 1612800       |
| train/                  |               |
|    approx_kl            | 0.00095017545 |
|    clip_fraction        | 0.00391       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.29         |
|    explained_variance   | 0.758         |
|    learning_rate        | 1e-06         |
|    loss                 | 111           |
|    n_updates            | 43230         |
|    policy_gradient_loss | -0.00185      |
|    value_loss           | 357           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.03e+03     |
|    ep_rew_mean          | 1.93e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3160         |
|    time_elapsed         | 13811        |
|    total_timesteps      | 1617920      |
| train/                  |              |
|    approx_kl            | 0.0014037625 |
|    clip_fraction        | 0.0135       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.348       |
|    explained_variance   | 0.885        |
|    learning_rate        | 1e-06        |
|    loss                 | 124          |
|    n_updates            | 43330        |
|    policy_gradient_loss | -0.00288     |
|    value_loss           | 389          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.02e+03     |
|    ep_rew_mean          | 1.92e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3170         |
|    time_elapsed         | 13855        |
|    total_timesteps      | 1623040      |
| train/                  |              |
|    approx_kl            | 0.0002776268 |
|    clip_fraction        | 0.000586     |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.267       |
|    explained_variance   | 0.828        |
|    learning_rate        | 1e-06        |
|    loss                 | 80.7         |
|    n_updates            | 43430        |
|    policy_gradient_loss | -0.000631    |
|    value_loss           | 207          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.03e+03     |
|    ep_rew_mean          | 1.94e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3180         |
|    time_elapsed         | 13898        |
|    total_timesteps      | 1628160      |
| train/                  |              |
|    approx_kl            | 0.0046732784 |
|    clip_fraction        | 0.0174       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.554       |
|    explained_variance   | 0.967        |
|    learning_rate        | 1e-06        |
|    loss                 | 43.6         |
|    n_updates            | 43530        |
|    policy_gradient_loss | -0.00361     |
|    value_loss           | 133          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1e+03        |
|    ep_rew_mean          | 1.9e+03      |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3190         |
|    time_elapsed         | 13942        |
|    total_timesteps      | 1633280      |
| train/                  |              |
|    approx_kl            | 0.0015858201 |
|    clip_fraction        | 0.00488      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.546       |
|    explained_variance   | 0.954        |
|    learning_rate        | 1e-06        |
|    loss                 | 60.5         |
|    n_updates            | 43630        |
|    policy_gradient_loss | -0.00164     |
|    value_loss           | 178          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 996          |
|    ep_rew_mean          | 1.88e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3200         |
|    time_elapsed         | 13985        |
|    total_timesteps      | 1638400      |
| train/                  |              |
|    approx_kl            | 0.0006218002 |
|    clip_fraction        | 0.00176      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.227       |
|    explained_variance   | 0.368        |
|    learning_rate        | 1e-06        |
|    loss                 | 338          |
|    n_updates            | 43730        |
|    policy_gradient_loss | -0.000466    |
|    value_loss           | 701          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 999           |
|    ep_rew_mean          | 1.9e+03       |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 3210          |
|    time_elapsed         | 14030         |
|    total_timesteps      | 1643520       |
| train/                  |               |
|    approx_kl            | 0.00019344687 |
|    clip_fraction        | 0.000391      |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.218        |
|    explained_variance   | 0.858         |
|    learning_rate        | 1e-06         |
|    loss                 | 24.5          |
|    n_updates            | 43830         |
|    policy_gradient_loss | -0.0003       |
|    value_loss           | 72.2          |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 996         |
|    ep_rew_mean          | 1.9e+03     |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 3220        |
|    time_elapsed         | 14073       |
|    total_timesteps      | 1648640     |
| train/                  |             |
|    approx_kl            | 0.002986541 |
|    clip_fraction        | 0.0215      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.397      |
|    explained_variance   | 0.921       |
|    learning_rate        | 1e-06       |
|    loss                 | 91.7        |
|    n_updates            | 43930       |
|    policy_gradient_loss | -0.00156    |
|    value_loss           | 186         |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 996 

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 984           |
|    ep_rew_mean          | 1.88e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 3230          |
|    time_elapsed         | 14117         |
|    total_timesteps      | 1653760       |
| train/                  |               |
|    approx_kl            | 0.00094503607 |
|    clip_fraction        | 0.0268        |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.271        |
|    explained_variance   | 0.768         |
|    learning_rate        | 1e-06         |
|    loss                 | 197           |
|    n_updates            | 44030         |
|    policy_gradient_loss | -0.000588     |
|    value_loss           | 542           |
-------------------------------------------
-----------------------------------------
| rollout/                |       

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 985          |
|    ep_rew_mean          | 1.89e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3240         |
|    time_elapsed         | 14161        |
|    total_timesteps      | 1658880      |
| train/                  |              |
|    approx_kl            | 0.0014047949 |
|    clip_fraction        | 0.00625      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.178       |
|    explained_variance   | 0.858        |
|    learning_rate        | 1e-06        |
|    loss                 | 16.8         |
|    n_updates            | 44130        |
|    policy_gradient_loss | -0.0019      |
|    value_loss           | 56.4         |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 980          |
|    ep_rew_mean          | 1.88e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3250         |
|    time_elapsed         | 14204        |
|    total_timesteps      | 1664000      |
| train/                  |              |
|    approx_kl            | 0.0014788045 |
|    clip_fraction        | 0.00605      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.277       |
|    explained_variance   | 0.887        |
|    learning_rate        | 1e-06        |
|    loss                 | 99           |
|    n_updates            | 44230        |
|    policy_gradient_loss | 0.000714     |
|    value_loss           | 216          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 992         |
|    ep_rew_mean          | 1.91e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 3260        |
|    time_elapsed         | 14249       |
|    total_timesteps      | 1669120     |
| train/                  |             |
|    approx_kl            | 0.002196263 |
|    clip_fraction        | 0.00645     |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.546      |
|    explained_variance   | 0.893       |
|    learning_rate        | 1e-06       |
|    loss                 | 56.3        |
|    n_updates            | 44330       |
|    policy_gradient_loss | -0.0013     |
|    value_loss           | 259         |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 992 

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1e+03        |
|    ep_rew_mean          | 1.93e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3270         |
|    time_elapsed         | 14292        |
|    total_timesteps      | 1674240      |
| train/                  |              |
|    approx_kl            | 0.0018802622 |
|    clip_fraction        | 0.00742      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.355       |
|    explained_variance   | 0.912        |
|    learning_rate        | 1e-06        |
|    loss                 | 81.8         |
|    n_updates            | 44430        |
|    policy_gradient_loss | 0.000369     |
|    value_loss           | 201          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 980          |
|    ep_rew_mean          | 1.89e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3280         |
|    time_elapsed         | 14336        |
|    total_timesteps      | 1679360      |
| train/                  |              |
|    approx_kl            | 0.0024358137 |
|    clip_fraction        | 0.00859      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.728       |
|    explained_variance   | 0.918        |
|    learning_rate        | 1e-06        |
|    loss                 | 45           |
|    n_updates            | 44530        |
|    policy_gradient_loss | -0.00127     |
|    value_loss           | 223          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 984         |
|    ep_rew_mean          | 1.89e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 3290        |
|    time_elapsed         | 14379       |
|    total_timesteps      | 1684480     |
| train/                  |             |
|    approx_kl            | 0.007271663 |
|    clip_fraction        | 0.0498      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.565      |
|    explained_variance   | 0.942       |
|    learning_rate        | 1e-06       |
|    loss                 | 106         |
|    n_updates            | 44630       |
|    policy_gradient_loss | -0.00752    |
|    value_loss           | 220         |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 989   

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 982           |
|    ep_rew_mean          | 1.88e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 3300          |
|    time_elapsed         | 14423         |
|    total_timesteps      | 1689600       |
| train/                  |               |
|    approx_kl            | 0.00040378876 |
|    clip_fraction        | 0.00371       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.184        |
|    explained_variance   | 0.801         |
|    learning_rate        | 1e-06         |
|    loss                 | 32.5          |
|    n_updates            | 44730         |
|    policy_gradient_loss | -0.00176      |
|    value_loss           | 120           |
-------------------------------------------
----------------------------------------
| rollout/                |        

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 988          |
|    ep_rew_mean          | 1.9e+03      |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3310         |
|    time_elapsed         | 14467        |
|    total_timesteps      | 1694720      |
| train/                  |              |
|    approx_kl            | 0.0060200836 |
|    clip_fraction        | 0.049        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.596       |
|    explained_variance   | 0.913        |
|    learning_rate        | 1e-06        |
|    loss                 | 335          |
|    n_updates            | 44830        |
|    policy_gradient_loss | 0.000626     |
|    value_loss           | 307          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 990          |
|    ep_rew_mean          | 1.88e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3320         |
|    time_elapsed         | 14511        |
|    total_timesteps      | 1699840      |
| train/                  |              |
|    approx_kl            | 0.0036799056 |
|    clip_fraction        | 0.0244       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.499       |
|    explained_variance   | 0.898        |
|    learning_rate        | 1e-06        |
|    loss                 | 47.1         |
|    n_updates            | 44930        |
|    policy_gradient_loss | -0.00102     |
|    value_loss           | 110          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.02e+03     |
|    ep_rew_mean          | 1.92e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3330         |
|    time_elapsed         | 14554        |
|    total_timesteps      | 1704960      |
| train/                  |              |
|    approx_kl            | 0.0018346554 |
|    clip_fraction        | 0.0383       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.365       |
|    explained_variance   | 0.893        |
|    learning_rate        | 1e-06        |
|    loss                 | 79           |
|    n_updates            | 45030        |
|    policy_gradient_loss | -0.00042     |
|    value_loss           | 176          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.02e+03    |
|    ep_rew_mean          | 1.92e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 3340        |
|    time_elapsed         | 14598       |
|    total_timesteps      | 1710080     |
| train/                  |             |
|    approx_kl            | 0.008584578 |
|    clip_fraction        | 0.0596      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.692      |
|    explained_variance   | 0.976       |
|    learning_rate        | 1e-06       |
|    loss                 | 36          |
|    n_updates            | 45130       |
|    policy_gradient_loss | -0.00408    |
|    value_loss           | 87.3        |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.02e+

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.03e+03     |
|    ep_rew_mean          | 1.94e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3350         |
|    time_elapsed         | 14641        |
|    total_timesteps      | 1715200      |
| train/                  |              |
|    approx_kl            | 0.0005433175 |
|    clip_fraction        | 0.00254      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.463       |
|    explained_variance   | 0.902        |
|    learning_rate        | 1e-06        |
|    loss                 | 67.7         |
|    n_updates            | 45230        |
|    policy_gradient_loss | -0.000895    |
|    value_loss           | 172          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.03e+03     |
|    ep_rew_mean          | 1.95e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3360         |
|    time_elapsed         | 14685        |
|    total_timesteps      | 1720320      |
| train/                  |              |
|    approx_kl            | 0.0020018776 |
|    clip_fraction        | 0.00117      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.652       |
|    explained_variance   | 0.578        |
|    learning_rate        | 1e-06        |
|    loss                 | 209          |
|    n_updates            | 45330        |
|    policy_gradient_loss | -0.00118     |
|    value_loss           | 619          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.04e+03      |
|    ep_rew_mean          | 1.95e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 3370          |
|    time_elapsed         | 14729         |
|    total_timesteps      | 1725440       |
| train/                  |               |
|    approx_kl            | 0.00034794072 |
|    clip_fraction        | 0.0301        |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.706        |
|    explained_variance   | -2.9          |
|    learning_rate        | 1e-06         |
|    loss                 | 25.1          |
|    n_updates            | 45430         |
|    policy_gradient_loss | 0.00158       |
|    value_loss           | 150           |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.07e+03      |
|    ep_rew_mean          | 1.97e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 3380          |
|    time_elapsed         | 14773         |
|    total_timesteps      | 1730560       |
| train/                  |               |
|    approx_kl            | 0.00033190846 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.44         |
|    explained_variance   | 0.843         |
|    learning_rate        | 1e-06         |
|    loss                 | 92.3          |
|    n_updates            | 45530         |
|    policy_gradient_loss | 0.000311      |
|    value_loss           | 209           |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.09e+03     |
|    ep_rew_mean          | 1.97e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3390         |
|    time_elapsed         | 14816        |
|    total_timesteps      | 1735680      |
| train/                  |              |
|    approx_kl            | 0.0060532335 |
|    clip_fraction        | 0.0357       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.811       |
|    explained_variance   | 0.362        |
|    learning_rate        | 1e-06        |
|    loss                 | 276          |
|    n_updates            | 45630        |
|    policy_gradient_loss | -0.00372     |
|    value_loss           | 714          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.1e+03      |
|    ep_rew_mean          | 1.98e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3400         |
|    time_elapsed         | 14860        |
|    total_timesteps      | 1740800      |
| train/                  |              |
|    approx_kl            | 0.0018286993 |
|    clip_fraction        | 0.00137      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.699       |
|    explained_variance   | 0.878        |
|    learning_rate        | 1e-06        |
|    loss                 | 71.5         |
|    n_updates            | 45730        |
|    policy_gradient_loss | -0.000273    |
|    value_loss           | 174          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.12e+03     |
|    ep_rew_mean          | 2e+03        |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3410         |
|    time_elapsed         | 14904        |
|    total_timesteps      | 1745920      |
| train/                  |              |
|    approx_kl            | 0.0067352597 |
|    clip_fraction        | 0.0215       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.873       |
|    explained_variance   | 0.751        |
|    learning_rate        | 1e-06        |
|    loss                 | 57.4         |
|    n_updates            | 45830        |
|    policy_gradient_loss | -0.000592    |
|    value_loss           | 215          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.13e+03     |
|    ep_rew_mean          | 2.02e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3420         |
|    time_elapsed         | 14948        |
|    total_timesteps      | 1751040      |
| train/                  |              |
|    approx_kl            | 0.0019811005 |
|    clip_fraction        | 0.0162       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.354       |
|    explained_variance   | 0.878        |
|    learning_rate        | 1e-06        |
|    loss                 | 55           |
|    n_updates            | 45930        |
|    policy_gradient_loss | -0.00195     |
|    value_loss           | 206          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.12e+03     |
|    ep_rew_mean          | 2e+03        |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3430         |
|    time_elapsed         | 14991        |
|    total_timesteps      | 1756160      |
| train/                  |              |
|    approx_kl            | 0.0020419615 |
|    clip_fraction        | 0.00332      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.367       |
|    explained_variance   | 0.809        |
|    learning_rate        | 1e-06        |
|    loss                 | 62.5         |
|    n_updates            | 46030        |
|    policy_gradient_loss | -0.00148     |
|    value_loss           | 169          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.14e+03    |
|    ep_rew_mean          | 2.03e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 3440        |
|    time_elapsed         | 15035       |
|    total_timesteps      | 1761280     |
| train/                  |             |
|    approx_kl            | 0.001064986 |
|    clip_fraction        | 0.000391    |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.43       |
|    explained_variance   | 0.747       |
|    learning_rate        | 1e-06       |
|    loss                 | 126         |
|    n_updates            | 46130       |
|    policy_gradient_loss | -0.00035    |
|    value_loss           | 226         |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.14

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.14e+03    |
|    ep_rew_mean          | 2.02e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 3450        |
|    time_elapsed         | 15078       |
|    total_timesteps      | 1766400     |
| train/                  |             |
|    approx_kl            | 0.004115939 |
|    clip_fraction        | 0.0102      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.742      |
|    explained_variance   | 0.431       |
|    learning_rate        | 1e-06       |
|    loss                 | 374         |
|    n_updates            | 46230       |
|    policy_gradient_loss | -0.00209    |
|    value_loss           | 845         |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.14

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.16e+03      |
|    ep_rew_mean          | 2.05e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 3460          |
|    time_elapsed         | 15123         |
|    total_timesteps      | 1771520       |
| train/                  |               |
|    approx_kl            | 0.00092762033 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.64         |
|    explained_variance   | 0.933         |
|    learning_rate        | 1e-06         |
|    loss                 | 165           |
|    n_updates            | 46330         |
|    policy_gradient_loss | -0.000338     |
|    value_loss           | 212           |
-------------------------------------------
------------------------------------------
| rollout/                |      

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.17e+03    |
|    ep_rew_mean          | 2.05e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 3470        |
|    time_elapsed         | 15166       |
|    total_timesteps      | 1776640     |
| train/                  |             |
|    approx_kl            | 0.005083514 |
|    clip_fraction        | 0.0365      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.55       |
|    explained_variance   | 0.875       |
|    learning_rate        | 1e-06       |
|    loss                 | 88.4        |
|    n_updates            | 46430       |
|    policy_gradient_loss | -0.00157    |
|    value_loss           | 245         |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.17

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.19e+03    |
|    ep_rew_mean          | 2.07e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 3480        |
|    time_elapsed         | 15210       |
|    total_timesteps      | 1781760     |
| train/                  |             |
|    approx_kl            | 0.006078008 |
|    clip_fraction        | 0.0426      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.702      |
|    explained_variance   | 0.862       |
|    learning_rate        | 1e-06       |
|    loss                 | 75.2        |
|    n_updates            | 46530       |
|    policy_gradient_loss | -0.000924   |
|    value_loss           | 212         |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.19

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.19e+03     |
|    ep_rew_mean          | 2.06e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3490         |
|    time_elapsed         | 15253        |
|    total_timesteps      | 1786880      |
| train/                  |              |
|    approx_kl            | 0.0018169257 |
|    clip_fraction        | 0.00156      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.463       |
|    explained_variance   | 0.57         |
|    learning_rate        | 1e-06        |
|    loss                 | 167          |
|    n_updates            | 46630        |
|    policy_gradient_loss | 0.00378      |
|    value_loss           | 463          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.18e+03     |
|    ep_rew_mean          | 2.05e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3500         |
|    time_elapsed         | 15298        |
|    total_timesteps      | 1792000      |
| train/                  |              |
|    approx_kl            | 0.0024625058 |
|    clip_fraction        | 0.0146       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.281       |
|    explained_variance   | 0.867        |
|    learning_rate        | 1e-06        |
|    loss                 | 27.8         |
|    n_updates            | 46730        |
|    policy_gradient_loss | -0.00243     |
|    value_loss           | 104          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.19e+03     |
|    ep_rew_mean          | 2.05e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3510         |
|    time_elapsed         | 15341        |
|    total_timesteps      | 1797120      |
| train/                  |              |
|    approx_kl            | 0.0008098844 |
|    clip_fraction        | 0.00801      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.338       |
|    explained_variance   | 0.579        |
|    learning_rate        | 1e-06        |
|    loss                 | 171          |
|    n_updates            | 46830        |
|    policy_gradient_loss | -0.000701    |
|    value_loss           | 721          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.18e+03     |
|    ep_rew_mean          | 2.05e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3520         |
|    time_elapsed         | 15385        |
|    total_timesteps      | 1802240      |
| train/                  |              |
|    approx_kl            | 0.0026678513 |
|    clip_fraction        | 0.0104       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.337       |
|    explained_variance   | 0.702        |
|    learning_rate        | 1e-06        |
|    loss                 | 74.3         |
|    n_updates            | 46930        |
|    policy_gradient_loss | -0.00128     |
|    value_loss           | 530          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.18e+03      |
|    ep_rew_mean          | 2.06e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 3530          |
|    time_elapsed         | 15428         |
|    total_timesteps      | 1807360       |
| train/                  |               |
|    approx_kl            | 0.00068838336 |
|    clip_fraction        | 0.00449       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.246        |
|    explained_variance   | 0.311         |
|    learning_rate        | 1e-06         |
|    loss                 | 185           |
|    n_updates            | 47030         |
|    policy_gradient_loss | -0.00198      |
|    value_loss           | 848           |
-------------------------------------------
------------------------------------------
| rollout/                |      

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.19e+03    |
|    ep_rew_mean          | 2.08e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 3540        |
|    time_elapsed         | 15473       |
|    total_timesteps      | 1812480     |
| train/                  |             |
|    approx_kl            | 0.001190886 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.656      |
|    explained_variance   | 0.429       |
|    learning_rate        | 1e-06       |
|    loss                 | 791         |
|    n_updates            | 47130       |
|    policy_gradient_loss | 0.000365    |
|    value_loss           | 937         |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.19

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.18e+03     |
|    ep_rew_mean          | 2.07e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3550         |
|    time_elapsed         | 15516        |
|    total_timesteps      | 1817600      |
| train/                  |              |
|    approx_kl            | 0.0011229276 |
|    clip_fraction        | 0.00488      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.427       |
|    explained_variance   | 0.62         |
|    learning_rate        | 1e-06        |
|    loss                 | 270          |
|    n_updates            | 47230        |
|    policy_gradient_loss | 0.00181      |
|    value_loss           | 817          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.19e+03      |
|    ep_rew_mean          | 2.08e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 3560          |
|    time_elapsed         | 15561         |
|    total_timesteps      | 1822720       |
| train/                  |               |
|    approx_kl            | 0.00068677973 |
|    clip_fraction        | 0.0264        |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.42         |
|    explained_variance   | 0.53          |
|    learning_rate        | 1e-06         |
|    loss                 | 420           |
|    n_updates            | 47330         |
|    policy_gradient_loss | -0.000714     |
|    value_loss           | 746           |
-------------------------------------------
------------------------------------------
| rollout/                |      

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.18e+03      |
|    ep_rew_mean          | 2.06e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 3570          |
|    time_elapsed         | 15604         |
|    total_timesteps      | 1827840       |
| train/                  |               |
|    approx_kl            | 0.00012110453 |
|    clip_fraction        | 0.00645       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.302        |
|    explained_variance   | 0.578         |
|    learning_rate        | 1e-06         |
|    loss                 | 193           |
|    n_updates            | 47430         |
|    policy_gradient_loss | -0.000639     |
|    value_loss           | 666           |
-------------------------------------------
------------------------------------------
| rollout/                |      

----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.17e+03   |
|    ep_rew_mean          | 2.06e+03   |
| time/                   |            |
|    fps                  | 117        |
|    iterations           | 3580       |
|    time_elapsed         | 15648      |
|    total_timesteps      | 1832960    |
| train/                  |            |
|    approx_kl            | 0.00805223 |
|    clip_fraction        | 0.0699     |
|    clip_range           | 0.2        |
|    entropy_loss         | -0.51      |
|    explained_variance   | 0.727      |
|    learning_rate        | 1e-06      |
|    loss                 | 82         |
|    n_updates            | 47530      |
|    policy_gradient_loss | -0.00645   |
|    value_loss           | 494        |
----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.17e+03     |
|    ep_re

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.17e+03     |
|    ep_rew_mean          | 2.06e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3590         |
|    time_elapsed         | 15691        |
|    total_timesteps      | 1838080      |
| train/                  |              |
|    approx_kl            | 0.0031814054 |
|    clip_fraction        | 0.00898      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.361       |
|    explained_variance   | 0.769        |
|    learning_rate        | 1e-06        |
|    loss                 | 47           |
|    n_updates            | 47630        |
|    policy_gradient_loss | -0.00219     |
|    value_loss           | 141          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.16e+03     |
|    ep_rew_mean          | 2.08e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3600         |
|    time_elapsed         | 15735        |
|    total_timesteps      | 1843200      |
| train/                  |              |
|    approx_kl            | 0.0036946428 |
|    clip_fraction        | 0.0152       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.529       |
|    explained_variance   | 0.918        |
|    learning_rate        | 1e-06        |
|    loss                 | 51.4         |
|    n_updates            | 47730        |
|    policy_gradient_loss | 0.000208     |
|    value_loss           | 105          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.15e+03    |
|    ep_rew_mean          | 2.07e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 3610        |
|    time_elapsed         | 15779       |
|    total_timesteps      | 1848320     |
| train/                  |             |
|    approx_kl            | 0.008420641 |
|    clip_fraction        | 0.0605      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.376      |
|    explained_variance   | 0.857       |
|    learning_rate        | 1e-06       |
|    loss                 | 105         |
|    n_updates            | 47830       |
|    policy_gradient_loss | -0.00392    |
|    value_loss           | 219         |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.14

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.14e+03     |
|    ep_rew_mean          | 2.08e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3620         |
|    time_elapsed         | 15823        |
|    total_timesteps      | 1853440      |
| train/                  |              |
|    approx_kl            | 0.0004259079 |
|    clip_fraction        | 0.00195      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.296       |
|    explained_variance   | 0.931        |
|    learning_rate        | 1e-06        |
|    loss                 | 109          |
|    n_updates            | 47930        |
|    policy_gradient_loss | -0.00107     |
|    value_loss           | 186          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.11e+03    |
|    ep_rew_mean          | 2.05e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 3630        |
|    time_elapsed         | 15866       |
|    total_timesteps      | 1858560     |
| train/                  |             |
|    approx_kl            | 0.008604162 |
|    clip_fraction        | 0.0395      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.526      |
|    explained_variance   | 0.808       |
|    learning_rate        | 1e-06       |
|    loss                 | 32.8        |
|    n_updates            | 48030       |
|    policy_gradient_loss | -0.00122    |
|    value_loss           | 95.3        |
-----------------------------------------
----------------------------------------
| rollout/                |            |
|    ep_len_mean          | 1.11e+03

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.11e+03    |
|    ep_rew_mean          | 2.04e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 3640        |
|    time_elapsed         | 15910       |
|    total_timesteps      | 1863680     |
| train/                  |             |
|    approx_kl            | 0.003852629 |
|    clip_fraction        | 0.0217      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.469      |
|    explained_variance   | 0.884       |
|    learning_rate        | 1e-06       |
|    loss                 | 46.6        |
|    n_updates            | 48130       |
|    policy_gradient_loss | -0.000857   |
|    value_loss           | 218         |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.11

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.1e+03      |
|    ep_rew_mean          | 2.02e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3650         |
|    time_elapsed         | 15954        |
|    total_timesteps      | 1868800      |
| train/                  |              |
|    approx_kl            | 0.0072221127 |
|    clip_fraction        | 0.025        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.502       |
|    explained_variance   | 0.887        |
|    learning_rate        | 1e-06        |
|    loss                 | 44.4         |
|    n_updates            | 48230        |
|    policy_gradient_loss | -0.00174     |
|    value_loss           | 129          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.1e+03     |
|    ep_rew_mean          | 2e+03       |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 3660        |
|    time_elapsed         | 15997       |
|    total_timesteps      | 1873920     |
| train/                  |             |
|    approx_kl            | 0.002278373 |
|    clip_fraction        | 0.00156     |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.406      |
|    explained_variance   | 0.845       |
|    learning_rate        | 1e-06       |
|    loss                 | 180         |
|    n_updates            | 48330       |
|    policy_gradient_loss | -0.00126    |
|    value_loss           | 377         |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.1e

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.09e+03     |
|    ep_rew_mean          | 2e+03        |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3670         |
|    time_elapsed         | 16042        |
|    total_timesteps      | 1879040      |
| train/                  |              |
|    approx_kl            | 0.0007083003 |
|    clip_fraction        | 0.00313      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.562       |
|    explained_variance   | 0.91         |
|    learning_rate        | 1e-06        |
|    loss                 | 116          |
|    n_updates            | 48430        |
|    policy_gradient_loss | -0.00182     |
|    value_loss           | 170          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.09e+03     |
|    ep_rew_mean          | 2.01e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3680         |
|    time_elapsed         | 16085        |
|    total_timesteps      | 1884160      |
| train/                  |              |
|    approx_kl            | 0.0006965166 |
|    clip_fraction        | 0.00137      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.488       |
|    explained_variance   | 0.749        |
|    learning_rate        | 1e-06        |
|    loss                 | 51.7         |
|    n_updates            | 48530        |
|    policy_gradient_loss | -0.00136     |
|    value_loss           | 371          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.09e+03     |
|    ep_rew_mean          | 2.02e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3690         |
|    time_elapsed         | 16130        |
|    total_timesteps      | 1889280      |
| train/                  |              |
|    approx_kl            | 0.0020291444 |
|    clip_fraction        | 0.00645      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.376       |
|    explained_variance   | 0.746        |
|    learning_rate        | 1e-06        |
|    loss                 | 295          |
|    n_updates            | 48630        |
|    policy_gradient_loss | -0.000422    |
|    value_loss           | 435          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.07e+03      |
|    ep_rew_mean          | 1.99e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 3700          |
|    time_elapsed         | 16173         |
|    total_timesteps      | 1894400       |
| train/                  |               |
|    approx_kl            | 0.00085395377 |
|    clip_fraction        | 0.00586       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.354        |
|    explained_variance   | 0.487         |
|    learning_rate        | 1e-06         |
|    loss                 | 802           |
|    n_updates            | 48730         |
|    policy_gradient_loss | 1.03e-05      |
|    value_loss           | 852           |
-------------------------------------------
-------------------------------------------
| rollout/                |     

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.07e+03      |
|    ep_rew_mean          | 1.98e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 3710          |
|    time_elapsed         | 16217         |
|    total_timesteps      | 1899520       |
| train/                  |               |
|    approx_kl            | 0.00068541034 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.318        |
|    explained_variance   | 0.673         |
|    learning_rate        | 1e-06         |
|    loss                 | 77.3          |
|    n_updates            | 48830         |
|    policy_gradient_loss | 0.000321      |
|    value_loss           | 459           |
-------------------------------------------
------------------------------------------
| rollout/                |      

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.08e+03    |
|    ep_rew_mean          | 1.99e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 3720        |
|    time_elapsed         | 16260       |
|    total_timesteps      | 1904640     |
| train/                  |             |
|    approx_kl            | 0.002948814 |
|    clip_fraction        | 0.0148      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.383      |
|    explained_variance   | 0.846       |
|    learning_rate        | 1e-06       |
|    loss                 | 54.4        |
|    n_updates            | 48930       |
|    policy_gradient_loss | -0.004      |
|    value_loss           | 222         |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.07e+

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.09e+03     |
|    ep_rew_mean          | 2e+03        |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3730         |
|    time_elapsed         | 16304        |
|    total_timesteps      | 1909760      |
| train/                  |              |
|    approx_kl            | 0.0012604547 |
|    clip_fraction        | 0.0105       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.421       |
|    explained_variance   | 0.959        |
|    learning_rate        | 1e-06        |
|    loss                 | 73.1         |
|    n_updates            | 49030        |
|    policy_gradient_loss | -0.0027      |
|    value_loss           | 165          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.08e+03     |
|    ep_rew_mean          | 1.99e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3740         |
|    time_elapsed         | 16348        |
|    total_timesteps      | 1914880      |
| train/                  |              |
|    approx_kl            | 0.0040754466 |
|    clip_fraction        | 0.0746       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.44        |
|    explained_variance   | 0.664        |
|    learning_rate        | 1e-06        |
|    loss                 | 233          |
|    n_updates            | 49130        |
|    policy_gradient_loss | -0.00563     |
|    value_loss           | 534          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.07e+03    |
|    ep_rew_mean          | 1.97e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 3750        |
|    time_elapsed         | 16392       |
|    total_timesteps      | 1920000     |
| train/                  |             |
|    approx_kl            | 0.001918263 |
|    clip_fraction        | 0.00566     |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.482      |
|    explained_variance   | 0.935       |
|    learning_rate        | 1e-06       |
|    loss                 | 44.9        |
|    n_updates            | 49230       |
|    policy_gradient_loss | 0.000179    |
|    value_loss           | 177         |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.07

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.05e+03    |
|    ep_rew_mean          | 1.93e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 3760        |
|    time_elapsed         | 16435       |
|    total_timesteps      | 1925120     |
| train/                  |             |
|    approx_kl            | 0.001579847 |
|    clip_fraction        | 0.00508     |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.353      |
|    explained_variance   | 0.708       |
|    learning_rate        | 1e-06       |
|    loss                 | 306         |
|    n_updates            | 49330       |
|    policy_gradient_loss | -0.00314    |
|    value_loss           | 559         |
-----------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.05

-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.06e+03    |
|    ep_rew_mean          | 1.94e+03    |
| time/                   |             |
|    fps                  | 117         |
|    iterations           | 3770        |
|    time_elapsed         | 16479       |
|    total_timesteps      | 1930240     |
| train/                  |             |
|    approx_kl            | 0.005300073 |
|    clip_fraction        | 0.049       |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.519      |
|    explained_variance   | 0.733       |
|    learning_rate        | 1e-06       |
|    loss                 | 43.5        |
|    n_updates            | 49430       |
|    policy_gradient_loss | 0.00338     |
|    value_loss           | 177         |
-----------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_mean          | 1.06e+

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.05e+03     |
|    ep_rew_mean          | 1.93e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3780         |
|    time_elapsed         | 16522        |
|    total_timesteps      | 1935360      |
| train/                  |              |
|    approx_kl            | 0.0044438066 |
|    clip_fraction        | 0.0301       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.212       |
|    explained_variance   | 0.442        |
|    learning_rate        | 1e-06        |
|    loss                 | 233          |
|    n_updates            | 49530        |
|    policy_gradient_loss | -0.00478     |
|    value_loss           | 846          |
------------------------------------------
-------------------------------------------
| rollout/                |               |
|    ep_l

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.04e+03     |
|    ep_rew_mean          | 1.91e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3790         |
|    time_elapsed         | 16566        |
|    total_timesteps      | 1940480      |
| train/                  |              |
|    approx_kl            | 0.0003570856 |
|    clip_fraction        | 0.00215      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.168       |
|    explained_variance   | 0.79         |
|    learning_rate        | 1e-06        |
|    loss                 | 200          |
|    n_updates            | 49630        |
|    policy_gradient_loss | -0.00196     |
|    value_loss           | 510          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.04e+03     |
|    ep_rew_mean          | 1.9e+03      |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3800         |
|    time_elapsed         | 16610        |
|    total_timesteps      | 1945600      |
| train/                  |              |
|    approx_kl            | 0.0007359348 |
|    clip_fraction        | 0.00605      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.186       |
|    explained_variance   | 0.912        |
|    learning_rate        | 1e-06        |
|    loss                 | 45.1         |
|    n_updates            | 49730        |
|    policy_gradient_loss | -0.000847    |
|    value_loss           | 149          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

-------------------------------------------
| rollout/                |               |
|    ep_len_mean          | 1.03e+03      |
|    ep_rew_mean          | 1.88e+03      |
| time/                   |               |
|    fps                  | 117           |
|    iterations           | 3810          |
|    time_elapsed         | 16654         |
|    total_timesteps      | 1950720       |
| train/                  |               |
|    approx_kl            | 0.00047897117 |
|    clip_fraction        | 0.00293       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.293        |
|    explained_variance   | 0.772         |
|    learning_rate        | 1e-06         |
|    loss                 | 45.2          |
|    n_updates            | 49830         |
|    policy_gradient_loss | 0.000276      |
|    value_loss           | 192           |
-------------------------------------------
------------------------------------------
| rollout/                |      

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.02e+03     |
|    ep_rew_mean          | 1.86e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3820         |
|    time_elapsed         | 16697        |
|    total_timesteps      | 1955840      |
| train/                  |              |
|    approx_kl            | 0.0016157769 |
|    clip_fraction        | 0.0303       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.316       |
|    explained_variance   | 0.706        |
|    learning_rate        | 1e-06        |
|    loss                 | 186          |
|    n_updates            | 49930        |
|    policy_gradient_loss | -0.00169     |
|    value_loss           | 530          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.03e+03     |
|    ep_rew_mean          | 1.86e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3830         |
|    time_elapsed         | 16741        |
|    total_timesteps      | 1960960      |
| train/                  |              |
|    approx_kl            | 0.0070431065 |
|    clip_fraction        | 0.0256       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.387       |
|    explained_variance   | 0.851        |
|    learning_rate        | 1e-06        |
|    loss                 | 30.4         |
|    n_updates            | 50030        |
|    policy_gradient_loss | -0.00369     |
|    value_loss           | 121          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.05e+03     |
|    ep_rew_mean          | 1.89e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3840         |
|    time_elapsed         | 16784        |
|    total_timesteps      | 1966080      |
| train/                  |              |
|    approx_kl            | 0.0023196125 |
|    clip_fraction        | 0.00332      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.357       |
|    explained_variance   | 0.853        |
|    learning_rate        | 1e-06        |
|    loss                 | 91.3         |
|    n_updates            | 50130        |
|    policy_gradient_loss | -0.00171     |
|    value_loss           | 216          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.03e+03     |
|    ep_rew_mean          | 1.89e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3850         |
|    time_elapsed         | 16828        |
|    total_timesteps      | 1971200      |
| train/                  |              |
|    approx_kl            | 0.0010124632 |
|    clip_fraction        | 0.00723      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.422       |
|    explained_variance   | 0.387        |
|    learning_rate        | 1e-06        |
|    loss                 | 341          |
|    n_updates            | 50230        |
|    policy_gradient_loss | 0.00232      |
|    value_loss           | 851          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.03e+03     |
|    ep_rew_mean          | 1.89e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3860         |
|    time_elapsed         | 16872        |
|    total_timesteps      | 1976320      |
| train/                  |              |
|    approx_kl            | 0.0067122355 |
|    clip_fraction        | 0.0539       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.601       |
|    explained_variance   | 0.881        |
|    learning_rate        | 1e-06        |
|    loss                 | 117          |
|    n_updates            | 50330        |
|    policy_gradient_loss | -0.00318     |
|    value_loss           | 262          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.04e+03     |
|    ep_rew_mean          | 1.9e+03      |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3870         |
|    time_elapsed         | 16916        |
|    total_timesteps      | 1981440      |
| train/                  |              |
|    approx_kl            | 0.0071572727 |
|    clip_fraction        | 0.0775       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.505       |
|    explained_variance   | 0.911        |
|    learning_rate        | 1e-06        |
|    loss                 | 28.2         |
|    n_updates            | 50430        |
|    policy_gradient_loss | -0.00437     |
|    value_loss           | 81.6         |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.04e+03     |
|    ep_rew_mean          | 1.91e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3880         |
|    time_elapsed         | 16959        |
|    total_timesteps      | 1986560      |
| train/                  |              |
|    approx_kl            | 0.0011261684 |
|    clip_fraction        | 0.0041       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.345       |
|    explained_variance   | 0.922        |
|    learning_rate        | 1e-06        |
|    loss                 | 62.1         |
|    n_updates            | 50530        |
|    policy_gradient_loss | -0.0008      |
|    value_loss           | 245          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.04e+03     |
|    ep_rew_mean          | 1.91e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3890         |
|    time_elapsed         | 17004        |
|    total_timesteps      | 1991680      |
| train/                  |              |
|    approx_kl            | 0.0019688713 |
|    clip_fraction        | 0.00781      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.317       |
|    explained_variance   | 0.874        |
|    learning_rate        | 1e-06        |
|    loss                 | 69.1         |
|    n_updates            | 50630        |
|    policy_gradient_loss | -0.00205     |
|    value_loss           | 284          |
------------------------------------------
------------------------------------------
| rollout/                |              |
|    ep_len

------------------------------------------
| rollout/                |              |
|    ep_len_mean          | 1.04e+03     |
|    ep_rew_mean          | 1.91e+03     |
| time/                   |              |
|    fps                  | 117          |
|    iterations           | 3900         |
|    time_elapsed         | 17047        |
|    total_timesteps      | 1996800      |
| train/                  |              |
|    approx_kl            | 0.0013920767 |
|    clip_fraction        | 0.00586      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.328       |
|    explained_variance   | 0.971        |
|    learning_rate        | 1e-06        |
|    loss                 | 23.5         |
|    n_updates            | 50730        |
|    policy_gradient_loss | -0.00193     |
|    value_loss           | 147          |
------------------------------------------
-----------------------------------------
| rollout/                |             |
|    ep_len_m

<stable_baselines3.ppo.ppo.PPO at 0x12741ed41c0>

In [15]:
# Persist the trained agent once learning has finished. The target is a
# bare relative name, so the file is created relative to the kernel's
# current working directory.
# NOTE(review): `model` is presumably the PPO instance whose repr the
# previous cell printed; the library is expected to pick the on-disk
# format/extension itself -- confirm against the installed version.
model.save(path="pporandommodel")