# 1. Setup

In [None]:
!pip install gym_super_mario_bros==7.3.0 nes_py

In [1]:
#Import the game
import gym_super_mario_bros

#Import the Joypad wrapper
from nes_py.wrappers import JoypadSpace

#Import the simplified controls
from gym_super_mario_bros.actions import SIMPLE_MOVEMENT

In [None]:
#Setup the game
env = gym_super_mario_bros.make('SuperMarioBros-v0')
env = JoypadSpace(env, SIMPLE_MOVEMENT)

In [None]:
#Create a flag -> Restart the game or not
restart = True

#Loop through each frame in the game
for step in range(100000):
    if restart:
        #Restart the game
        env.reset()
    #Do random action
    state, reward, restart, info = env.step(env.action_space.sample())
    #Display the game
    env.render()
#Close the game
env.close()

In [None]:
env.close()

# 2. Preprocess the Environment

In [None]:
#Install PyTorch
!pip install torch==1.10.1+cu113 torchvision==0.11.2+cu113 torchaudio===0.10.1+cu113 -f https://download.pytorch.org/whl/cu113/torch_stable.html

In [None]:
#Install stable baselines for Reinforced Learning
!pip install stable-baselines3[extra]

In [2]:
# Import Frame Stacker Wrapper and GrayScaling Wrapper
from gym.wrappers import GrayScaleObservation
# Import Vectorization Wrappers
from stable_baselines3.common.vec_env import VecFrameStack, DummyVecEnv
# Import Matplotlib to show the impact of frame stacking
from matplotlib import pyplot as plt

In [3]:
# 1. Create the base environment
env = gym_super_mario_bros.make('SuperMarioBros-v0')
# 2. Simplify the controls 
env = JoypadSpace(env, SIMPLE_MOVEMENT)
# 3. Grayscale
env = GrayScaleObservation(env, keep_dim=True)
# 4. Wrap inside the Dummy Environment
env = DummyVecEnv([lambda: env])
# 5. Stack the frames
env = VecFrameStack(env, 4, channels_order='last')

# 3. Train The Model

In [4]:
# Import os for file path management
import os 
# Import PPO for algos
from stable_baselines3 import PPO
# Import Base Callback for saving models
from stable_baselines3.common.callbacks import BaseCallback

In [5]:
class TrainAndLoggingCallback(BaseCallback):

    def __init__(self, check_freq, save_path, verbose=1):
        super(TrainAndLoggingCallback, self).__init__(verbose)
        self.check_freq = check_freq
        self.save_path = save_path

    def _init_callback(self):
        if self.save_path is not None:
            os.makedirs(self.save_path, exist_ok=True)

    def _on_step(self):
        if self.n_calls % self.check_freq == 0:
            model_path = os.path.join(self.save_path, 'best_model_{}'.format(self.n_calls))
            self.model.save(model_path)

        return True

In [6]:
CHECKPOINT_DIR = './train/'
LOG_DIR = './logs/'

In [7]:
# Setup model saving callback
callback = TrainAndLoggingCallback(check_freq=100000, save_path=CHECKPOINT_DIR)

In [8]:
# This is the AI model started
model = PPO('CnnPolicy', env, verbose=1, tensorboard_log=LOG_DIR, learning_rate=0.000001, 
            n_steps=512) 

Using cuda device
Wrapping the env in a VecTransposeImage.


In [None]:
# Train the AI model, this is where the AI model starts to learn
model.learn(total_timesteps=5000000, callback=callback)

Logging to ./logs/PPO_4


  return (self.ram[0x86] - self.ram[0x071c]) % 256


----------------------------
| time/              |     |
|    fps             | 7   |
|    iterations      | 1   |
|    time_elapsed    | 67  |
|    total_timesteps | 512 |
----------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 2             |
|    time_elapsed         | 103           |
|    total_timesteps      | 1024          |
| train/                  |               |
|    approx_kl            | 2.8963666e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.95         |
|    explained_variance   | 0.00636       |
|    learning_rate        | 1e-06         |
|    loss                 | 114           |
|    n_updates            | 10            |
|    policy_gradient_loss | -0.000408     |
|    value_loss           | 291           |
-------------------------------------------
-----

-------------------------------------------
| time/                   |               |
|    fps                  | 13            |
|    iterations           | 13            |
|    time_elapsed         | 492           |
|    total_timesteps      | 6656          |
| train/                  |               |
|    approx_kl            | 2.5687274e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.94         |
|    explained_variance   | -0.0088       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.082         |
|    n_updates            | 120           |
|    policy_gradient_loss | -0.000283     |
|    value_loss           | 0.202         |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 13           |
|    iterations           | 14           |
|    time_elapsed         | 522     

-------------------------------------------
| time/                   |               |
|    fps                  | 14            |
|    iterations           | 24            |
|    time_elapsed         | 825           |
|    total_timesteps      | 12288         |
| train/                  |               |
|    approx_kl            | 3.1109666e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.94         |
|    explained_variance   | 0.00657       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.158         |
|    n_updates            | 230           |
|    policy_gradient_loss | -0.000304     |
|    value_loss           | 0.391         |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 14           |
|    iterations           | 25           |
|    time_elapsed         | 853     

-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 35            |
|    time_elapsed         | 1138          |
|    total_timesteps      | 17920         |
| train/                  |               |
|    approx_kl            | 2.3184228e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.93         |
|    explained_variance   | 0.0525        |
|    learning_rate        | 1e-06         |
|    loss                 | 5.97          |
|    n_updates            | 340           |
|    policy_gradient_loss | -0.000252     |
|    value_loss           | 23.9          |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 36            |
|    time_elapsed         | 1167

-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 46            |
|    time_elapsed         | 1483          |
|    total_timesteps      | 23552         |
| train/                  |               |
|    approx_kl            | 3.0030147e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.93         |
|    explained_variance   | -0.104        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0462        |
|    n_updates            | 450           |
|    policy_gradient_loss | -0.000201     |
|    value_loss           | 0.137         |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 47           |
|    time_elapsed         | 1513    

-----------------------------------------
| time/                   |             |
|    fps                  | 15          |
|    iterations           | 57          |
|    time_elapsed         | 1872        |
|    total_timesteps      | 29184       |
| train/                  |             |
|    approx_kl            | 8.16863e-05 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -1.91       |
|    explained_variance   | 0.00602     |
|    learning_rate        | 1e-06       |
|    loss                 | 0.226       |
|    n_updates            | 560         |
|    policy_gradient_loss | 0.000121    |
|    value_loss           | 2.34        |
-----------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 58            |
|    time_elapsed         | 1909          |
|    total_timesteps    

----------------------------------------
| time/                   |            |
|    fps                  | 15         |
|    iterations           | 68         |
|    time_elapsed         | 2261       |
|    total_timesteps      | 34816      |
| train/                  |            |
|    approx_kl            | 0.00015389 |
|    clip_fraction        | 0          |
|    clip_range           | 0.2        |
|    entropy_loss         | -1.89      |
|    explained_variance   | 0.249      |
|    learning_rate        | 1e-06      |
|    loss                 | 42.3       |
|    n_updates            | 670        |
|    policy_gradient_loss | -0.00048   |
|    value_loss           | 86.4       |
----------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 69            |
|    time_elapsed         | 2294          |
|    total_timesteps      | 35328         

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 79           |
|    time_elapsed         | 2643         |
|    total_timesteps      | 40448        |
| train/                  |              |
|    approx_kl            | 5.851942e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.9         |
|    explained_variance   | -0.0623      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0709       |
|    n_updates            | 780          |
|    policy_gradient_loss | -0.000219    |
|    value_loss           | 0.171        |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 80            |
|    time_elapsed         | 2676          |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 90           |
|    time_elapsed         | 3022         |
|    total_timesteps      | 46080        |
| train/                  |              |
|    approx_kl            | 7.899373e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.88        |
|    explained_variance   | 0.636        |
|    learning_rate        | 1e-06        |
|    loss                 | 0.189        |
|    n_updates            | 890          |
|    policy_gradient_loss | -0.000332    |
|    value_loss           | 0.554        |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 91           |
|    time_elapsed         | 3056         |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 101           |
|    time_elapsed         | 3397          |
|    total_timesteps      | 51712         |
| train/                  |               |
|    approx_kl            | 0.00020597049 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 0.281         |
|    learning_rate        | 1e-06         |
|    loss                 | 0.262         |
|    n_updates            | 1000          |
|    policy_gradient_loss | -0.000227     |
|    value_loss           | 0.73          |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 102           |
|    time_elapsed         | 3429

-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 112           |
|    time_elapsed         | 3769          |
|    total_timesteps      | 57344         |
| train/                  |               |
|    approx_kl            | 0.00020582392 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.87         |
|    explained_variance   | -0.00955      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.05          |
|    n_updates            | 1110          |
|    policy_gradient_loss | -0.000891     |
|    value_loss           | 0.143         |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 113          |
|    time_elapsed         | 3801    

-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 123           |
|    time_elapsed         | 4143          |
|    total_timesteps      | 62976         |
| train/                  |               |
|    approx_kl            | 0.00016503572 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.85         |
|    explained_variance   | -0.0104       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0352        |
|    n_updates            | 1220          |
|    policy_gradient_loss | -0.000718     |
|    value_loss           | 0.19          |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 124           |
|    time_elapsed         | 4177

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 134          |
|    time_elapsed         | 4487         |
|    total_timesteps      | 68608        |
| train/                  |              |
|    approx_kl            | 0.0002186005 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.00449      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.14         |
|    n_updates            | 1330         |
|    policy_gradient_loss | -0.000883    |
|    value_loss           | 0.56         |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 135          |
|    time_elapsed         | 4515         |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 145           |
|    time_elapsed         | 4804          |
|    total_timesteps      | 74240         |
| train/                  |               |
|    approx_kl            | 2.6454916e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 0.519         |
|    learning_rate        | 1e-06         |
|    loss                 | 0.168         |
|    n_updates            | 1440          |
|    policy_gradient_loss | -0.00015      |
|    value_loss           | 1.08          |
-------------------------------------------
-----------------------------------------
| time/                   |             |
|    fps                  | 15          |
|    iterations           | 146         |
|    time_elapsed         | 4833        

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 156          |
|    time_elapsed         | 5118         |
|    total_timesteps      | 79872        |
| train/                  |              |
|    approx_kl            | 0.0001013045 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.84        |
|    explained_variance   | 0.447        |
|    learning_rate        | 1e-06        |
|    loss                 | 0.108        |
|    n_updates            | 1550         |
|    policy_gradient_loss | -0.00044     |
|    value_loss           | 0.664        |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 157           |
|    time_elapsed         | 5146          |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 167           |
|    time_elapsed         | 5436          |
|    total_timesteps      | 85504         |
| train/                  |               |
|    approx_kl            | 0.00015527674 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.84         |
|    explained_variance   | 0.0305        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0889        |
|    n_updates            | 1660          |
|    policy_gradient_loss | -0.000488     |
|    value_loss           | 0.416         |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 168           |
|    time_elapsed         | 5464

-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 178           |
|    time_elapsed         | 5755          |
|    total_timesteps      | 91136         |
| train/                  |               |
|    approx_kl            | 3.7533697e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.81         |
|    explained_variance   | 0.442         |
|    learning_rate        | 1e-06         |
|    loss                 | 38.1          |
|    n_updates            | 1770          |
|    policy_gradient_loss | 7.79e-05      |
|    value_loss           | 84.5          |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 179           |
|    time_elapsed         | 5784

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 189          |
|    time_elapsed         | 6066         |
|    total_timesteps      | 96768        |
| train/                  |              |
|    approx_kl            | 4.967919e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.83        |
|    explained_variance   | 0.265        |
|    learning_rate        | 1e-06        |
|    loss                 | 23.5         |
|    n_updates            | 1880         |
|    policy_gradient_loss | -0.000372    |
|    value_loss           | 54.6         |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 190           |
|    time_elapsed         | 6093          |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 16            |
|    iterations           | 200           |
|    time_elapsed         | 6378          |
|    total_timesteps      | 102400        |
| train/                  |               |
|    approx_kl            | 0.00060341274 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.79         |
|    explained_variance   | -0.00679      |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0458        |
|    n_updates            | 1990          |
|    policy_gradient_loss | -0.00168      |
|    value_loss           | 0.143         |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 16            |
|    iterations           | 201           |
|    time_elapsed         | 6407

-----------------------------------------
| time/                   |             |
|    fps                  | 16          |
|    iterations           | 211         |
|    time_elapsed         | 6691        |
|    total_timesteps      | 108032      |
| train/                  |             |
|    approx_kl            | 0.000767382 |
|    clip_fraction        | 0.000195    |
|    clip_range           | 0.2         |
|    entropy_loss         | -1.65       |
|    explained_variance   | 0.602       |
|    learning_rate        | 1e-06       |
|    loss                 | 58.5        |
|    n_updates            | 2100        |
|    policy_gradient_loss | -0.000102   |
|    value_loss           | 131         |
-----------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 16            |
|    iterations           | 212           |
|    time_elapsed         | 6718          |
|    total_timesteps    

------------------------------------------
| time/                   |              |
|    fps                  | 16           |
|    iterations           | 222          |
|    time_elapsed         | 7003         |
|    total_timesteps      | 113664       |
| train/                  |              |
|    approx_kl            | 0.0003519886 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.75        |
|    explained_variance   | 0.00335      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0671       |
|    n_updates            | 2210         |
|    policy_gradient_loss | -0.00116     |
|    value_loss           | 0.2          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 16           |
|    iterations           | 223          |
|    time_elapsed         | 7032         |
|    total_

--------------------------------------------
| time/                   |                |
|    fps                  | 16             |
|    iterations           | 233            |
|    time_elapsed         | 7316           |
|    total_timesteps      | 119296         |
| train/                  |                |
|    approx_kl            | 0.000120378914 |
|    clip_fraction        | 0              |
|    clip_range           | 0.2            |
|    entropy_loss         | -1.75          |
|    explained_variance   | 0.0107         |
|    learning_rate        | 1e-06          |
|    loss                 | 0.131          |
|    n_updates            | 2320           |
|    policy_gradient_loss | -0.000386      |
|    value_loss           | 0.31           |
--------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 16           |
|    iterations           | 234          |
|    time_elapsed 

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 244          |
|    time_elapsed         | 8282         |
|    total_timesteps      | 124928       |
| train/                  |              |
|    approx_kl            | 0.0003164435 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.7         |
|    explained_variance   | 0.0368       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.13         |
|    n_updates            | 2430         |
|    policy_gradient_loss | -0.000801    |
|    value_loss           | 1.61         |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 245          |
|    time_elapsed         | 8311         |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 255          |
|    time_elapsed         | 8601         |
|    total_timesteps      | 130560       |
| train/                  |              |
|    approx_kl            | 0.0005519547 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.73        |
|    explained_variance   | 0.00898      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0669       |
|    n_updates            | 2540         |
|    policy_gradient_loss | -0.0013      |
|    value_loss           | 0.197        |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 256           |
|    time_elapsed         | 8631          |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 266          |
|    time_elapsed         | 8917         |
|    total_timesteps      | 136192       |
| train/                  |              |
|    approx_kl            | 0.0005133104 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.72        |
|    explained_variance   | 0.000378     |
|    learning_rate        | 1e-06        |
|    loss                 | 0.174        |
|    n_updates            | 2650         |
|    policy_gradient_loss | -0.00179     |
|    value_loss           | 0.29         |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 267           |
|    time_elapsed         | 8944          |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 277           |
|    time_elapsed         | 9229          |
|    total_timesteps      | 141824        |
| train/                  |               |
|    approx_kl            | 0.00016239064 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.69         |
|    explained_variance   | 0.0423        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.179         |
|    n_updates            | 2760          |
|    policy_gradient_loss | 0.000414      |
|    value_loss           | 2.3           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 278           |
|    time_elapsed         | 9258

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 288          |
|    time_elapsed         | 9539         |
|    total_timesteps      | 147456       |
| train/                  |              |
|    approx_kl            | 0.0008876525 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.7         |
|    explained_variance   | 0.0405       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0665       |
|    n_updates            | 2870         |
|    policy_gradient_loss | -0.00165     |
|    value_loss           | 0.233        |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 289           |
|    time_elapsed         | 9566          |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 299          |
|    time_elapsed         | 9849         |
|    total_timesteps      | 153088       |
| train/                  |              |
|    approx_kl            | 0.0006431587 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.63        |
|    explained_variance   | -0.0111      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.372        |
|    n_updates            | 2980         |
|    policy_gradient_loss | -0.00106     |
|    value_loss           | 3.91         |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 300           |
|    time_elapsed         | 9877          |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 310          |
|    time_elapsed         | 10182        |
|    total_timesteps      | 158720       |
| train/                  |              |
|    approx_kl            | 0.0002504919 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.68        |
|    explained_variance   | -0.0375      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0396       |
|    n_updates            | 3090         |
|    policy_gradient_loss | -0.000432    |
|    value_loss           | 0.137        |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 311          |
|    time_elapsed         | 10215        |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 321          |
|    time_elapsed         | 10509        |
|    total_timesteps      | 164352       |
| train/                  |              |
|    approx_kl            | 0.0017757119 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.65        |
|    explained_variance   | 0.0323       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.121        |
|    n_updates            | 3200         |
|    policy_gradient_loss | -0.00379     |
|    value_loss           | 0.223        |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 322           |
|    time_elapsed         | 10537         |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 332           |
|    time_elapsed         | 10831         |
|    total_timesteps      | 169984        |
| train/                  |               |
|    approx_kl            | 0.00012880098 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.56         |
|    explained_variance   | -0.147        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0888        |
|    n_updates            | 3310          |
|    policy_gradient_loss | -0.000182     |
|    value_loss           | 0.229         |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 333           |
|    time_elapsed         | 1086

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 343          |
|    time_elapsed         | 11155        |
|    total_timesteps      | 175616       |
| train/                  |              |
|    approx_kl            | 0.0017068426 |
|    clip_fraction        | 0.00137      |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.46        |
|    explained_variance   | 0.701        |
|    learning_rate        | 1e-06        |
|    loss                 | 87.9         |
|    n_updates            | 3420         |
|    policy_gradient_loss | 0.00148      |
|    value_loss           | 248          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 344          |
|    time_elapsed         | 11184        |
|    total_

-----------------------------------------
| time/                   |             |
|    fps                  | 15          |
|    iterations           | 354         |
|    time_elapsed         | 11472       |
|    total_timesteps      | 181248      |
| train/                  |             |
|    approx_kl            | 0.000535629 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -1.48       |
|    explained_variance   | 0.0192      |
|    learning_rate        | 1e-06       |
|    loss                 | 0.0441      |
|    n_updates            | 3530        |
|    policy_gradient_loss | -0.00111    |
|    value_loss           | 0.109       |
-----------------------------------------
-----------------------------------------
| time/                   |             |
|    fps                  | 15          |
|    iterations           | 355         |
|    time_elapsed         | 11501       |
|    total_timesteps      | 181760

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 365          |
|    time_elapsed         | 11783        |
|    total_timesteps      | 186880       |
| train/                  |              |
|    approx_kl            | 0.0007315978 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.37        |
|    explained_variance   | 0.0237       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.152        |
|    n_updates            | 3640         |
|    policy_gradient_loss | -0.00134     |
|    value_loss           | 0.295        |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 366          |
|    time_elapsed         | 11811        |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 376          |
|    time_elapsed         | 12089        |
|    total_timesteps      | 192512       |
| train/                  |              |
|    approx_kl            | 0.0006792046 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.29        |
|    explained_variance   | 0.0204       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0401       |
|    n_updates            | 3750         |
|    policy_gradient_loss | -0.000978    |
|    value_loss           | 0.176        |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 377           |
|    time_elapsed         | 12117         |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 387           |
|    time_elapsed         | 12395         |
|    total_timesteps      | 198144        |
| train/                  |               |
|    approx_kl            | 0.00011164823 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.27         |
|    explained_variance   | 0.0131        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0518        |
|    n_updates            | 3860          |
|    policy_gradient_loss | -0.000174     |
|    value_loss           | 0.0974        |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 388          |
|    time_elapsed         | 12422   

------------------------------------------
| time/                   |              |
|    fps                  | 16           |
|    iterations           | 398          |
|    time_elapsed         | 12716        |
|    total_timesteps      | 203776       |
| train/                  |              |
|    approx_kl            | 8.687435e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.17        |
|    explained_variance   | 0.11         |
|    learning_rate        | 1e-06        |
|    loss                 | 0.061        |
|    n_updates            | 3970         |
|    policy_gradient_loss | -0.000506    |
|    value_loss           | 0.22         |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 16            |
|    iterations           | 399           |
|    time_elapsed         | 12746         |
|    t

--------------------------------------------
| time/                   |                |
|    fps                  | 16             |
|    iterations           | 409            |
|    time_elapsed         | 13034          |
|    total_timesteps      | 209408         |
| train/                  |                |
|    approx_kl            | 0.000118567375 |
|    clip_fraction        | 0              |
|    clip_range           | 0.2            |
|    entropy_loss         | -0.942         |
|    explained_variance   | -0.0355        |
|    learning_rate        | 1e-06          |
|    loss                 | 0.0688         |
|    n_updates            | 4080           |
|    policy_gradient_loss | -0.000135      |
|    value_loss           | 0.309          |
--------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 16            |
|    iterations           | 410           |
|    time_elap

-----------------------------------------
| time/                   |             |
|    fps                  | 15          |
|    iterations           | 420         |
|    time_elapsed         | 14163       |
|    total_timesteps      | 215040      |
| train/                  |             |
|    approx_kl            | 0.000840624 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.834      |
|    explained_variance   | -0.00444    |
|    learning_rate        | 1e-06       |
|    loss                 | 0.0504      |
|    n_updates            | 4190        |
|    policy_gradient_loss | -0.00136    |
|    value_loss           | 0.11        |
-----------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 421          |
|    time_elapsed         | 14191        |
|    total_timesteps      | 2

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 431          |
|    time_elapsed         | 14496        |
|    total_timesteps      | 220672       |
| train/                  |              |
|    approx_kl            | 0.0002324587 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.879       |
|    explained_variance   | -0.0112      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0848       |
|    n_updates            | 4300         |
|    policy_gradient_loss | -0.000464    |
|    value_loss           | 0.246        |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 432          |
|    time_elapsed         | 14526        |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 442          |
|    time_elapsed         | 14818        |
|    total_timesteps      | 226304       |
| train/                  |              |
|    approx_kl            | 0.0011542748 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.851       |
|    explained_variance   | -0.115       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0405       |
|    n_updates            | 4410         |
|    policy_gradient_loss | -0.00154     |
|    value_loss           | 0.106        |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 443          |
|    time_elapsed         | 14845        |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 453           |
|    time_elapsed         | 15125         |
|    total_timesteps      | 231936        |
| train/                  |               |
|    approx_kl            | 0.00033224514 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.426        |
|    explained_variance   | 0.741         |
|    learning_rate        | 1e-06         |
|    loss                 | 73.3          |
|    n_updates            | 4520          |
|    policy_gradient_loss | 5.24e-05      |
|    value_loss           | 192           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 454           |
|    time_elapsed         | 1515

-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 464           |
|    time_elapsed         | 15443         |
|    total_timesteps      | 237568        |
| train/                  |               |
|    approx_kl            | 0.00082908035 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.64         |
|    explained_variance   | -0.0913       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0657        |
|    n_updates            | 4630          |
|    policy_gradient_loss | -0.00262      |
|    value_loss           | 0.336         |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 465           |
|    time_elapsed         | 1547

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 475          |
|    time_elapsed         | 15763        |
|    total_timesteps      | 243200       |
| train/                  |              |
|    approx_kl            | 0.0003283578 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.562       |
|    explained_variance   | -0.145       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0461       |
|    n_updates            | 4740         |
|    policy_gradient_loss | -0.000862    |
|    value_loss           | 0.176        |
------------------------------------------
-----------------------------------------
| time/                   |             |
|    fps                  | 15          |
|    iterations           | 476         |
|    time_elapsed         | 15793       |
|    total_times

-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 486           |
|    time_elapsed         | 16083         |
|    total_timesteps      | 248832        |
| train/                  |               |
|    approx_kl            | 0.00097546354 |
|    clip_fraction        | 0.00313       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.635        |
|    explained_variance   | 0.0145        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.801         |
|    n_updates            | 4850          |
|    policy_gradient_loss | 0.00215       |
|    value_loss           | 13.3          |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 487           |
|    time_elapsed         | 1611

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 497          |
|    time_elapsed         | 16404        |
|    total_timesteps      | 254464       |
| train/                  |              |
|    approx_kl            | 0.0012399178 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.869       |
|    explained_variance   | -0.0125      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0557       |
|    n_updates            | 4960         |
|    policy_gradient_loss | -0.00109     |
|    value_loss           | 0.106        |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 498          |
|    time_elapsed         | 16435        |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 508          |
|    time_elapsed         | 16726        |
|    total_timesteps      | 260096       |
| train/                  |              |
|    approx_kl            | 0.0009246047 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.873       |
|    explained_variance   | 0.0663       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0703       |
|    n_updates            | 5070         |
|    policy_gradient_loss | -0.00142     |
|    value_loss           | 0.157        |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 509           |
|    time_elapsed         | 16754         |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 519           |
|    time_elapsed         | 17075         |
|    total_timesteps      | 265728        |
| train/                  |               |
|    approx_kl            | 0.00097500836 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.03         |
|    explained_variance   | -0.031        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0884        |
|    n_updates            | 5180          |
|    policy_gradient_loss | -0.00151      |
|    value_loss           | 0.263         |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 520          |
|    time_elapsed         | 17114   

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 530          |
|    time_elapsed         | 17502        |
|    total_timesteps      | 271360       |
| train/                  |              |
|    approx_kl            | 0.0061681243 |
|    clip_fraction        | 0.0135       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.918       |
|    explained_variance   | -0.0356      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0209       |
|    n_updates            | 5290         |
|    policy_gradient_loss | -0.00754     |
|    value_loss           | 0.113        |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 531          |
|    time_elapsed         | 17535        |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 541           |
|    time_elapsed         | 17844         |
|    total_timesteps      | 276992        |
| train/                  |               |
|    approx_kl            | 0.00033700047 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.868        |
|    explained_variance   | -0.139        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0411        |
|    n_updates            | 5400          |
|    policy_gradient_loss | -0.00069      |
|    value_loss           | 0.165         |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 542           |
|    time_elapsed         | 1787

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 552          |
|    time_elapsed         | 18166        |
|    total_timesteps      | 282624       |
| train/                  |              |
|    approx_kl            | 0.0007393339 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.991       |
|    explained_variance   | 0.188        |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0705       |
|    n_updates            | 5510         |
|    policy_gradient_loss | -0.00189     |
|    value_loss           | 0.217        |
------------------------------------------
-----------------------------------------
| time/                   |             |
|    fps                  | 15          |
|    iterations           | 553         |
|    time_elapsed         | 18194       |
|    total_times

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 563          |
|    time_elapsed         | 18488        |
|    total_timesteps      | 288256       |
| train/                  |              |
|    approx_kl            | 0.0022997991 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.11        |
|    explained_variance   | -0.0228      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0501       |
|    n_updates            | 5620         |
|    policy_gradient_loss | -0.00131     |
|    value_loss           | 0.111        |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 564          |
|    time_elapsed         | 18518        |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 574          |
|    time_elapsed         | 18810        |
|    total_timesteps      | 293888       |
| train/                  |              |
|    approx_kl            | 0.0013775078 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.22        |
|    explained_variance   | -0.173       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.106        |
|    n_updates            | 5730         |
|    policy_gradient_loss | -0.0018      |
|    value_loss           | 0.177        |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 575           |
|    time_elapsed         | 18839         |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 585          |
|    time_elapsed         | 19129        |
|    total_timesteps      | 299520       |
| train/                  |              |
|    approx_kl            | 3.515836e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.19        |
|    explained_variance   | 0.837        |
|    learning_rate        | 1e-06        |
|    loss                 | 25.1         |
|    n_updates            | 5840         |
|    policy_gradient_loss | 4.91e-07     |
|    value_loss           | 155          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 586          |
|    time_elapsed         | 19162        |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 596          |
|    time_elapsed         | 19456        |
|    total_timesteps      | 305152       |
| train/                  |              |
|    approx_kl            | 0.0016289927 |
|    clip_fraction        | 0.00137      |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.11        |
|    explained_variance   | 0.899        |
|    learning_rate        | 1e-06        |
|    loss                 | 94.4         |
|    n_updates            | 5950         |
|    policy_gradient_loss | 0.000362     |
|    value_loss           | 214          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 597           |
|    time_elapsed         | 19489         |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 607           |
|    time_elapsed         | 19854         |
|    total_timesteps      | 310784        |
| train/                  |               |
|    approx_kl            | 0.00059904566 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.2          |
|    explained_variance   | -0.0667       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0673        |
|    n_updates            | 6060          |
|    policy_gradient_loss | -0.000987     |
|    value_loss           | 0.119         |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 608          |
|    time_elapsed         | 19889   

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 618          |
|    time_elapsed         | 20293        |
|    total_timesteps      | 316416       |
| train/                  |              |
|    approx_kl            | 0.0018594593 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.2         |
|    explained_variance   | 0.00108      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0573       |
|    n_updates            | 6170         |
|    policy_gradient_loss | -0.00152     |
|    value_loss           | 0.153        |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 619          |
|    time_elapsed         | 20338        |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 629           |
|    time_elapsed         | 20767         |
|    total_timesteps      | 322048        |
| train/                  |               |
|    approx_kl            | 4.8080343e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.22         |
|    explained_variance   | 0.852         |
|    learning_rate        | 1e-06         |
|    loss                 | 79            |
|    n_updates            | 6280          |
|    policy_gradient_loss | -0.000177     |
|    value_loss           | 142           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 630          |
|    time_elapsed         | 20806   

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 640          |
|    time_elapsed         | 21224        |
|    total_timesteps      | 327680       |
| train/                  |              |
|    approx_kl            | 0.0006787693 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.35        |
|    explained_variance   | -0.0183      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0387       |
|    n_updates            | 6390         |
|    policy_gradient_loss | -0.000808    |
|    value_loss           | 0.111        |
------------------------------------------
-----------------------------------------
| time/                   |             |
|    fps                  | 15          |
|    iterations           | 641         |
|    time_elapsed         | 21263       |
|    total_times

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 651          |
|    time_elapsed         | 21654        |
|    total_timesteps      | 333312       |
| train/                  |              |
|    approx_kl            | 0.0007289187 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.28        |
|    explained_variance   | 0.0563       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0514       |
|    n_updates            | 6500         |
|    policy_gradient_loss | -0.000687    |
|    value_loss           | 0.143        |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 652           |
|    time_elapsed         | 21687         |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 662           |
|    time_elapsed         | 22003         |
|    total_timesteps      | 338944        |
| train/                  |               |
|    approx_kl            | 0.00041777012 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.42         |
|    explained_variance   | -0.0554       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.215         |
|    n_updates            | 6610          |
|    policy_gradient_loss | -0.000495     |
|    value_loss           | 0.312         |
-------------------------------------------
-----------------------------------------
| time/                   |             |
|    fps                  | 15          |
|    iterations           | 663         |
|    time_elapsed         | 22033       

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 673          |
|    time_elapsed         | 22328        |
|    total_timesteps      | 344576       |
| train/                  |              |
|    approx_kl            | 0.0018603284 |
|    clip_fraction        | 0.00527      |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.32        |
|    explained_variance   | -0.166       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0677       |
|    n_updates            | 6720         |
|    policy_gradient_loss | -0.00327     |
|    value_loss           | 0.116        |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 674          |
|    time_elapsed         | 22357        |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 684          |
|    time_elapsed         | 22648        |
|    total_timesteps      | 350208       |
| train/                  |              |
|    approx_kl            | 0.0031082747 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.18        |
|    explained_variance   | -0.218       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0403       |
|    n_updates            | 6830         |
|    policy_gradient_loss | -0.00281     |
|    value_loss           | 0.182        |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 685          |
|    time_elapsed         | 22678        |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 695           |
|    time_elapsed         | 22968         |
|    total_timesteps      | 355840        |
| train/                  |               |
|    approx_kl            | 0.00027118693 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.14         |
|    explained_variance   | -0.0278       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0796        |
|    n_updates            | 6940          |
|    policy_gradient_loss | -0.000584     |
|    value_loss           | 0.12          |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 696           |
|    time_elapsed         | 2299

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 706          |
|    time_elapsed         | 23277        |
|    total_timesteps      | 361472       |
| train/                  |              |
|    approx_kl            | 0.0034403382 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.05        |
|    explained_variance   | -0.0456      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.1          |
|    n_updates            | 7050         |
|    policy_gradient_loss | -0.00283     |
|    value_loss           | 0.121        |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 707           |
|    time_elapsed         | 23305         |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 717           |
|    time_elapsed         | 23589         |
|    total_timesteps      | 367104        |
| train/                  |               |
|    approx_kl            | 0.00087109185 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.03         |
|    explained_variance   | -0.0993       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0471        |
|    n_updates            | 7160          |
|    policy_gradient_loss | -0.00153      |
|    value_loss           | 0.2           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 718           |
|    time_elapsed         | 2361

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 728          |
|    time_elapsed         | 23912        |
|    total_timesteps      | 372736       |
| train/                  |              |
|    approx_kl            | 0.0052712783 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.822       |
|    explained_variance   | 0.016        |
|    learning_rate        | 1e-06        |
|    loss                 | 0.121        |
|    n_updates            | 7270         |
|    policy_gradient_loss | -0.00449     |
|    value_loss           | 0.145        |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 729          |
|    time_elapsed         | 23942        |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 739          |
|    time_elapsed         | 24231        |
|    total_timesteps      | 378368       |
| train/                  |              |
|    approx_kl            | 0.0003239198 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.407       |
|    explained_variance   | 0.313        |
|    learning_rate        | 1e-06        |
|    loss                 | 81.1         |
|    n_updates            | 7380         |
|    policy_gradient_loss | 0.000847     |
|    value_loss           | 323          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 740          |
|    time_elapsed         | 24260        |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 750          |
|    time_elapsed         | 24542        |
|    total_timesteps      | 384000       |
| train/                  |              |
|    approx_kl            | 0.0021920968 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.825       |
|    explained_variance   | -0.171       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0599       |
|    n_updates            | 7490         |
|    policy_gradient_loss | -0.00188     |
|    value_loss           | 0.123        |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 751          |
|    time_elapsed         | 24571        |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 761          |
|    time_elapsed         | 24856        |
|    total_timesteps      | 389632       |
| train/                  |              |
|    approx_kl            | 8.489587e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.66        |
|    explained_variance   | 0.688        |
|    learning_rate        | 1e-06        |
|    loss                 | 31.4         |
|    n_updates            | 7600         |
|    policy_gradient_loss | 0.000433     |
|    value_loss           | 133          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 762           |
|    time_elapsed         | 24883         |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 772           |
|    time_elapsed         | 25166         |
|    total_timesteps      | 395264        |
| train/                  |               |
|    approx_kl            | 0.00038272352 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.701        |
|    explained_variance   | -0.265        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.343         |
|    n_updates            | 7710          |
|    policy_gradient_loss | -0.000107     |
|    value_loss           | 5.89          |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 773           |
|    time_elapsed         | 2519

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 783          |
|    time_elapsed         | 25492        |
|    total_timesteps      | 400896       |
| train/                  |              |
|    approx_kl            | 0.0030639418 |
|    clip_fraction        | 0.0189       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.863       |
|    explained_variance   | -0.0114      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0467       |
|    n_updates            | 7820         |
|    policy_gradient_loss | -0.00235     |
|    value_loss           | 0.111        |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 784          |
|    time_elapsed         | 25521        |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 794           |
|    time_elapsed         | 25815         |
|    total_timesteps      | 406528        |
| train/                  |               |
|    approx_kl            | 0.00035455707 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.02         |
|    explained_variance   | -0.0285       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.124         |
|    n_updates            | 7930          |
|    policy_gradient_loss | -0.000514     |
|    value_loss           | 0.304         |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 795          |
|    time_elapsed         | 25845   

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 805          |
|    time_elapsed         | 26139        |
|    total_timesteps      | 412160       |
| train/                  |              |
|    approx_kl            | 0.0036436692 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.02        |
|    explained_variance   | -0.343       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.23         |
|    n_updates            | 8040         |
|    policy_gradient_loss | -0.00242     |
|    value_loss           | 2.15         |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 806           |
|    time_elapsed         | 26168         |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 816          |
|    time_elapsed         | 26500        |
|    total_timesteps      | 417792       |
| train/                  |              |
|    approx_kl            | 0.0022621886 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.973       |
|    explained_variance   | -0.453       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.077        |
|    n_updates            | 8150         |
|    policy_gradient_loss | -0.00244     |
|    value_loss           | 0.202        |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 817           |
|    time_elapsed         | 26533         |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 827           |
|    time_elapsed         | 26832         |
|    total_timesteps      | 423424        |
| train/                  |               |
|    approx_kl            | 0.00054568634 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.949        |
|    explained_variance   | -0.151        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0695        |
|    n_updates            | 8260          |
|    policy_gradient_loss | -0.00112      |
|    value_loss           | 0.152         |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 828          |
|    time_elapsed         | 26860   

-----------------------------------------
| time/                   |             |
|    fps                  | 15          |
|    iterations           | 838         |
|    time_elapsed         | 27172       |
|    total_timesteps      | 429056      |
| train/                  |             |
|    approx_kl            | 0.000307056 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.967      |
|    explained_variance   | -0.152      |
|    learning_rate        | 1e-06       |
|    loss                 | 0.152       |
|    n_updates            | 8370        |
|    policy_gradient_loss | -0.000153   |
|    value_loss           | 0.765       |
-----------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 839          |
|    time_elapsed         | 27202        |
|    total_timesteps      | 4

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 849          |
|    time_elapsed         | 27549        |
|    total_timesteps      | 434688       |
| train/                  |              |
|    approx_kl            | 0.0029680333 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.02        |
|    explained_variance   | -0.164       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0526       |
|    n_updates            | 8480         |
|    policy_gradient_loss | -0.00182     |
|    value_loss           | 0.12         |
------------------------------------------
--------------------------------------------
| time/                   |                |
|    fps                  | 15             |
|    iterations           | 850            |
|    time_elapsed         | 27579          |
|

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 860          |
|    time_elapsed         | 27884        |
|    total_timesteps      | 440320       |
| train/                  |              |
|    approx_kl            | 0.0005435196 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.15        |
|    explained_variance   | -0.127       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0362       |
|    n_updates            | 8590         |
|    policy_gradient_loss | -0.00087     |
|    value_loss           | 0.117        |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 861          |
|    time_elapsed         | 27912        |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 871          |
|    time_elapsed         | 28207        |
|    total_timesteps      | 445952       |
| train/                  |              |
|    approx_kl            | 0.0047166776 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.23        |
|    explained_variance   | -0.0417      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0551       |
|    n_updates            | 8700         |
|    policy_gradient_loss | -0.00371     |
|    value_loss           | 0.175        |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 872           |
|    time_elapsed         | 28239         |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 882           |
|    time_elapsed         | 28556         |
|    total_timesteps      | 451584        |
| train/                  |               |
|    approx_kl            | 0.00013739662 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.969        |
|    explained_variance   | 0.533         |
|    learning_rate        | 1e-06         |
|    loss                 | 242           |
|    n_updates            | 8810          |
|    policy_gradient_loss | 0.000107      |
|    value_loss           | 407           |
-------------------------------------------
-----------------------------------------
| time/                   |             |
|    fps                  | 15          |
|    iterations           | 883         |
|    time_elapsed         | 28590       

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 893          |
|    time_elapsed         | 28941        |
|    total_timesteps      | 457216       |
| train/                  |              |
|    approx_kl            | 0.0005563318 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.18        |
|    explained_variance   | -0.118       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.104        |
|    n_updates            | 8920         |
|    policy_gradient_loss | -0.00134     |
|    value_loss           | 0.137        |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 894          |
|    time_elapsed         | 28976        |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 904          |
|    time_elapsed         | 29323        |
|    total_timesteps      | 462848       |
| train/                  |              |
|    approx_kl            | 0.0025633406 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.17        |
|    explained_variance   | -0.016       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0742       |
|    n_updates            | 9030         |
|    policy_gradient_loss | -0.00194     |
|    value_loss           | 0.28         |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 905           |
|    time_elapsed         | 29354         |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 915          |
|    time_elapsed         | 29655        |
|    total_timesteps      | 468480       |
| train/                  |              |
|    approx_kl            | 0.0018746679 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.23        |
|    explained_variance   | -0.125       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0656       |
|    n_updates            | 9140         |
|    policy_gradient_loss | -0.00233     |
|    value_loss           | 0.15         |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 916          |
|    time_elapsed         | 29683        |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 926          |
|    time_elapsed         | 29976        |
|    total_timesteps      | 474112       |
| train/                  |              |
|    approx_kl            | 0.0022974932 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.25        |
|    explained_variance   | -0.0396      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0532       |
|    n_updates            | 9250         |
|    policy_gradient_loss | -0.00303     |
|    value_loss           | 0.144        |
------------------------------------------
-----------------------------------------
| time/                   |             |
|    fps                  | 15          |
|    iterations           | 927         |
|    time_elapsed         | 30006       |
|    total_times

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 937          |
|    time_elapsed         | 30302        |
|    total_timesteps      | 479744       |
| train/                  |              |
|    approx_kl            | 0.0032169707 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.22        |
|    explained_variance   | -0.22        |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0945       |
|    n_updates            | 9360         |
|    policy_gradient_loss | -0.00216     |
|    value_loss           | 0.287        |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 938          |
|    time_elapsed         | 30330        |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 948           |
|    time_elapsed         | 30623         |
|    total_timesteps      | 485376        |
| train/                  |               |
|    approx_kl            | 0.00033926987 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.2          |
|    explained_variance   | -0.172        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.239         |
|    n_updates            | 9470          |
|    policy_gradient_loss | -5.52e-05     |
|    value_loss           | 0.472         |
-------------------------------------------
-----------------------------------------
| time/                   |             |
|    fps                  | 15          |
|    iterations           | 949         |
|    time_elapsed         | 30653       

-----------------------------------------
| time/                   |             |
|    fps                  | 15          |
|    iterations           | 959         |
|    time_elapsed         | 30943       |
|    total_timesteps      | 491008      |
| train/                  |             |
|    approx_kl            | 0.011144007 |
|    clip_fraction        | 0.0686      |
|    clip_range           | 0.2         |
|    entropy_loss         | -1.19       |
|    explained_variance   | -0.105      |
|    learning_rate        | 1e-06       |
|    loss                 | 0.0701      |
|    n_updates            | 9580        |
|    policy_gradient_loss | -0.0121     |
|    value_loss           | 0.108       |
-----------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 960           |
|    time_elapsed         | 30971         |
|    total_timesteps    

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 970          |
|    time_elapsed         | 31258        |
|    total_timesteps      | 496640       |
| train/                  |              |
|    approx_kl            | 0.0056771208 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.15        |
|    explained_variance   | -0.206       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0585       |
|    n_updates            | 9690         |
|    policy_gradient_loss | -0.00362     |
|    value_loss           | 0.238        |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 971          |
|    time_elapsed         | 31287        |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 981          |
|    time_elapsed         | 31594        |
|    total_timesteps      | 502272       |
| train/                  |              |
|    approx_kl            | 0.0031294967 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.07        |
|    explained_variance   | 0.0312       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0764       |
|    n_updates            | 9800         |
|    policy_gradient_loss | -0.00213     |
|    value_loss           | 0.432        |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 982           |
|    time_elapsed         | 31624         |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 992           |
|    time_elapsed         | 31938         |
|    total_timesteps      | 507904        |
| train/                  |               |
|    approx_kl            | 0.00055744837 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.05         |
|    explained_variance   | 0.0163        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.156         |
|    n_updates            | 9910          |
|    policy_gradient_loss | -0.000608     |
|    value_loss           | 0.38          |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 993          |
|    time_elapsed         | 31966   

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 1003         |
|    time_elapsed         | 32260        |
|    total_timesteps      | 513536       |
| train/                  |              |
|    approx_kl            | 7.080799e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.923       |
|    explained_variance   | 0.327        |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0686       |
|    n_updates            | 10020        |
|    policy_gradient_loss | -0.000164    |
|    value_loss           | 0.301        |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 1004          |
|    time_elapsed         | 32289         |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 1014         |
|    time_elapsed         | 32583        |
|    total_timesteps      | 519168       |
| train/                  |              |
|    approx_kl            | 0.0014247551 |
|    clip_fraction        | 0.00176      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.858       |
|    explained_variance   | -0.149       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0605       |
|    n_updates            | 10130        |
|    policy_gradient_loss | -0.00171     |
|    value_loss           | 0.423        |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 1015          |
|    time_elapsed         | 32612         |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 1025         |
|    time_elapsed         | 32909        |
|    total_timesteps      | 524800       |
| train/                  |              |
|    approx_kl            | 0.0002326566 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.904       |
|    explained_variance   | 0.74         |
|    learning_rate        | 1e-06        |
|    loss                 | 236          |
|    n_updates            | 10240        |
|    policy_gradient_loss | 0.000562     |
|    value_loss           | 331          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 1026          |
|    time_elapsed         | 32940         |
|    t

-----------------------------------------
| time/                   |             |
|    fps                  | 15          |
|    iterations           | 1036        |
|    time_elapsed         | 33236       |
|    total_timesteps      | 530432      |
| train/                  |             |
|    approx_kl            | 0.001035758 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.954      |
|    explained_variance   | 0.14        |
|    learning_rate        | 1e-06       |
|    loss                 | 0.0757      |
|    n_updates            | 10350       |
|    policy_gradient_loss | -0.000894   |
|    value_loss           | 0.173       |
-----------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 1037         |
|    time_elapsed         | 33265        |
|    total_timesteps      | 5

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 1047         |
|    time_elapsed         | 33558        |
|    total_timesteps      | 536064       |
| train/                  |              |
|    approx_kl            | 0.0006332196 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.715       |
|    explained_variance   | -0.0253      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.203        |
|    n_updates            | 10460        |
|    policy_gradient_loss | -0.000813    |
|    value_loss           | 1.68         |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 1048          |
|    time_elapsed         | 33588         |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 15           |
|    iterations           | 1058         |
|    time_elapsed         | 33893        |
|    total_timesteps      | 541696       |
| train/                  |              |
|    approx_kl            | 9.138486e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.401       |
|    explained_variance   | -0.159       |
|    learning_rate        | 1e-06        |
|    loss                 | 286          |
|    n_updates            | 10570        |
|    policy_gradient_loss | -0.000106    |
|    value_loss           | 756          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 1059          |
|    time_elapsed         | 33924         |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 1069          |
|    time_elapsed         | 34218         |
|    total_timesteps      | 547328        |
| train/                  |               |
|    approx_kl            | 2.7863076e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.435        |
|    explained_variance   | 0.76          |
|    learning_rate        | 1e-06         |
|    loss                 | 156           |
|    n_updates            | 10680         |
|    policy_gradient_loss | -0.000178     |
|    value_loss           | 249           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 15            |
|    iterations           | 1070          |
|    time_elapsed         | 3424

-------------------------------------------
| time/                   |               |
|    fps                  | 16            |
|    iterations           | 1080          |
|    time_elapsed         | 34541         |
|    total_timesteps      | 552960        |
| train/                  |               |
|    approx_kl            | 2.4252804e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.44         |
|    explained_variance   | 0.195         |
|    learning_rate        | 1e-06         |
|    loss                 | 344           |
|    n_updates            | 10790         |
|    policy_gradient_loss | -0.000144     |
|    value_loss           | 885           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 16            |
|    iterations           | 1081          |
|    time_elapsed         | 3457

-------------------------------------------
| time/                   |               |
|    fps                  | 16            |
|    iterations           | 1091          |
|    time_elapsed         | 34869         |
|    total_timesteps      | 558592        |
| train/                  |               |
|    approx_kl            | 0.00013448647 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.351        |
|    explained_variance   | -0.0755       |
|    learning_rate        | 1e-06         |
|    loss                 | 269           |
|    n_updates            | 10900         |
|    policy_gradient_loss | 0.000376      |
|    value_loss           | 567           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 16            |
|    iterations           | 1092          |
|    time_elapsed         | 3490

-------------------------------------------
| time/                   |               |
|    fps                  | 16            |
|    iterations           | 1102          |
|    time_elapsed         | 35193         |
|    total_timesteps      | 564224        |
| train/                  |               |
|    approx_kl            | 1.7694896e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.418        |
|    explained_variance   | 0.777         |
|    learning_rate        | 1e-06         |
|    loss                 | 175           |
|    n_updates            | 11010         |
|    policy_gradient_loss | -7.66e-05     |
|    value_loss           | 336           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 16            |
|    iterations           | 1103          |
|    time_elapsed         | 3522

------------------------------------------
| time/                   |              |
|    fps                  | 16           |
|    iterations           | 1113         |
|    time_elapsed         | 35509        |
|    total_timesteps      | 569856       |
| train/                  |              |
|    approx_kl            | 4.138227e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.333       |
|    explained_variance   | 0.277        |
|    learning_rate        | 1e-06        |
|    loss                 | 110          |
|    n_updates            | 11120        |
|    policy_gradient_loss | 0.000196     |
|    value_loss           | 859          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 16           |
|    iterations           | 1114         |
|    time_elapsed         | 35540        |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 16            |
|    iterations           | 1124          |
|    time_elapsed         | 35834         |
|    total_timesteps      | 575488        |
| train/                  |               |
|    approx_kl            | 0.00025953096 |
|    clip_fraction        | 0.0043        |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.544        |
|    explained_variance   | 0.852         |
|    learning_rate        | 1e-06         |
|    loss                 | 18.2          |
|    n_updates            | 11230         |
|    policy_gradient_loss | 0.000786      |
|    value_loss           | 97.3          |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 16           |
|    iterations           | 1125         |
|    time_elapsed         | 35862   

------------------------------------------
| time/                   |              |
|    fps                  | 16           |
|    iterations           | 1135         |
|    time_elapsed         | 36155        |
|    total_timesteps      | 581120       |
| train/                  |              |
|    approx_kl            | 0.0021719863 |
|    clip_fraction        | 0.025        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.453       |
|    explained_variance   | 0.838        |
|    learning_rate        | 1e-06        |
|    loss                 | 62.2         |
|    n_updates            | 11340        |
|    policy_gradient_loss | -0.00247     |
|    value_loss           | 173          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 16           |
|    iterations           | 1136         |
|    time_elapsed         | 36185        |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 16            |
|    iterations           | 1146          |
|    time_elapsed         | 36484         |
|    total_timesteps      | 586752        |
| train/                  |               |
|    approx_kl            | 2.2717286e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.243        |
|    explained_variance   | 0.0367        |
|    learning_rate        | 1e-06         |
|    loss                 | 607           |
|    n_updates            | 11450         |
|    policy_gradient_loss | -9.34e-05     |
|    value_loss           | 782           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 16            |
|    iterations           | 1147          |
|    time_elapsed         | 3651

------------------------------------------
| time/                   |              |
|    fps                  | 16           |
|    iterations           | 1157         |
|    time_elapsed         | 36806        |
|    total_timesteps      | 592384       |
| train/                  |              |
|    approx_kl            | 0.0009629483 |
|    clip_fraction        | 0.000977     |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.304       |
|    explained_variance   | 0.811        |
|    learning_rate        | 1e-06        |
|    loss                 | 81.9         |
|    n_updates            | 11560        |
|    policy_gradient_loss | 6.13e-06     |
|    value_loss           | 215          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 16           |
|    iterations           | 1158         |
|    time_elapsed         | 36837        |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 16            |
|    iterations           | 1168          |
|    time_elapsed         | 37126         |
|    total_timesteps      | 598016        |
| train/                  |               |
|    approx_kl            | 0.00041845825 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.26         |
|    explained_variance   | 0.315         |
|    learning_rate        | 1e-06         |
|    loss                 | 207           |
|    n_updates            | 11670         |
|    policy_gradient_loss | -0.00113      |
|    value_loss           | 388           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 16            |
|    iterations           | 1169          |
|    time_elapsed         | 3715

-------------------------------------------
| time/                   |               |
|    fps                  | 16            |
|    iterations           | 1179          |
|    time_elapsed         | 37448         |
|    total_timesteps      | 603648        |
| train/                  |               |
|    approx_kl            | 0.00028267142 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.284        |
|    explained_variance   | 0.201         |
|    learning_rate        | 1e-06         |
|    loss                 | 421           |
|    n_updates            | 11780         |
|    policy_gradient_loss | -0.000363     |
|    value_loss           | 855           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 16           |
|    iterations           | 1180         |
|    time_elapsed         | 37477   

-------------------------------------------
| time/                   |               |
|    fps                  | 16            |
|    iterations           | 1190          |
|    time_elapsed         | 37764         |
|    total_timesteps      | 609280        |
| train/                  |               |
|    approx_kl            | 0.00062964414 |
|    clip_fraction        | 0.00176       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.36         |
|    explained_variance   | 0.698         |
|    learning_rate        | 1e-06         |
|    loss                 | 32.3          |
|    n_updates            | 11890         |
|    policy_gradient_loss | -0.00207      |
|    value_loss           | 160           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 16           |
|    iterations           | 1191         |
|    time_elapsed         | 37793   

------------------------------------------
| time/                   |              |
|    fps                  | 16           |
|    iterations           | 1201         |
|    time_elapsed         | 38089        |
|    total_timesteps      | 614912       |
| train/                  |              |
|    approx_kl            | 0.0011777122 |
|    clip_fraction        | 0.00801      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.221       |
|    explained_variance   | 0.688        |
|    learning_rate        | 1e-06        |
|    loss                 | 192          |
|    n_updates            | 12000        |
|    policy_gradient_loss | -0.00204     |
|    value_loss           | 312          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 16           |
|    iterations           | 1202         |
|    time_elapsed         | 38120        |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 16           |
|    iterations           | 1212         |
|    time_elapsed         | 38416        |
|    total_timesteps      | 620544       |
| train/                  |              |
|    approx_kl            | 0.0005726388 |
|    clip_fraction        | 0.00137      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.167       |
|    explained_variance   | 0.228        |
|    learning_rate        | 1e-06        |
|    loss                 | 164          |
|    n_updates            | 12110        |
|    policy_gradient_loss | -0.000882    |
|    value_loss           | 820          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 16           |
|    iterations           | 1213         |
|    time_elapsed         | 38444        |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 16           |
|    iterations           | 1223         |
|    time_elapsed         | 38735        |
|    total_timesteps      | 626176       |
| train/                  |              |
|    approx_kl            | 0.0004597291 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.298       |
|    explained_variance   | 0.893        |
|    learning_rate        | 1e-06        |
|    loss                 | 60           |
|    n_updates            | 12220        |
|    policy_gradient_loss | -0.000502    |
|    value_loss           | 200          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 16            |
|    iterations           | 1224          |
|    time_elapsed         | 38764         |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 16           |
|    iterations           | 1234         |
|    time_elapsed         | 39051        |
|    total_timesteps      | 631808       |
| train/                  |              |
|    approx_kl            | 0.0005188718 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.391       |
|    explained_variance   | 0.914        |
|    learning_rate        | 1e-06        |
|    loss                 | 73.4         |
|    n_updates            | 12330        |
|    policy_gradient_loss | -0.000658    |
|    value_loss           | 186          |
------------------------------------------
-----------------------------------------
| time/                   |             |
|    fps                  | 16          |
|    iterations           | 1235        |
|    time_elapsed         | 39080       |
|    total_times

-------------------------------------------
| time/                   |               |
|    fps                  | 16            |
|    iterations           | 1245          |
|    time_elapsed         | 39366         |
|    total_timesteps      | 637440        |
| train/                  |               |
|    approx_kl            | 0.00015080709 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.332        |
|    explained_variance   | 0.451         |
|    learning_rate        | 1e-06         |
|    loss                 | 213           |
|    n_updates            | 12440         |
|    policy_gradient_loss | -0.000907     |
|    value_loss           | 480           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 16            |
|    iterations           | 1246          |
|    time_elapsed         | 3939

------------------------------------------
| time/                   |              |
|    fps                  | 16           |
|    iterations           | 1256         |
|    time_elapsed         | 39683        |
|    total_timesteps      | 643072       |
| train/                  |              |
|    approx_kl            | 5.812035e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.222       |
|    explained_variance   | 0.755        |
|    learning_rate        | 1e-06        |
|    loss                 | 128          |
|    n_updates            | 12550        |
|    policy_gradient_loss | 2.34e-06     |
|    value_loss           | 423          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 16            |
|    iterations           | 1257          |
|    time_elapsed         | 39711         |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 16           |
|    iterations           | 1267         |
|    time_elapsed         | 40001        |
|    total_timesteps      | 648704       |
| train/                  |              |
|    approx_kl            | 3.433251e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.245       |
|    explained_variance   | 0.538        |
|    learning_rate        | 1e-06        |
|    loss                 | 144          |
|    n_updates            | 12660        |
|    policy_gradient_loss | -0.000173    |
|    value_loss           | 336          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 16            |
|    iterations           | 1268          |
|    time_elapsed         | 40032         |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 8             |
|    iterations           | 1278          |
|    time_elapsed         | 81449         |
|    total_timesteps      | 654336        |
| train/                  |               |
|    approx_kl            | 0.00075915584 |
|    clip_fraction        | 0.0145        |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.241        |
|    explained_variance   | 0.766         |
|    learning_rate        | 1e-06         |
|    loss                 | 151           |
|    n_updates            | 12770         |
|    policy_gradient_loss | -0.00215      |
|    value_loss           | 275           |
-------------------------------------------
-----------------------------------------
| time/                   |             |
|    fps                  | 8           |
|    iterations           | 1279        |
|    time_elapsed         | 81488       

------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1289         |
|    time_elapsed         | 81863        |
|    total_timesteps      | 659968       |
| train/                  |              |
|    approx_kl            | 0.0016858286 |
|    clip_fraction        | 0.0162       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.28        |
|    explained_variance   | 0.541        |
|    learning_rate        | 1e-06        |
|    loss                 | 126          |
|    n_updates            | 12880        |
|    policy_gradient_loss | -0.00213     |
|    value_loss           | 356          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1290         |
|    time_elapsed         | 81897        |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 8             |
|    iterations           | 1300          |
|    time_elapsed         | 82289         |
|    total_timesteps      | 665600        |
| train/                  |               |
|    approx_kl            | 0.00029750296 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.259        |
|    explained_variance   | 0.259         |
|    learning_rate        | 1e-06         |
|    loss                 | 437           |
|    n_updates            | 12990         |
|    policy_gradient_loss | -0.000554     |
|    value_loss           | 865           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1301         |
|    time_elapsed         | 82322   

-------------------------------------------
| time/                   |               |
|    fps                  | 8             |
|    iterations           | 1311          |
|    time_elapsed         | 82672         |
|    total_timesteps      | 671232        |
| train/                  |               |
|    approx_kl            | 0.00020298758 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.24         |
|    explained_variance   | 0.478         |
|    learning_rate        | 1e-06         |
|    loss                 | 304           |
|    n_updates            | 13100         |
|    policy_gradient_loss | -0.000245     |
|    value_loss           | 510           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 8             |
|    iterations           | 1312          |
|    time_elapsed         | 8271

-------------------------------------------
| time/                   |               |
|    fps                  | 8             |
|    iterations           | 1322          |
|    time_elapsed         | 83049         |
|    total_timesteps      | 676864        |
| train/                  |               |
|    approx_kl            | 0.00014107022 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.245        |
|    explained_variance   | 0.44          |
|    learning_rate        | 1e-06         |
|    loss                 | 107           |
|    n_updates            | 13210         |
|    policy_gradient_loss | 1.58e-05      |
|    value_loss           | 180           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 8             |
|    iterations           | 1323          |
|    time_elapsed         | 8308

------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1333         |
|    time_elapsed         | 83571        |
|    total_timesteps      | 682496       |
| train/                  |              |
|    approx_kl            | 0.0012378937 |
|    clip_fraction        | 0.00332      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.301       |
|    explained_variance   | 0.252        |
|    learning_rate        | 1e-06        |
|    loss                 | 357          |
|    n_updates            | 13320        |
|    policy_gradient_loss | -0.00173     |
|    value_loss           | 700          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 8             |
|    iterations           | 1334          |
|    time_elapsed         | 83613         |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1344         |
|    time_elapsed         | 84005        |
|    total_timesteps      | 688128       |
| train/                  |              |
|    approx_kl            | 0.0013873588 |
|    clip_fraction        | 0.00176      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.518       |
|    explained_variance   | 0.737        |
|    learning_rate        | 1e-06        |
|    loss                 | 67.9         |
|    n_updates            | 13430        |
|    policy_gradient_loss | -0.000881    |
|    value_loss           | 95.3         |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1345         |
|    time_elapsed         | 84040        |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1355         |
|    time_elapsed         | 84460        |
|    total_timesteps      | 693760       |
| train/                  |              |
|    approx_kl            | 1.771038e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.341       |
|    explained_variance   | 0.75         |
|    learning_rate        | 1e-06        |
|    loss                 | 141          |
|    n_updates            | 13540        |
|    policy_gradient_loss | 0.000197     |
|    value_loss           | 251          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 8             |
|    iterations           | 1356          |
|    time_elapsed         | 84504         |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1366         |
|    time_elapsed         | 84950        |
|    total_timesteps      | 699392       |
| train/                  |              |
|    approx_kl            | 7.370324e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.243       |
|    explained_variance   | 0.778        |
|    learning_rate        | 1e-06        |
|    loss                 | 172          |
|    n_updates            | 13650        |
|    policy_gradient_loss | -0.000159    |
|    value_loss           | 293          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1367         |
|    time_elapsed         | 84987        |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 8             |
|    iterations           | 1377          |
|    time_elapsed         | 85452         |
|    total_timesteps      | 705024        |
| train/                  |               |
|    approx_kl            | 0.00031521742 |
|    clip_fraction        | 0.000195      |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.207        |
|    explained_variance   | 0.769         |
|    learning_rate        | 1e-06         |
|    loss                 | 177           |
|    n_updates            | 13760         |
|    policy_gradient_loss | -0.000941     |
|    value_loss           | 344           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1378         |
|    time_elapsed         | 85489   

-------------------------------------------
| time/                   |               |
|    fps                  | 8             |
|    iterations           | 1388          |
|    time_elapsed         | 85882         |
|    total_timesteps      | 710656        |
| train/                  |               |
|    approx_kl            | 0.00064432644 |
|    clip_fraction        | 0.000195      |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.211        |
|    explained_variance   | 0.625         |
|    learning_rate        | 1e-06         |
|    loss                 | 108           |
|    n_updates            | 13870         |
|    policy_gradient_loss | -0.000489     |
|    value_loss           | 335           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 8             |
|    iterations           | 1389          |
|    time_elapsed         | 8592

-------------------------------------------
| time/                   |               |
|    fps                  | 8             |
|    iterations           | 1399          |
|    time_elapsed         | 86285         |
|    total_timesteps      | 716288        |
| train/                  |               |
|    approx_kl            | 0.00012716337 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.216        |
|    explained_variance   | 0.66          |
|    learning_rate        | 1e-06         |
|    loss                 | 283           |
|    n_updates            | 13980         |
|    policy_gradient_loss | -0.000191     |
|    value_loss           | 606           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1400         |
|    time_elapsed         | 86327   

------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1410         |
|    time_elapsed         | 86703        |
|    total_timesteps      | 721920       |
| train/                  |              |
|    approx_kl            | 0.0007804221 |
|    clip_fraction        | 0.000195     |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.224       |
|    explained_variance   | 0.795        |
|    learning_rate        | 1e-06        |
|    loss                 | 145          |
|    n_updates            | 14090        |
|    policy_gradient_loss | -0.000689    |
|    value_loss           | 331          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1411         |
|    time_elapsed         | 86741        |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 8             |
|    iterations           | 1421          |
|    time_elapsed         | 87123         |
|    total_timesteps      | 727552        |
| train/                  |               |
|    approx_kl            | 0.00036237238 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.188        |
|    explained_variance   | 0.347         |
|    learning_rate        | 1e-06         |
|    loss                 | 528           |
|    n_updates            | 14200         |
|    policy_gradient_loss | -0.000437     |
|    value_loss           | 669           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1422         |
|    time_elapsed         | 87160   

-------------------------------------------
| time/                   |               |
|    fps                  | 8             |
|    iterations           | 1432          |
|    time_elapsed         | 87537         |
|    total_timesteps      | 733184        |
| train/                  |               |
|    approx_kl            | 0.00058732636 |
|    clip_fraction        | 0.00352       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.137        |
|    explained_variance   | 0.853         |
|    learning_rate        | 1e-06         |
|    loss                 | 83.2          |
|    n_updates            | 14310         |
|    policy_gradient_loss | -0.000471     |
|    value_loss           | 364           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 8             |
|    iterations           | 1433          |
|    time_elapsed         | 8756

------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1443         |
|    time_elapsed         | 87873        |
|    total_timesteps      | 738816       |
| train/                  |              |
|    approx_kl            | 0.0019480371 |
|    clip_fraction        | 0.0127       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.25        |
|    explained_variance   | 0.74         |
|    learning_rate        | 1e-06        |
|    loss                 | 146          |
|    n_updates            | 14420        |
|    policy_gradient_loss | -0.00233     |
|    value_loss           | 319          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1444         |
|    time_elapsed         | 87911        |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1454         |
|    time_elapsed         | 88295        |
|    total_timesteps      | 744448       |
| train/                  |              |
|    approx_kl            | 0.0012655839 |
|    clip_fraction        | 0.00664      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.294       |
|    explained_variance   | 0.595        |
|    learning_rate        | 1e-06        |
|    loss                 | 384          |
|    n_updates            | 14530        |
|    policy_gradient_loss | -0.00132     |
|    value_loss           | 601          |
------------------------------------------
-----------------------------------------
| time/                   |             |
|    fps                  | 8           |
|    iterations           | 1455        |
|    time_elapsed         | 88334       |
|    total_times

------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1465         |
|    time_elapsed         | 88704        |
|    total_timesteps      | 750080       |
| train/                  |              |
|    approx_kl            | 0.0003730394 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.522       |
|    explained_variance   | 0.079        |
|    learning_rate        | 1e-06        |
|    loss                 | 5.96         |
|    n_updates            | 14640        |
|    policy_gradient_loss | -0.000109    |
|    value_loss           | 66.6         |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1466         |
|    time_elapsed         | 88741        |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1476         |
|    time_elapsed         | 89089        |
|    total_timesteps      | 755712       |
| train/                  |              |
|    approx_kl            | 0.0003177562 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.413       |
|    explained_variance   | 0.909        |
|    learning_rate        | 1e-06        |
|    loss                 | 84.6         |
|    n_updates            | 14750        |
|    policy_gradient_loss | -0.00122     |
|    value_loss           | 163          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 8             |
|    iterations           | 1477          |
|    time_elapsed         | 89121         |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 8             |
|    iterations           | 1487          |
|    time_elapsed         | 89483         |
|    total_timesteps      | 761344        |
| train/                  |               |
|    approx_kl            | 0.00027320255 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.358        |
|    explained_variance   | 0.751         |
|    learning_rate        | 1e-06         |
|    loss                 | 274           |
|    n_updates            | 14860         |
|    policy_gradient_loss | -0.00055      |
|    value_loss           | 746           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1488         |
|    time_elapsed         | 89518   

-------------------------------------------
| time/                   |               |
|    fps                  | 8             |
|    iterations           | 1498          |
|    time_elapsed         | 89857         |
|    total_timesteps      | 766976        |
| train/                  |               |
|    approx_kl            | 2.8202427e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.24         |
|    explained_variance   | 0.688         |
|    learning_rate        | 1e-06         |
|    loss                 | 44.3          |
|    n_updates            | 14970         |
|    policy_gradient_loss | -4.94e-05     |
|    value_loss           | 104           |
-------------------------------------------
--------------------------------------------
| time/                   |                |
|    fps                  | 8              |
|    iterations           | 1499           |
|    time_elapsed         | 

-------------------------------------------
| time/                   |               |
|    fps                  | 8             |
|    iterations           | 1509          |
|    time_elapsed         | 90241         |
|    total_timesteps      | 772608        |
| train/                  |               |
|    approx_kl            | 0.00093323784 |
|    clip_fraction        | 0.000586      |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.291        |
|    explained_variance   | 0.222         |
|    learning_rate        | 1e-06         |
|    loss                 | 699           |
|    n_updates            | 15080         |
|    policy_gradient_loss | -0.00066      |
|    value_loss           | 996           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1510         |
|    time_elapsed         | 90272   

-------------------------------------------
| time/                   |               |
|    fps                  | 8             |
|    iterations           | 1520          |
|    time_elapsed         | 90641         |
|    total_timesteps      | 778240        |
| train/                  |               |
|    approx_kl            | 0.00034489168 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.265        |
|    explained_variance   | 0.429         |
|    learning_rate        | 1e-06         |
|    loss                 | 141           |
|    n_updates            | 15190         |
|    policy_gradient_loss | -0.000754     |
|    value_loss           | 377           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 8             |
|    iterations           | 1521          |
|    time_elapsed         | 9067

-------------------------------------------
| time/                   |               |
|    fps                  | 8             |
|    iterations           | 1531          |
|    time_elapsed         | 90996         |
|    total_timesteps      | 783872        |
| train/                  |               |
|    approx_kl            | 0.00018486357 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.16         |
|    explained_variance   | 0.4           |
|    learning_rate        | 1e-06         |
|    loss                 | 89.1          |
|    n_updates            | 15300         |
|    policy_gradient_loss | -0.000289     |
|    value_loss           | 205           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 8             |
|    iterations           | 1532          |
|    time_elapsed         | 9102

------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1542         |
|    time_elapsed         | 91365        |
|    total_timesteps      | 789504       |
| train/                  |              |
|    approx_kl            | 8.177885e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.154       |
|    explained_variance   | 0.84         |
|    learning_rate        | 1e-06        |
|    loss                 | 92.9         |
|    n_updates            | 15410        |
|    policy_gradient_loss | -0.000103    |
|    value_loss           | 200          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 8             |
|    iterations           | 1543          |
|    time_elapsed         | 91397         |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 8             |
|    iterations           | 1553          |
|    time_elapsed         | 91748         |
|    total_timesteps      | 795136        |
| train/                  |               |
|    approx_kl            | 5.3008436e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.172        |
|    explained_variance   | 0.563         |
|    learning_rate        | 1e-06         |
|    loss                 | 78.5          |
|    n_updates            | 15520         |
|    policy_gradient_loss | -0.000263     |
|    value_loss           | 201           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1554         |
|    time_elapsed         | 91787   

-------------------------------------------
| time/                   |               |
|    fps                  | 8             |
|    iterations           | 1564          |
|    time_elapsed         | 92166         |
|    total_timesteps      | 800768        |
| train/                  |               |
|    approx_kl            | 0.00010802422 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.263        |
|    explained_variance   | 0.748         |
|    learning_rate        | 1e-06         |
|    loss                 | 98.1          |
|    n_updates            | 15630         |
|    policy_gradient_loss | -0.000268     |
|    value_loss           | 239           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 8             |
|    iterations           | 1565          |
|    time_elapsed         | 9220

------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1575         |
|    time_elapsed         | 92578        |
|    total_timesteps      | 806400       |
| train/                  |              |
|    approx_kl            | 0.0005029085 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.462       |
|    explained_variance   | 0.757        |
|    learning_rate        | 1e-06        |
|    loss                 | 90.3         |
|    n_updates            | 15740        |
|    policy_gradient_loss | -0.000422    |
|    value_loss           | 203          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1576         |
|    time_elapsed         | 92616        |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1586         |
|    time_elapsed         | 93003        |
|    total_timesteps      | 812032       |
| train/                  |              |
|    approx_kl            | 0.0011743755 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.361       |
|    explained_variance   | 0.88         |
|    learning_rate        | 1e-06        |
|    loss                 | 168          |
|    n_updates            | 15850        |
|    policy_gradient_loss | -0.000664    |
|    value_loss           | 245          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1587         |
|    time_elapsed         | 93037        |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1597         |
|    time_elapsed         | 93392        |
|    total_timesteps      | 817664       |
| train/                  |              |
|    approx_kl            | 8.255243e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.309       |
|    explained_variance   | 0.938        |
|    learning_rate        | 1e-06        |
|    loss                 | 133          |
|    n_updates            | 15960        |
|    policy_gradient_loss | -0.000185    |
|    value_loss           | 236          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1598         |
|    time_elapsed         | 93429        |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1608         |
|    time_elapsed         | 93754        |
|    total_timesteps      | 823296       |
| train/                  |              |
|    approx_kl            | 9.895663e-05 |
|    clip_fraction        | 0.000586     |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.279       |
|    explained_variance   | 0.261        |
|    learning_rate        | 1e-06        |
|    loss                 | 438          |
|    n_updates            | 16070        |
|    policy_gradient_loss | -4.27e-05    |
|    value_loss           | 1.53e+03     |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1609         |
|    time_elapsed         | 93782        |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1619         |
|    time_elapsed         | 94114        |
|    total_timesteps      | 828928       |
| train/                  |              |
|    approx_kl            | 0.0003085517 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.278       |
|    explained_variance   | 0.694        |
|    learning_rate        | 1e-06        |
|    loss                 | 287          |
|    n_updates            | 16180        |
|    policy_gradient_loss | -0.000527    |
|    value_loss           | 626          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 8             |
|    iterations           | 1620          |
|    time_elapsed         | 94147         |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 8             |
|    iterations           | 1630          |
|    time_elapsed         | 94451         |
|    total_timesteps      | 834560        |
| train/                  |               |
|    approx_kl            | 0.00053334027 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.276        |
|    explained_variance   | 0.885         |
|    learning_rate        | 1e-06         |
|    loss                 | 43.9          |
|    n_updates            | 16290         |
|    policy_gradient_loss | -0.000267     |
|    value_loss           | 129           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 8             |
|    iterations           | 1631          |
|    time_elapsed         | 9448

------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1641         |
|    time_elapsed         | 94791        |
|    total_timesteps      | 840192       |
| train/                  |              |
|    approx_kl            | 0.0006652913 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.282       |
|    explained_variance   | 0.779        |
|    learning_rate        | 1e-06        |
|    loss                 | 117          |
|    n_updates            | 16400        |
|    policy_gradient_loss | -0.000391    |
|    value_loss           | 216          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 8             |
|    iterations           | 1642          |
|    time_elapsed         | 94822         |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1652         |
|    time_elapsed         | 95122        |
|    total_timesteps      | 845824       |
| train/                  |              |
|    approx_kl            | 0.0018303512 |
|    clip_fraction        | 0.0342       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.337       |
|    explained_variance   | 0.785        |
|    learning_rate        | 1e-06        |
|    loss                 | 129          |
|    n_updates            | 16510        |
|    policy_gradient_loss | -0.00332     |
|    value_loss           | 244          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1653         |
|    time_elapsed         | 95151        |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1663         |
|    time_elapsed         | 95454        |
|    total_timesteps      | 851456       |
| train/                  |              |
|    approx_kl            | 0.0005957434 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.251       |
|    explained_variance   | 0.392        |
|    learning_rate        | 1e-06        |
|    loss                 | 165          |
|    n_updates            | 16620        |
|    policy_gradient_loss | -0.000611    |
|    value_loss           | 244          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 8             |
|    iterations           | 1664          |
|    time_elapsed         | 95486         |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1674         |
|    time_elapsed         | 95789        |
|    total_timesteps      | 857088       |
| train/                  |              |
|    approx_kl            | 0.0010085327 |
|    clip_fraction        | 0.00293      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.298       |
|    explained_variance   | 0.799        |
|    learning_rate        | 1e-06        |
|    loss                 | 97.3         |
|    n_updates            | 16730        |
|    policy_gradient_loss | -0.00282     |
|    value_loss           | 259          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1675         |
|    time_elapsed         | 95818        |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 8            |
|    iterations           | 1685         |
|    time_elapsed         | 96119        |
|    total_timesteps      | 862720       |
| train/                  |              |
|    approx_kl            | 0.0011469459 |
|    clip_fraction        | 0.00176      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.503       |
|    explained_variance   | -0.162       |
|    learning_rate        | 1e-06        |
|    loss                 | 2.03         |
|    n_updates            | 16840        |
|    policy_gradient_loss | -5.27e-05    |
|    value_loss           | 60.9         |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 8             |
|    iterations           | 1686          |
|    time_elapsed         | 96150         |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 1696         |
|    time_elapsed         | 96451        |
|    total_timesteps      | 868352       |
| train/                  |              |
|    approx_kl            | 0.0005388835 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.483       |
|    explained_variance   | 0.682        |
|    learning_rate        | 1e-06        |
|    loss                 | 273          |
|    n_updates            | 16950        |
|    policy_gradient_loss | -0.000395    |
|    value_loss           | 712          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 1697          |
|    time_elapsed         | 96479         |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 1707         |
|    time_elapsed         | 96806        |
|    total_timesteps      | 873984       |
| train/                  |              |
|    approx_kl            | 0.0005021059 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.414       |
|    explained_variance   | 0.727        |
|    learning_rate        | 1e-06        |
|    loss                 | 200          |
|    n_updates            | 17060        |
|    policy_gradient_loss | -0.000556    |
|    value_loss           | 487          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 1708         |
|    time_elapsed         | 96841        |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 1718         |
|    time_elapsed         | 97187        |
|    total_timesteps      | 879616       |
| train/                  |              |
|    approx_kl            | 0.0014327904 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.623       |
|    explained_variance   | -0.0253      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.658        |
|    n_updates            | 17170        |
|    policy_gradient_loss | -0.000497    |
|    value_loss           | 3.02         |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 1719          |
|    time_elapsed         | 97218         |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 1729         |
|    time_elapsed         | 97556        |
|    total_timesteps      | 885248       |
| train/                  |              |
|    approx_kl            | 7.095758e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.51        |
|    explained_variance   | 0.901        |
|    learning_rate        | 1e-06        |
|    loss                 | 277          |
|    n_updates            | 17280        |
|    policy_gradient_loss | -2.93e-05    |
|    value_loss           | 399          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 1730          |
|    time_elapsed         | 97599         |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 1740          |
|    time_elapsed         | 97940         |
|    total_timesteps      | 890880        |
| train/                  |               |
|    approx_kl            | 3.9307633e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.399        |
|    explained_variance   | 0.788         |
|    learning_rate        | 1e-06         |
|    loss                 | 152           |
|    n_updates            | 17390         |
|    policy_gradient_loss | -0.000128     |
|    value_loss           | 388           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 1741          |
|    time_elapsed         | 9797

-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 1751          |
|    time_elapsed         | 98295         |
|    total_timesteps      | 896512        |
| train/                  |               |
|    approx_kl            | 2.7193222e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.358        |
|    explained_variance   | 0.688         |
|    learning_rate        | 1e-06         |
|    loss                 | 445           |
|    n_updates            | 17500         |
|    policy_gradient_loss | -2.27e-05     |
|    value_loss           | 842           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 1752          |
|    time_elapsed         | 9833

-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 1762          |
|    time_elapsed         | 98667         |
|    total_timesteps      | 902144        |
| train/                  |               |
|    approx_kl            | 0.00053205865 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.327        |
|    explained_variance   | 0.313         |
|    learning_rate        | 1e-06         |
|    loss                 | 333           |
|    n_updates            | 17610         |
|    policy_gradient_loss | -0.000842     |
|    value_loss           | 886           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 1763          |
|    time_elapsed         | 9870

------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 1773         |
|    time_elapsed         | 99022        |
|    total_timesteps      | 907776       |
| train/                  |              |
|    approx_kl            | 9.495532e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.25        |
|    explained_variance   | 0.0987       |
|    learning_rate        | 1e-06        |
|    loss                 | 582          |
|    n_updates            | 17720        |
|    policy_gradient_loss | -8.99e-05    |
|    value_loss           | 1.09e+03     |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 1774         |
|    time_elapsed         | 99054        |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 1784          |
|    time_elapsed         | 99386         |
|    total_timesteps      | 913408        |
| train/                  |               |
|    approx_kl            | 0.00011317979 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.243        |
|    explained_variance   | 0.237         |
|    learning_rate        | 1e-06         |
|    loss                 | 294           |
|    n_updates            | 17830         |
|    policy_gradient_loss | -0.000325     |
|    value_loss           | 1.05e+03      |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 1785          |
|    time_elapsed         | 9941

------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 1795         |
|    time_elapsed         | 99737        |
|    total_timesteps      | 919040       |
| train/                  |              |
|    approx_kl            | 0.0007995764 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.282       |
|    explained_variance   | 0.763        |
|    learning_rate        | 1e-06        |
|    loss                 | 256          |
|    n_updates            | 17940        |
|    policy_gradient_loss | -0.000665    |
|    value_loss           | 405          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 1796         |
|    time_elapsed         | 99770        |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 1806         |
|    time_elapsed         | 100123       |
|    total_timesteps      | 924672       |
| train/                  |              |
|    approx_kl            | 0.0007595896 |
|    clip_fraction        | 0.00918      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.202       |
|    explained_variance   | 0.854        |
|    learning_rate        | 1e-06        |
|    loss                 | 64.9         |
|    n_updates            | 18050        |
|    policy_gradient_loss | -0.00106     |
|    value_loss           | 126          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 1807          |
|    time_elapsed         | 100156        |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 1817          |
|    time_elapsed         | 100469        |
|    total_timesteps      | 930304        |
| train/                  |               |
|    approx_kl            | 7.1976916e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.225        |
|    explained_variance   | 0.906         |
|    learning_rate        | 1e-06         |
|    loss                 | 85.1          |
|    n_updates            | 18160         |
|    policy_gradient_loss | -0.000264     |
|    value_loss           | 200           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 1818          |
|    time_elapsed         | 1005

------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 1828         |
|    time_elapsed         | 100836       |
|    total_timesteps      | 935936       |
| train/                  |              |
|    approx_kl            | 8.655363e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.222       |
|    explained_variance   | 0.859        |
|    learning_rate        | 1e-06        |
|    loss                 | 125          |
|    n_updates            | 18270        |
|    policy_gradient_loss | 6.24e-06     |
|    value_loss           | 215          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 1829          |
|    time_elapsed         | 100866        |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 1839         |
|    time_elapsed         | 101180       |
|    total_timesteps      | 941568       |
| train/                  |              |
|    approx_kl            | 0.0020362176 |
|    clip_fraction        | 0.0193       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.164       |
|    explained_variance   | 0.853        |
|    learning_rate        | 1e-06        |
|    loss                 | 78           |
|    n_updates            | 18380        |
|    policy_gradient_loss | -0.00212     |
|    value_loss           | 192          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 1840         |
|    time_elapsed         | 101211       |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 1850         |
|    time_elapsed         | 101510       |
|    total_timesteps      | 947200       |
| train/                  |              |
|    approx_kl            | 0.0003099764 |
|    clip_fraction        | 0.00176      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.181       |
|    explained_variance   | 0.336        |
|    learning_rate        | 1e-06        |
|    loss                 | 355          |
|    n_updates            | 18490        |
|    policy_gradient_loss | -0.000881    |
|    value_loss           | 846          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 1851          |
|    time_elapsed         | 101538        |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 1861         |
|    time_elapsed         | 101833       |
|    total_timesteps      | 952832       |
| train/                  |              |
|    approx_kl            | 1.211185e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.152       |
|    explained_variance   | 0.576        |
|    learning_rate        | 1e-06        |
|    loss                 | 826          |
|    n_updates            | 18600        |
|    policy_gradient_loss | 3.39e-05     |
|    value_loss           | 1.02e+03     |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 1862         |
|    time_elapsed         | 101864       |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 1872          |
|    time_elapsed         | 102164        |
|    total_timesteps      | 958464        |
| train/                  |               |
|    approx_kl            | 2.1156156e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.161        |
|    explained_variance   | 0.558         |
|    learning_rate        | 1e-06         |
|    loss                 | 403           |
|    n_updates            | 18710         |
|    policy_gradient_loss | -8.85e-05     |
|    value_loss           | 791           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 1873          |
|    time_elapsed         | 1021

------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 1883         |
|    time_elapsed         | 102498       |
|    total_timesteps      | 964096       |
| train/                  |              |
|    approx_kl            | 0.0003926407 |
|    clip_fraction        | 0.000586     |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.201       |
|    explained_variance   | 0.803        |
|    learning_rate        | 1e-06        |
|    loss                 | 111          |
|    n_updates            | 18820        |
|    policy_gradient_loss | -0.000745    |
|    value_loss           | 473          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 1884          |
|    time_elapsed         | 102529        |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 1894          |
|    time_elapsed         | 102834        |
|    total_timesteps      | 969728        |
| train/                  |               |
|    approx_kl            | 0.00035947794 |
|    clip_fraction        | 0.000781      |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.266        |
|    explained_variance   | 0.479         |
|    learning_rate        | 1e-06         |
|    loss                 | 406           |
|    n_updates            | 18930         |
|    policy_gradient_loss | -0.000556     |
|    value_loss           | 974           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 1895         |
|    time_elapsed         | 102864  

------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 1905         |
|    time_elapsed         | 103173       |
|    total_timesteps      | 975360       |
| train/                  |              |
|    approx_kl            | 0.0002909694 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.204       |
|    explained_variance   | 0.44         |
|    learning_rate        | 1e-06        |
|    loss                 | 125          |
|    n_updates            | 19040        |
|    policy_gradient_loss | -0.000265    |
|    value_loss           | 379          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 1906         |
|    time_elapsed         | 103205       |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 1916         |
|    time_elapsed         | 103520       |
|    total_timesteps      | 980992       |
| train/                  |              |
|    approx_kl            | 0.0005198476 |
|    clip_fraction        | 0.00352      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.167       |
|    explained_variance   | 0.727        |
|    learning_rate        | 1e-06        |
|    loss                 | 150          |
|    n_updates            | 19150        |
|    policy_gradient_loss | -0.000922    |
|    value_loss           | 409          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 1917          |
|    time_elapsed         | 103550        |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 1927         |
|    time_elapsed         | 103900       |
|    total_timesteps      | 986624       |
| train/                  |              |
|    approx_kl            | 0.0014253259 |
|    clip_fraction        | 0.00527      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.27        |
|    explained_variance   | 0.7          |
|    learning_rate        | 1e-06        |
|    loss                 | 130          |
|    n_updates            | 19260        |
|    policy_gradient_loss | -0.000698    |
|    value_loss           | 404          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 1928         |
|    time_elapsed         | 103936       |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 1938         |
|    time_elapsed         | 104301       |
|    total_timesteps      | 992256       |
| train/                  |              |
|    approx_kl            | 0.0007631534 |
|    clip_fraction        | 0.000195     |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.267       |
|    explained_variance   | 0.758        |
|    learning_rate        | 1e-06        |
|    loss                 | 222          |
|    n_updates            | 19370        |
|    policy_gradient_loss | -0.000634    |
|    value_loss           | 488          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 1939          |
|    time_elapsed         | 104334        |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 1949         |
|    time_elapsed         | 104671       |
|    total_timesteps      | 997888       |
| train/                  |              |
|    approx_kl            | 0.0008206413 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.302       |
|    explained_variance   | 0.851        |
|    learning_rate        | 1e-06        |
|    loss                 | 180          |
|    n_updates            | 19480        |
|    policy_gradient_loss | -0.000674    |
|    value_loss           | 379          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 1950         |
|    time_elapsed         | 104705       |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 1960          |
|    time_elapsed         | 105031        |
|    total_timesteps      | 1003520       |
| train/                  |               |
|    approx_kl            | 0.00060162484 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.302        |
|    explained_variance   | 0.803         |
|    learning_rate        | 1e-06         |
|    loss                 | 166           |
|    n_updates            | 19590         |
|    policy_gradient_loss | -0.000591     |
|    value_loss           | 395           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 1961         |
|    time_elapsed         | 105061  

-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 1971          |
|    time_elapsed         | 105390        |
|    total_timesteps      | 1009152       |
| train/                  |               |
|    approx_kl            | 0.00031560112 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.305        |
|    explained_variance   | 0.681         |
|    learning_rate        | 1e-06         |
|    loss                 | 414           |
|    n_updates            | 19700         |
|    policy_gradient_loss | -0.000206     |
|    value_loss           | 860           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 1972         |
|    time_elapsed         | 105424  

-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 1982          |
|    time_elapsed         | 105814        |
|    total_timesteps      | 1014784       |
| train/                  |               |
|    approx_kl            | 0.00027951715 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.223        |
|    explained_variance   | 0.841         |
|    learning_rate        | 1e-06         |
|    loss                 | 199           |
|    n_updates            | 19810         |
|    policy_gradient_loss | -0.00041      |
|    value_loss           | 446           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 1983          |
|    time_elapsed         | 1058

-----------------------------------------
| time/                   |             |
|    fps                  | 9           |
|    iterations           | 1993        |
|    time_elapsed         | 106297      |
|    total_timesteps      | 1020416     |
| train/                  |             |
|    approx_kl            | 0.000991188 |
|    clip_fraction        | 0.0186      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.225      |
|    explained_variance   | 0.828       |
|    learning_rate        | 1e-06       |
|    loss                 | 74.7        |
|    n_updates            | 19920       |
|    policy_gradient_loss | -0.00252    |
|    value_loss           | 159         |
-----------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 1994          |
|    time_elapsed         | 106329        |
|    total_timesteps    

------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 2004         |
|    time_elapsed         | 106648       |
|    total_timesteps      | 1026048      |
| train/                  |              |
|    approx_kl            | 0.0003114913 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.2         |
|    explained_variance   | 0.629        |
|    learning_rate        | 1e-06        |
|    loss                 | 401          |
|    n_updates            | 20030        |
|    policy_gradient_loss | -0.000461    |
|    value_loss           | 904          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 2005          |
|    time_elapsed         | 106678        |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 2015          |
|    time_elapsed         | 106980        |
|    total_timesteps      | 1031680       |
| train/                  |               |
|    approx_kl            | 0.00020732323 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.294        |
|    explained_variance   | 0.722         |
|    learning_rate        | 1e-06         |
|    loss                 | 183           |
|    n_updates            | 20140         |
|    policy_gradient_loss | -0.000245     |
|    value_loss           | 348           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 2016         |
|    time_elapsed         | 107016  

-----------------------------------------
| time/                   |             |
|    fps                  | 9           |
|    iterations           | 2026        |
|    time_elapsed         | 107383      |
|    total_timesteps      | 1037312     |
| train/                  |             |
|    approx_kl            | 0.001937068 |
|    clip_fraction        | 0.00723     |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.327      |
|    explained_variance   | 0.475       |
|    learning_rate        | 1e-06       |
|    loss                 | 383         |
|    n_updates            | 20250       |
|    policy_gradient_loss | -0.00257    |
|    value_loss           | 565         |
-----------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 2027          |
|    time_elapsed         | 107412        |
|    total_timesteps    

------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 2037         |
|    time_elapsed         | 107716       |
|    total_timesteps      | 1042944      |
| train/                  |              |
|    approx_kl            | 3.256253e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.164       |
|    explained_variance   | 0.667        |
|    learning_rate        | 1e-06        |
|    loss                 | 426          |
|    n_updates            | 20360        |
|    policy_gradient_loss | -3.87e-06    |
|    value_loss           | 798          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 2038         |
|    time_elapsed         | 107747       |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 2048          |
|    time_elapsed         | 108064        |
|    total_timesteps      | 1048576       |
| train/                  |               |
|    approx_kl            | 0.00033828872 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.242        |
|    explained_variance   | 0.58          |
|    learning_rate        | 1e-06         |
|    loss                 | 169           |
|    n_updates            | 20470         |
|    policy_gradient_loss | -0.000322     |
|    value_loss           | 830           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 2049         |
|    time_elapsed         | 108096  

-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 2059          |
|    time_elapsed         | 108451        |
|    total_timesteps      | 1054208       |
| train/                  |               |
|    approx_kl            | 0.00069231004 |
|    clip_fraction        | 0.00313       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.189        |
|    explained_variance   | 0.788         |
|    learning_rate        | 1e-06         |
|    loss                 | 97.7          |
|    n_updates            | 20580         |
|    policy_gradient_loss | -0.000337     |
|    value_loss           | 238           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 2060          |
|    time_elapsed         | 1084

------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 2070         |
|    time_elapsed         | 108796       |
|    total_timesteps      | 1059840      |
| train/                  |              |
|    approx_kl            | 0.0011514401 |
|    clip_fraction        | 0.00488      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.258       |
|    explained_variance   | 0.604        |
|    learning_rate        | 1e-06        |
|    loss                 | 103          |
|    n_updates            | 20690        |
|    policy_gradient_loss | -0.000692    |
|    value_loss           | 254          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 2071         |
|    time_elapsed         | 108826       |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 2081          |
|    time_elapsed         | 109185        |
|    total_timesteps      | 1065472       |
| train/                  |               |
|    approx_kl            | 0.00080888264 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.341        |
|    explained_variance   | 0.885         |
|    learning_rate        | 1e-06         |
|    loss                 | 113           |
|    n_updates            | 20800         |
|    policy_gradient_loss | -0.000395     |
|    value_loss           | 218           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 2082         |
|    time_elapsed         | 109223  

------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 2092         |
|    time_elapsed         | 109590       |
|    total_timesteps      | 1071104      |
| train/                  |              |
|    approx_kl            | 0.0005312901 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.76        |
|    explained_variance   | -0.688       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0906       |
|    n_updates            | 20910        |
|    policy_gradient_loss | -0.00131     |
|    value_loss           | 0.179        |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 2093         |
|    time_elapsed         | 109627       |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 2103         |
|    time_elapsed         | 109995       |
|    total_timesteps      | 1076736      |
| train/                  |              |
|    approx_kl            | 0.0001230021 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.78        |
|    explained_variance   | 0.819        |
|    learning_rate        | 1e-06        |
|    loss                 | 81           |
|    n_updates            | 21020        |
|    policy_gradient_loss | -8.37e-05    |
|    value_loss           | 95.1         |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 2104         |
|    time_elapsed         | 110034       |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 2114          |
|    time_elapsed         | 110397        |
|    total_timesteps      | 1082368       |
| train/                  |               |
|    approx_kl            | 0.00012998132 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.849        |
|    explained_variance   | 0.45          |
|    learning_rate        | 1e-06         |
|    loss                 | 0.501         |
|    n_updates            | 21130         |
|    policy_gradient_loss | -0.000109     |
|    value_loss           | 1.22          |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 2115         |
|    time_elapsed         | 110437  

-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 2125          |
|    time_elapsed         | 110790        |
|    total_timesteps      | 1088000       |
| train/                  |               |
|    approx_kl            | 2.5135581e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.762        |
|    explained_variance   | 0.725         |
|    learning_rate        | 1e-06         |
|    loss                 | 68.2          |
|    n_updates            | 21240         |
|    policy_gradient_loss | -0.000247     |
|    value_loss           | 186           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 2126          |
|    time_elapsed         | 1108

------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 2136         |
|    time_elapsed         | 111187       |
|    total_timesteps      | 1093632      |
| train/                  |              |
|    approx_kl            | 5.614641e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.651       |
|    explained_variance   | 0.755        |
|    learning_rate        | 1e-06        |
|    loss                 | 50.6         |
|    n_updates            | 21350        |
|    policy_gradient_loss | -0.000341    |
|    value_loss           | 73.5         |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 2137          |
|    time_elapsed         | 111224        |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 2147         |
|    time_elapsed         | 111581       |
|    total_timesteps      | 1099264      |
| train/                  |              |
|    approx_kl            | 2.049876e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.609       |
|    explained_variance   | 0.914        |
|    learning_rate        | 1e-06        |
|    loss                 | 136          |
|    n_updates            | 21460        |
|    policy_gradient_loss | -6.65e-05    |
|    value_loss           | 245          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 2148         |
|    time_elapsed         | 111617       |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 2158          |
|    time_elapsed         | 111984        |
|    total_timesteps      | 1104896       |
| train/                  |               |
|    approx_kl            | 2.8392533e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.64         |
|    explained_variance   | 0.703         |
|    learning_rate        | 1e-06         |
|    loss                 | 88.6          |
|    n_updates            | 21570         |
|    policy_gradient_loss | 6.71e-05      |
|    value_loss           | 197           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 2159          |
|    time_elapsed         | 1120

------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 2169         |
|    time_elapsed         | 112376       |
|    total_timesteps      | 1110528      |
| train/                  |              |
|    approx_kl            | 8.509657e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.67        |
|    explained_variance   | 0.928        |
|    learning_rate        | 1e-06        |
|    loss                 | 54.4         |
|    n_updates            | 21680        |
|    policy_gradient_loss | -0.00024     |
|    value_loss           | 161          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 2170          |
|    time_elapsed         | 112411        |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 2180         |
|    time_elapsed         | 112769       |
|    total_timesteps      | 1116160      |
| train/                  |              |
|    approx_kl            | 0.0008770786 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.657       |
|    explained_variance   | 0.443        |
|    learning_rate        | 1e-06        |
|    loss                 | 0.751        |
|    n_updates            | 21790        |
|    policy_gradient_loss | -9.95e-05    |
|    value_loss           | 2.98         |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 2181         |
|    time_elapsed         | 112803       |
|    total_

-----------------------------------------
| time/                   |             |
|    fps                  | 9           |
|    iterations           | 2191        |
|    time_elapsed         | 113158      |
|    total_timesteps      | 1121792     |
| train/                  |             |
|    approx_kl            | 0.002049311 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.849      |
|    explained_variance   | -0.647      |
|    learning_rate        | 1e-06       |
|    loss                 | 0.176       |
|    n_updates            | 21900       |
|    policy_gradient_loss | -0.00174    |
|    value_loss           | 1.04        |
-----------------------------------------
-----------------------------------------
| time/                   |             |
|    fps                  | 9           |
|    iterations           | 2192        |
|    time_elapsed         | 113194      |
|    total_timesteps      | 112230

------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 2202         |
|    time_elapsed         | 113544       |
|    total_timesteps      | 1127424      |
| train/                  |              |
|    approx_kl            | 0.0010988243 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.927       |
|    explained_variance   | -0.168       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.363        |
|    n_updates            | 22010        |
|    policy_gradient_loss | -0.000334    |
|    value_loss           | 1.42         |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 2203         |
|    time_elapsed         | 113581       |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 2213          |
|    time_elapsed         | 113942        |
|    total_timesteps      | 1133056       |
| train/                  |               |
|    approx_kl            | 0.00025794178 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.885        |
|    explained_variance   | 0.919         |
|    learning_rate        | 1e-06         |
|    loss                 | 133           |
|    n_updates            | 22120         |
|    policy_gradient_loss | 0.00127       |
|    value_loss           | 234           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 2214         |
|    time_elapsed         | 113977  

--------------------------------------------
| time/                   |                |
|    fps                  | 9              |
|    iterations           | 2224           |
|    time_elapsed         | 114349         |
|    total_timesteps      | 1138688        |
| train/                  |                |
|    approx_kl            | 0.000122067984 |
|    clip_fraction        | 0.000586       |
|    clip_range           | 0.2            |
|    entropy_loss         | -0.794         |
|    explained_variance   | 0.536          |
|    learning_rate        | 1e-06          |
|    loss                 | 1.15           |
|    n_updates            | 22230          |
|    policy_gradient_loss | -0.000636      |
|    value_loss           | 1.6            |
--------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 2225          |
|    time_elap

------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 2235         |
|    time_elapsed         | 114749       |
|    total_timesteps      | 1144320      |
| train/                  |              |
|    approx_kl            | 0.0004401697 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.748       |
|    explained_variance   | 0.55         |
|    learning_rate        | 1e-06        |
|    loss                 | 0.609        |
|    n_updates            | 22340        |
|    policy_gradient_loss | -0.00148     |
|    value_loss           | 1.59         |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 9            |
|    iterations           | 2236         |
|    time_elapsed         | 114788       |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 9             |
|    iterations           | 2246          |
|    time_elapsed         | 115139        |
|    total_timesteps      | 1149952       |
| train/                  |               |
|    approx_kl            | 2.3851753e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.651        |
|    explained_variance   | 0.857         |
|    learning_rate        | 1e-06         |
|    loss                 | 60.3          |
|    n_updates            | 22450         |
|    policy_gradient_loss | 6.94e-05      |
|    value_loss           | 102           |
-------------------------------------------
-----------------------------------------
| time/                   |             |
|    fps                  | 9           |
|    iterations           | 2247        |
|    time_elapsed         | 115170      

-------------------------------------------
| time/                   |               |
|    fps                  | 10            |
|    iterations           | 2257          |
|    time_elapsed         | 115534        |
|    total_timesteps      | 1155584       |
| train/                  |               |
|    approx_kl            | 3.4122728e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.57         |
|    explained_variance   | 0.845         |
|    learning_rate        | 1e-06         |
|    loss                 | 72.1          |
|    n_updates            | 22560         |
|    policy_gradient_loss | 2.94e-05      |
|    value_loss           | 300           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 10           |
|    iterations           | 2258         |
|    time_elapsed         | 115570  

-------------------------------------------
| time/                   |               |
|    fps                  | 10            |
|    iterations           | 2268          |
|    time_elapsed         | 115923        |
|    total_timesteps      | 1161216       |
| train/                  |               |
|    approx_kl            | 0.00014794688 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.507        |
|    explained_variance   | 0.771         |
|    learning_rate        | 1e-06         |
|    loss                 | 123           |
|    n_updates            | 22670         |
|    policy_gradient_loss | -0.000225     |
|    value_loss           | 180           |
-------------------------------------------
--------------------------------------------
| time/                   |                |
|    fps                  | 10             |
|    iterations           | 2269           |
|    time_elapsed         | 

-------------------------------------------
| time/                   |               |
|    fps                  | 10            |
|    iterations           | 2279          |
|    time_elapsed         | 116312        |
|    total_timesteps      | 1166848       |
| train/                  |               |
|    approx_kl            | 4.2216852e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.442        |
|    explained_variance   | 0.407         |
|    learning_rate        | 1e-06         |
|    loss                 | 111           |
|    n_updates            | 22780         |
|    policy_gradient_loss | -2.6e-05      |
|    value_loss           | 885           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 10            |
|    iterations           | 2280          |
|    time_elapsed         | 1163

-------------------------------------------
| time/                   |               |
|    fps                  | 10            |
|    iterations           | 2290          |
|    time_elapsed         | 116695        |
|    total_timesteps      | 1172480       |
| train/                  |               |
|    approx_kl            | 0.00093779725 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.469        |
|    explained_variance   | 0.97          |
|    learning_rate        | 1e-06         |
|    loss                 | 56.8          |
|    n_updates            | 22890         |
|    policy_gradient_loss | -0.00114      |
|    value_loss           | 118           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 10            |
|    iterations           | 2291          |
|    time_elapsed         | 1167

------------------------------------------
| time/                   |              |
|    fps                  | 10           |
|    iterations           | 2301         |
|    time_elapsed         | 117078       |
|    total_timesteps      | 1178112      |
| train/                  |              |
|    approx_kl            | 7.308717e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.363       |
|    explained_variance   | 0.678        |
|    learning_rate        | 1e-06        |
|    loss                 | 628          |
|    n_updates            | 23000        |
|    policy_gradient_loss | -0.000159    |
|    value_loss           | 807          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 10            |
|    iterations           | 2302          |
|    time_elapsed         | 117110        |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 10            |
|    iterations           | 2312          |
|    time_elapsed         | 117414        |
|    total_timesteps      | 1183744       |
| train/                  |               |
|    approx_kl            | 1.7345534e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.435        |
|    explained_variance   | 0.773         |
|    learning_rate        | 1e-06         |
|    loss                 | 182           |
|    n_updates            | 23110         |
|    policy_gradient_loss | 1.69e-05      |
|    value_loss           | 276           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 10            |
|    iterations           | 2313          |
|    time_elapsed         | 1174

-------------------------------------------
| time/                   |               |
|    fps                  | 10            |
|    iterations           | 2323          |
|    time_elapsed         | 117741        |
|    total_timesteps      | 1189376       |
| train/                  |               |
|    approx_kl            | 1.1008349e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.391        |
|    explained_variance   | 0.789         |
|    learning_rate        | 1e-06         |
|    loss                 | 519           |
|    n_updates            | 23220         |
|    policy_gradient_loss | -4.65e-05     |
|    value_loss           | 784           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 10           |
|    iterations           | 2324         |
|    time_elapsed         | 117769  

-------------------------------------------
| time/                   |               |
|    fps                  | 10            |
|    iterations           | 2334          |
|    time_elapsed         | 118057        |
|    total_timesteps      | 1195008       |
| train/                  |               |
|    approx_kl            | 0.00017022074 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.355        |
|    explained_variance   | 0.853         |
|    learning_rate        | 1e-06         |
|    loss                 | 229           |
|    n_updates            | 23330         |
|    policy_gradient_loss | -0.000204     |
|    value_loss           | 497           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 10           |
|    iterations           | 2335         |
|    time_elapsed         | 118088  

-----------------------------------------
| time/                   |             |
|    fps                  | 10          |
|    iterations           | 2345        |
|    time_elapsed         | 118392      |
|    total_timesteps      | 1200640     |
| train/                  |             |
|    approx_kl            | 5.11721e-05 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.305      |
|    explained_variance   | 0.859       |
|    learning_rate        | 1e-06       |
|    loss                 | 117         |
|    n_updates            | 23440       |
|    policy_gradient_loss | -7.91e-06   |
|    value_loss           | 283         |
-----------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 10           |
|    iterations           | 2346         |
|    time_elapsed         | 118424       |
|    total_timesteps      | 1

------------------------------------------
| time/                   |              |
|    fps                  | 10           |
|    iterations           | 2356         |
|    time_elapsed         | 118818       |
|    total_timesteps      | 1206272      |
| train/                  |              |
|    approx_kl            | 8.524163e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.362       |
|    explained_variance   | 0.41         |
|    learning_rate        | 1e-06        |
|    loss                 | 603          |
|    n_updates            | 23550        |
|    policy_gradient_loss | -2.48e-05    |
|    value_loss           | 1.16e+03     |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 10            |
|    iterations           | 2357          |
|    time_elapsed         | 118859        |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 10            |
|    iterations           | 2367          |
|    time_elapsed         | 119273        |
|    total_timesteps      | 1211904       |
| train/                  |               |
|    approx_kl            | 3.8672704e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.337        |
|    explained_variance   | 0.816         |
|    learning_rate        | 1e-06         |
|    loss                 | 357           |
|    n_updates            | 23660         |
|    policy_gradient_loss | -0.000101     |
|    value_loss           | 1.03e+03      |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 10           |
|    iterations           | 2368         |
|    time_elapsed         | 119313  

-------------------------------------------
| time/                   |               |
|    fps                  | 10            |
|    iterations           | 2378          |
|    time_elapsed         | 119727        |
|    total_timesteps      | 1217536       |
| train/                  |               |
|    approx_kl            | 0.00036357774 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.261        |
|    explained_variance   | 0.692         |
|    learning_rate        | 1e-06         |
|    loss                 | 283           |
|    n_updates            | 23770         |
|    policy_gradient_loss | -0.000417     |
|    value_loss           | 739           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 10           |
|    iterations           | 2379         |
|    time_elapsed         | 119767  

-------------------------------------------
| time/                   |               |
|    fps                  | 10            |
|    iterations           | 2389          |
|    time_elapsed         | 120152        |
|    total_timesteps      | 1223168       |
| train/                  |               |
|    approx_kl            | 0.00062981155 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.191        |
|    explained_variance   | 0.861         |
|    learning_rate        | 1e-06         |
|    loss                 | 129           |
|    n_updates            | 23880         |
|    policy_gradient_loss | -0.000411     |
|    value_loss           | 347           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 10           |
|    iterations           | 2390         |
|    time_elapsed         | 120187  

------------------------------------------
| time/                   |              |
|    fps                  | 10           |
|    iterations           | 2400         |
|    time_elapsed         | 120545       |
|    total_timesteps      | 1228800      |
| train/                  |              |
|    approx_kl            | 6.925443e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.257       |
|    explained_variance   | 0.8          |
|    learning_rate        | 1e-06        |
|    loss                 | 155          |
|    n_updates            | 23990        |
|    policy_gradient_loss | -0.000203    |
|    value_loss           | 268          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 10           |
|    iterations           | 2401         |
|    time_elapsed         | 120583       |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 10            |
|    iterations           | 2411          |
|    time_elapsed         | 120907        |
|    total_timesteps      | 1234432       |
| train/                  |               |
|    approx_kl            | 0.00041711912 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.242        |
|    explained_variance   | 0.671         |
|    learning_rate        | 1e-06         |
|    loss                 | 122           |
|    n_updates            | 24100         |
|    policy_gradient_loss | -0.000615     |
|    value_loss           | 284           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 10           |
|    iterations           | 2412         |
|    time_elapsed         | 120936  

------------------------------------------
| time/                   |              |
|    fps                  | 10           |
|    iterations           | 2422         |
|    time_elapsed         | 121234       |
|    total_timesteps      | 1240064      |
| train/                  |              |
|    approx_kl            | 9.733369e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.297       |
|    explained_variance   | 0.638        |
|    learning_rate        | 1e-06        |
|    loss                 | 286          |
|    n_updates            | 24210        |
|    policy_gradient_loss | 0.000193     |
|    value_loss           | 901          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 10            |
|    iterations           | 2423          |
|    time_elapsed         | 121265        |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 10            |
|    iterations           | 2433          |
|    time_elapsed         | 121649        |
|    total_timesteps      | 1245696       |
| train/                  |               |
|    approx_kl            | 7.0539536e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.194        |
|    explained_variance   | 0.837         |
|    learning_rate        | 1e-06         |
|    loss                 | 162           |
|    n_updates            | 24320         |
|    policy_gradient_loss | -0.000189     |
|    value_loss           | 401           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 10           |
|    iterations           | 2434         |
|    time_elapsed         | 121694  

-----------------------------------------
| time/                   |             |
|    fps                  | 10          |
|    iterations           | 2444        |
|    time_elapsed         | 122009      |
|    total_timesteps      | 1251328     |
| train/                  |             |
|    approx_kl            | 0.000423264 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.244      |
|    explained_variance   | 0.527       |
|    learning_rate        | 1e-06       |
|    loss                 | 82.1        |
|    n_updates            | 24430       |
|    policy_gradient_loss | -0.000189   |
|    value_loss           | 660         |
-----------------------------------------
-----------------------------------------
| time/                   |             |
|    fps                  | 10          |
|    iterations           | 2445        |
|    time_elapsed         | 122039      |
|    total_timesteps      | 125184

-------------------------------------------
| time/                   |               |
|    fps                  | 10            |
|    iterations           | 2455          |
|    time_elapsed         | 122348        |
|    total_timesteps      | 1256960       |
| train/                  |               |
|    approx_kl            | 0.00079835113 |
|    clip_fraction        | 0.000391      |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.224        |
|    explained_variance   | 0.521         |
|    learning_rate        | 1e-06         |
|    loss                 | 302           |
|    n_updates            | 24540         |
|    policy_gradient_loss | -0.0011       |
|    value_loss           | 908           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 10           |
|    iterations           | 2456         |
|    time_elapsed         | 122378  

-------------------------------------------
| time/                   |               |
|    fps                  | 10            |
|    iterations           | 2466          |
|    time_elapsed         | 122709        |
|    total_timesteps      | 1262592       |
| train/                  |               |
|    approx_kl            | 0.00031895167 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.253        |
|    explained_variance   | 0.765         |
|    learning_rate        | 1e-06         |
|    loss                 | 74.3          |
|    n_updates            | 24650         |
|    policy_gradient_loss | -0.000595     |
|    value_loss           | 274           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 10           |
|    iterations           | 2467         |
|    time_elapsed         | 122741  

-------------------------------------------
| time/                   |               |
|    fps                  | 10            |
|    iterations           | 2477          |
|    time_elapsed         | 123070        |
|    total_timesteps      | 1268224       |
| train/                  |               |
|    approx_kl            | 0.00035193504 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.318        |
|    explained_variance   | 0.833         |
|    learning_rate        | 1e-06         |
|    loss                 | 50.2          |
|    n_updates            | 24760         |
|    policy_gradient_loss | -0.000602     |
|    value_loss           | 185           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 10           |
|    iterations           | 2478         |
|    time_elapsed         | 123104  

-------------------------------------------
| time/                   |               |
|    fps                  | 10            |
|    iterations           | 2488          |
|    time_elapsed         | 123420        |
|    total_timesteps      | 1273856       |
| train/                  |               |
|    approx_kl            | 1.5588012e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.385        |
|    explained_variance   | 0.571         |
|    learning_rate        | 1e-06         |
|    loss                 | 731           |
|    n_updates            | 24870         |
|    policy_gradient_loss | 5.39e-05      |
|    value_loss           | 953           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 10            |
|    iterations           | 2489          |
|    time_elapsed         | 1234

------------------------------------------
| time/                   |              |
|    fps                  | 10           |
|    iterations           | 2499         |
|    time_elapsed         | 123809       |
|    total_timesteps      | 1279488      |
| train/                  |              |
|    approx_kl            | 0.0009192389 |
|    clip_fraction        | 0.0041       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.248       |
|    explained_variance   | 0.916        |
|    learning_rate        | 1e-06        |
|    loss                 | 149          |
|    n_updates            | 24980        |
|    policy_gradient_loss | -0.0019      |
|    value_loss           | 265          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 10            |
|    iterations           | 2500          |
|    time_elapsed         | 123848        |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 10            |
|    iterations           | 2510          |
|    time_elapsed         | 124203        |
|    total_timesteps      | 1285120       |
| train/                  |               |
|    approx_kl            | 4.6315836e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.175        |
|    explained_variance   | 0.766         |
|    learning_rate        | 1e-06         |
|    loss                 | 413           |
|    n_updates            | 25090         |
|    policy_gradient_loss | -6.6e-06      |
|    value_loss           | 529           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 10            |
|    iterations           | 2511          |
|    time_elapsed         | 1242

------------------------------------------
| time/                   |              |
|    fps                  | 10           |
|    iterations           | 2521         |
|    time_elapsed         | 124590       |
|    total_timesteps      | 1290752      |
| train/                  |              |
|    approx_kl            | 0.0002901731 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.175       |
|    explained_variance   | 0.838        |
|    learning_rate        | 1e-06        |
|    loss                 | 56.2         |
|    n_updates            | 25200        |
|    policy_gradient_loss | -0.000366    |
|    value_loss           | 141          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 10            |
|    iterations           | 2522          |
|    time_elapsed         | 124624        |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 10            |
|    iterations           | 2532          |
|    time_elapsed         | 124978        |
|    total_timesteps      | 1296384       |
| train/                  |               |
|    approx_kl            | 0.00050159695 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.261        |
|    explained_variance   | 0.698         |
|    learning_rate        | 1e-06         |
|    loss                 | 144           |
|    n_updates            | 25310         |
|    policy_gradient_loss | -0.00064      |
|    value_loss           | 277           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 10           |
|    iterations           | 2533         |
|    time_elapsed         | 125015  

-------------------------------------------
| time/                   |               |
|    fps                  | 10            |
|    iterations           | 2543          |
|    time_elapsed         | 125375        |
|    total_timesteps      | 1302016       |
| train/                  |               |
|    approx_kl            | 1.4951336e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.32         |
|    explained_variance   | 0.192         |
|    learning_rate        | 1e-06         |
|    loss                 | 214           |
|    n_updates            | 25420         |
|    policy_gradient_loss | -2.77e-05     |
|    value_loss           | 1.02e+03      |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 10            |
|    iterations           | 2544          |
|    time_elapsed         | 1254

-------------------------------------------
| time/                   |               |
|    fps                  | 10            |
|    iterations           | 2554          |
|    time_elapsed         | 125759        |
|    total_timesteps      | 1307648       |
| train/                  |               |
|    approx_kl            | 5.1377807e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.214        |
|    explained_variance   | 0.678         |
|    learning_rate        | 1e-06         |
|    loss                 | 151           |
|    n_updates            | 25530         |
|    policy_gradient_loss | -3.05e-05     |
|    value_loss           | 630           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 10           |
|    iterations           | 2555         |
|    time_elapsed         | 125796  

------------------------------------------
| time/                   |              |
|    fps                  | 10           |
|    iterations           | 2565         |
|    time_elapsed         | 126145       |
|    total_timesteps      | 1313280      |
| train/                  |              |
|    approx_kl            | 0.0007910774 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.303       |
|    explained_variance   | 0.814        |
|    learning_rate        | 1e-06        |
|    loss                 | 152          |
|    n_updates            | 25640        |
|    policy_gradient_loss | -0.000657    |
|    value_loss           | 308          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 10            |
|    iterations           | 2566          |
|    time_elapsed         | 126184        |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 10            |
|    iterations           | 2576          |
|    time_elapsed         | 126543        |
|    total_timesteps      | 1318912       |
| train/                  |               |
|    approx_kl            | 0.00029317732 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.271        |
|    explained_variance   | 0.803         |
|    learning_rate        | 1e-06         |
|    loss                 | 155           |
|    n_updates            | 25750         |
|    policy_gradient_loss | -0.000489     |
|    value_loss           | 314           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 10           |
|    iterations           | 2577         |
|    time_elapsed         | 126577  

----------------------------------------
| time/                   |            |
|    fps                  | 10         |
|    iterations           | 2587       |
|    time_elapsed         | 126949     |
|    total_timesteps      | 1324544    |
| train/                  |            |
|    approx_kl            | 0.00803658 |
|    clip_fraction        | 0.0619     |
|    clip_range           | 0.2        |
|    entropy_loss         | -1.52      |
|    explained_variance   | 0.568      |
|    learning_rate        | 1e-06      |
|    loss                 | 169        |
|    n_updates            | 25860      |
|    policy_gradient_loss | 0.00346    |
|    value_loss           | 552        |
----------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 10           |
|    iterations           | 2588         |
|    time_elapsed         | 126986       |
|    total_timesteps      | 1325056      |
| tr

---------------------------------------
| time/                   |           |
|    fps                  | 10        |
|    iterations           | 2598      |
|    time_elapsed         | 127308    |
|    total_timesteps      | 1330176   |
| train/                  |           |
|    approx_kl            | 0.0002455 |
|    clip_fraction        | 0         |
|    clip_range           | 0.2       |
|    entropy_loss         | -1.67     |
|    explained_variance   | -0.284    |
|    learning_rate        | 1e-06     |
|    loss                 | 0.187     |
|    n_updates            | 25970     |
|    policy_gradient_loss | -0.000944 |
|    value_loss           | 0.49      |
---------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 10            |
|    iterations           | 2599          |
|    time_elapsed         | 127339        |
|    total_timesteps      | 1330688       |
| train/        

-------------------------------------------
| time/                   |               |
|    fps                  | 10            |
|    iterations           | 2609          |
|    time_elapsed         | 127660        |
|    total_timesteps      | 1335808       |
| train/                  |               |
|    approx_kl            | 0.00012349314 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.197        |
|    explained_variance   | 0.844         |
|    learning_rate        | 1e-06         |
|    loss                 | 102           |
|    n_updates            | 26080         |
|    policy_gradient_loss | -0.000322     |
|    value_loss           | 201           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 10            |
|    iterations           | 2610          |
|    time_elapsed         | 1276

------------------------------------------
| time/                   |              |
|    fps                  | 10           |
|    iterations           | 2620         |
|    time_elapsed         | 128022       |
|    total_timesteps      | 1341440      |
| train/                  |              |
|    approx_kl            | 7.295166e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.276       |
|    explained_variance   | 0.69         |
|    learning_rate        | 1e-06        |
|    loss                 | 646          |
|    n_updates            | 26190        |
|    policy_gradient_loss | 1.93e-05     |
|    value_loss           | 668          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 10            |
|    iterations           | 2621          |
|    time_elapsed         | 128054        |
|    t

# 4. Test

In [5]:
# Load model
model = PPO.load('./train/best_model_1300000')

In [6]:
# Start the game 
state = env.reset()
# Loop through the game
while True: 
    action, _ = model.predict(state)
    state, reward, done, info = env.step(action)
    env.render()

  return (self.ram[0x86] - self.ram[0x071c]) % 256


KeyboardInterrupt: 

In [7]:
env.close()