In [None]:
!pip install gym_super_mario_bros==7.3.0 nes_py

In [3]:
# Import the game
import gym_super_mario_bros
# Import the Joypad wrapper
from nes_py.wrappers import JoypadSpace
# Import the SIMPLIFIED controls
from gym_super_mario_bros.actions import SIMPLE_MOVEMENT

In [4]:
# Setup game (disabled: the same two calls are executed for real in the
# environment-construction cell further down in this notebook)
#env = gym_super_mario_bros.make('SuperMarioBros-v0')
#env = JoypadSpace(env, SIMPLE_MOVEMENT)

In [5]:
# Disabled smoke test: steps the environment with randomly sampled actions for
# 100000 steps, resetting whenever an episode finishes and rendering every frame.
#done = True
#for step in range(100000):
#    if done:
#        env.reset()
#    state, reward, done, info = env.step(env.action_space.sample())
#    env.render()

# Close the environment once the loop is over.
#env.close()

In [None]:
!pip install torch torchvision torchaudio --extra-index-url https://download.pytorch.org/whl/cu117

In [None]:
!pip install stable-baselines3[extra]

In [6]:
from gym.wrappers import FrameStack, GrayScaleObservation

from stable_baselines3.common.vec_env import VecFrameStack, DummyVecEnv

from matplotlib import pyplot as plt

In [7]:
# Create the base environment
base_env = gym_super_mario_bros.make('SuperMarioBros-v0')
# Restrict the controller to the SIMPLE_MOVEMENT action set
joypad_env = JoypadSpace(base_env, SIMPLE_MOVEMENT)
# Convert observations to grayscale
gray_env = GrayScaleObservation(joypad_env, keep_dim=True)
# Wrap the single environment in a vectorised env for stable-baselines3.
# The factory closes over `gray_env`, a name that is never rebound, instead of
# `env`, which the original statement reassigned while the lambda referred to it.
vec_env = DummyVecEnv([lambda: gray_env])
# Stack 4 frames, channels last; `env` is the name the rest of the notebook uses
env = VecFrameStack(vec_env, 4, channels_order='last')

In [8]:
# Import os file for path management
import os
# import PPO for algos
from stable_baselines3 import PPO
# Import Base Callback for saving models
from stable_baselines3.common.callbacks import BaseCallback

In [6]:
class TrainAndLoggingCallback(BaseCallback):
    """Periodically save the model that is being trained.

    Every ``check_freq`` invocations of the callback, the model is written to
    ``save_path`` under the file name ``best_model_<n_calls>``.

    Args:
        check_freq: Number of callback invocations between two saves.
        save_path: Directory that receives the saved models. ``None`` disables
            both directory creation and saving.
        verbose: Verbosity level forwarded to ``BaseCallback``.
    """

    def __init__(self, check_freq, save_path, verbose=1):
        super().__init__(verbose)
        self.check_freq = check_freq
        self.save_path = save_path

    def _init_callback(self):
        """Create the checkpoint directory if a save path was given."""
        if self.save_path is not None:
            os.makedirs(self.save_path, exist_ok=True)

    def _on_step(self):
        """Save the model when the call counter reaches a multiple of ``check_freq``.

        Returns:
            Always ``True``, so this callback never asks for training to stop.
        """
        # `_init_callback` accepts save_path=None, so honour it here as well
        # instead of failing inside os.path.join(None, ...).
        if self.save_path is not None and self.n_calls % self.check_freq == 0:
            model_path = os.path.join(self.save_path, 'best_model_{}'.format(self.n_calls))
            self.model.save(model_path)

        return True

In [7]:
# Directory handed to the training callback as its save path
CHECKPOINT_DIR = './train/'
# Directory handed to PPO as its TensorBoard log location
LOG_DIR = './logs/'

In [9]:
# Checkpoint callback: saves the model into CHECKPOINT_DIR every 20000 calls
callback = TrainAndLoggingCallback(
    save_path=CHECKPOINT_DIR,
    check_freq=20000,
)

In [10]:
# Build the PPO agent with a CNN policy on the prepared environment;
# training metrics are logged for TensorBoard under LOG_DIR.
model = PPO(
    'CnnPolicy',
    env,
    learning_rate=1e-6,
    n_steps=512,
    tensorboard_log=LOG_DIR,
    verbose=1,
)

Using cuda device
Wrapping the env in a VecTransposeImage.


In [11]:
# Run training for one million timesteps, invoking the checkpoint callback along the way
model.learn(callback=callback, total_timesteps=1_000_000)

Logging to ./logs/PPO_2


  return (self.ram[0x86] - self.ram[0x071c]) % 256


----------------------------
| time/              |     |
|    fps             | 110 |
|    iterations      | 1   |
|    time_elapsed    | 4   |
|    total_timesteps | 512 |
----------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 94           |
|    iterations           | 2            |
|    time_elapsed         | 10           |
|    total_timesteps      | 1024         |
| train/                  |              |
|    approx_kl            | 4.520756e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.95        |
|    explained_variance   | -0.00399     |
|    learning_rate        | 1e-06        |
|    loss                 | 76.7         |
|    n_updates            | 10           |
|    policy_gradient_loss | 3.66e-05     |
|    value_loss           | 236          |
------------------------------------------
-----------------------

-------------------------------------------
| time/                   |               |
|    fps                  | 86            |
|    iterations           | 13            |
|    time_elapsed         | 76            |
|    total_timesteps      | 6656          |
| train/                  |               |
|    approx_kl            | 1.4020596e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.95         |
|    explained_variance   | 0.00674       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0968        |
|    n_updates            | 120           |
|    policy_gradient_loss | -0.000286     |
|    value_loss           | 0.173         |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 86           |
|    iterations           | 14           |
|    time_elapsed         | 82      

------------------------------------------
| time/                   |              |
|    fps                  | 86           |
|    iterations           | 24           |
|    time_elapsed         | 142          |
|    total_timesteps      | 12288        |
| train/                  |              |
|    approx_kl            | 3.357744e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.94        |
|    explained_variance   | -0.0464      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0868       |
|    n_updates            | 230          |
|    policy_gradient_loss | -0.000178    |
|    value_loss           | 1.05         |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 85           |
|    iterations           | 25           |
|    time_elapsed         | 148          |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 85           |
|    iterations           | 35           |
|    time_elapsed         | 209          |
|    total_timesteps      | 17920        |
| train/                  |              |
|    approx_kl            | 7.254549e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.94        |
|    explained_variance   | 0.0107       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0697       |
|    n_updates            | 340          |
|    policy_gradient_loss | -0.000753    |
|    value_loss           | 0.159        |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 85           |
|    iterations           | 36           |
|    time_elapsed         | 214          |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 85            |
|    iterations           | 46            |
|    time_elapsed         | 275           |
|    total_timesteps      | 23552         |
| train/                  |               |
|    approx_kl            | 1.8970459e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.94         |
|    explained_variance   | -0.0134       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.217         |
|    n_updates            | 450           |
|    policy_gradient_loss | -0.000201     |
|    value_loss           | 0.385         |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 85           |
|    iterations           | 47           |
|    time_elapsed         | 281     

-------------------------------------------
| time/                   |               |
|    fps                  | 85            |
|    iterations           | 57            |
|    time_elapsed         | 341           |
|    total_timesteps      | 29184         |
| train/                  |               |
|    approx_kl            | 0.00013472012 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.93         |
|    explained_variance   | 0.0615        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0583        |
|    n_updates            | 560           |
|    policy_gradient_loss | -0.0014       |
|    value_loss           | 0.135         |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 85            |
|    iterations           | 58            |
|    time_elapsed         | 347 

-------------------------------------------
| time/                   |               |
|    fps                  | 85            |
|    iterations           | 68            |
|    time_elapsed         | 409           |
|    total_timesteps      | 34816         |
| train/                  |               |
|    approx_kl            | 2.4474692e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.92         |
|    explained_variance   | 0.0934        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0462        |
|    n_updates            | 670           |
|    policy_gradient_loss | -0.000199     |
|    value_loss           | 0.116         |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 85            |
|    iterations           | 69            |
|    time_elapsed         | 414 

-----------------------------------------
| time/                   |             |
|    fps                  | 84          |
|    iterations           | 79          |
|    time_elapsed         | 475         |
|    total_timesteps      | 40448       |
| train/                  |             |
|    approx_kl            | 0.001262655 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -1.9        |
|    explained_variance   | 0.101       |
|    learning_rate        | 1e-06       |
|    loss                 | 117         |
|    n_updates            | 780         |
|    policy_gradient_loss | -5.09e-05   |
|    value_loss           | 336         |
-----------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 84            |
|    iterations           | 80            |
|    time_elapsed         | 482           |
|    total_timesteps    

------------------------------------------
| time/                   |              |
|    fps                  | 84           |
|    iterations           | 90           |
|    time_elapsed         | 544          |
|    total_timesteps      | 46080        |
| train/                  |              |
|    approx_kl            | 0.0001477499 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.9         |
|    explained_variance   | 0.0667       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0616       |
|    n_updates            | 890          |
|    policy_gradient_loss | -0.000918    |
|    value_loss           | 0.165        |
------------------------------------------
-----------------------------------------
| time/                   |             |
|    fps                  | 84          |
|    iterations           | 91          |
|    time_elapsed         | 550         |
|    total_times

------------------------------------------
| time/                   |              |
|    fps                  | 84           |
|    iterations           | 101          |
|    time_elapsed         | 611          |
|    total_timesteps      | 51712        |
| train/                  |              |
|    approx_kl            | 9.936222e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.89        |
|    explained_variance   | 0.0223       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.067        |
|    n_updates            | 1000         |
|    policy_gradient_loss | -0.000447    |
|    value_loss           | 0.701        |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 84            |
|    iterations           | 102           |
|    time_elapsed         | 618           |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 84            |
|    iterations           | 112           |
|    time_elapsed         | 679           |
|    total_timesteps      | 57344         |
| train/                  |               |
|    approx_kl            | 0.00011413684 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.89         |
|    explained_variance   | -0.0794       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0354        |
|    n_updates            | 1110          |
|    policy_gradient_loss | -0.000593     |
|    value_loss           | 0.0998        |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 84            |
|    iterations           | 113           |
|    time_elapsed         | 685 

------------------------------------------
| time/                   |              |
|    fps                  | 84           |
|    iterations           | 123          |
|    time_elapsed         | 747          |
|    total_timesteps      | 62976        |
| train/                  |              |
|    approx_kl            | 5.141995e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.89        |
|    explained_variance   | 0.0228       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0873       |
|    n_updates            | 1220         |
|    policy_gradient_loss | -0.000187    |
|    value_loss           | 0.47         |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 84            |
|    iterations           | 124           |
|    time_elapsed         | 754           |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 83           |
|    iterations           | 134          |
|    time_elapsed         | 817          |
|    total_timesteps      | 68608        |
| train/                  |              |
|    approx_kl            | 7.271848e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.88        |
|    explained_variance   | 0.0657       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0531       |
|    n_updates            | 1330         |
|    policy_gradient_loss | -0.000397    |
|    value_loss           | 0.137        |
------------------------------------------
-----------------------------------------
| time/                   |             |
|    fps                  | 83          |
|    iterations           | 135         |
|    time_elapsed         | 824         |
|    total_times

-------------------------------------------
| time/                   |               |
|    fps                  | 83            |
|    iterations           | 145           |
|    time_elapsed         | 886           |
|    total_timesteps      | 74240         |
| train/                  |               |
|    approx_kl            | 3.9319042e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | -0.0692       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.696         |
|    n_updates            | 1440          |
|    policy_gradient_loss | -0.000149     |
|    value_loss           | 1.57          |
-------------------------------------------
-----------------------------------------
| time/                   |             |
|    fps                  | 83          |
|    iterations           | 146         |
|    time_elapsed         | 893         

-------------------------------------------
| time/                   |               |
|    fps                  | 83            |
|    iterations           | 156           |
|    time_elapsed         | 955           |
|    total_timesteps      | 79872         |
| train/                  |               |
|    approx_kl            | 6.4404914e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.83         |
|    explained_variance   | 0.0195        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0863        |
|    n_updates            | 1550          |
|    policy_gradient_loss | -2.83e-05     |
|    value_loss           | 0.592         |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 83            |
|    iterations           | 157           |
|    time_elapsed         | 962 

-------------------------------------------
| time/                   |               |
|    fps                  | 83            |
|    iterations           | 167           |
|    time_elapsed         | 1026          |
|    total_timesteps      | 85504         |
| train/                  |               |
|    approx_kl            | 0.00011920871 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.82         |
|    explained_variance   | -0.0176       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0549        |
|    n_updates            | 1660          |
|    policy_gradient_loss | -0.000358     |
|    value_loss           | 0.299         |
-------------------------------------------
-----------------------------------------
| time/                   |             |
|    fps                  | 83          |
|    iterations           | 168         |
|    time_elapsed         | 1032        

------------------------------------------
| time/                   |              |
|    fps                  | 83           |
|    iterations           | 178          |
|    time_elapsed         | 1093         |
|    total_timesteps      | 91136        |
| train/                  |              |
|    approx_kl            | 9.993673e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.79        |
|    explained_variance   | 0.046        |
|    learning_rate        | 1e-06        |
|    loss                 | 0.133        |
|    n_updates            | 1770         |
|    policy_gradient_loss | -0.000118    |
|    value_loss           | 0.442        |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 83           |
|    iterations           | 179          |
|    time_elapsed         | 1099         |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 83            |
|    iterations           | 189           |
|    time_elapsed         | 1160          |
|    total_timesteps      | 96768         |
| train/                  |               |
|    approx_kl            | 0.00018417288 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.78         |
|    explained_variance   | 0.11          |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0422        |
|    n_updates            | 1880          |
|    policy_gradient_loss | -0.000647     |
|    value_loss           | 0.0825        |
-------------------------------------------
--------------------------------------------
| time/                   |                |
|    fps                  | 83             |
|    iterations           | 190            |
|    time_elapsed         | 

-------------------------------------------
| time/                   |               |
|    fps                  | 83            |
|    iterations           | 200           |
|    time_elapsed         | 1230          |
|    total_timesteps      | 102400        |
| train/                  |               |
|    approx_kl            | 0.00012532668 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.75         |
|    explained_variance   | 0.0858        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.067         |
|    n_updates            | 1990          |
|    policy_gradient_loss | -0.000511     |
|    value_loss           | 0.248         |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 83            |
|    iterations           | 201           |
|    time_elapsed         | 1236

------------------------------------------
| time/                   |              |
|    fps                  | 83           |
|    iterations           | 211          |
|    time_elapsed         | 1300         |
|    total_timesteps      | 108032       |
| train/                  |              |
|    approx_kl            | 0.0008985391 |
|    clip_fraction        | 0.000195     |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.72        |
|    explained_variance   | 0.627        |
|    learning_rate        | 1e-06        |
|    loss                 | 40           |
|    n_updates            | 2100         |
|    policy_gradient_loss | -0.000121    |
|    value_loss           | 87.2         |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 83            |
|    iterations           | 212           |
|    time_elapsed         | 1306          |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 82            |
|    iterations           | 222           |
|    time_elapsed         | 1370          |
|    total_timesteps      | 113664        |
| train/                  |               |
|    approx_kl            | 0.00090776396 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.72         |
|    explained_variance   | 0.01          |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0416        |
|    n_updates            | 2210          |
|    policy_gradient_loss | -0.00244      |
|    value_loss           | 0.0965        |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 82           |
|    iterations           | 223          |
|    time_elapsed         | 1376    

------------------------------------------
| time/                   |              |
|    fps                  | 83           |
|    iterations           | 233          |
|    time_elapsed         | 1437         |
|    total_timesteps      | 119296       |
| train/                  |              |
|    approx_kl            | 0.0003176449 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.71        |
|    explained_variance   | -0.0348      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0953       |
|    n_updates            | 2320         |
|    policy_gradient_loss | -0.00134     |
|    value_loss           | 0.391        |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 83            |
|    iterations           | 234           |
|    time_elapsed         | 1443          |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 82            |
|    iterations           | 244           |
|    time_elapsed         | 1507          |
|    total_timesteps      | 124928        |
| train/                  |               |
|    approx_kl            | 0.00047528965 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.75         |
|    explained_variance   | -0.0502       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0397        |
|    n_updates            | 2430          |
|    policy_gradient_loss | -0.0014       |
|    value_loss           | 0.0928        |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 82            |
|    iterations           | 245           |
|    time_elapsed         | 1513

-------------------------------------------
| time/                   |               |
|    fps                  | 82            |
|    iterations           | 255           |
|    time_elapsed         | 1574          |
|    total_timesteps      | 130560        |
| train/                  |               |
|    approx_kl            | 0.00037921453 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.73         |
|    explained_variance   | 0.0788        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0498        |
|    n_updates            | 2540          |
|    policy_gradient_loss | -0.00144      |
|    value_loss           | 0.127         |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 82            |
|    iterations           | 256           |
|    time_elapsed         | 1580

------------------------------------------
| time/                   |              |
|    fps                  | 82           |
|    iterations           | 266          |
|    time_elapsed         | 1641         |
|    total_timesteps      | 136192       |
| train/                  |              |
|    approx_kl            | 0.0007735945 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.72        |
|    explained_variance   | 0.108        |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0354       |
|    n_updates            | 2650         |
|    policy_gradient_loss | -0.00229     |
|    value_loss           | 0.0821       |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 82           |
|    iterations           | 267          |
|    time_elapsed         | 1647         |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 82           |
|    iterations           | 277          |
|    time_elapsed         | 1709         |
|    total_timesteps      | 141824       |
| train/                  |              |
|    approx_kl            | 0.0008586686 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.6         |
|    explained_variance   | 0.578        |
|    learning_rate        | 1e-06        |
|    loss                 | 88.4         |
|    n_updates            | 2760         |
|    policy_gradient_loss | -0.00118     |
|    value_loss           | 201          |
------------------------------------------
-----------------------------------------
| time/                   |             |
|    fps                  | 82          |
|    iterations           | 278         |
|    time_elapsed         | 1715        |
|    total_times

------------------------------------------
| time/                   |              |
|    fps                  | 83           |
|    iterations           | 288          |
|    time_elapsed         | 1775         |
|    total_timesteps      | 147456       |
| train/                  |              |
|    approx_kl            | 8.278072e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.64        |
|    explained_variance   | 0.0729       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0518       |
|    n_updates            | 2870         |
|    policy_gradient_loss | -0.000164    |
|    value_loss           | 0.241        |
------------------------------------------
-----------------------------------------
| time/                   |             |
|    fps                  | 83          |
|    iterations           | 289         |
|    time_elapsed         | 1781        |
|    total_times

--------------------------------------------
| time/                   |                |
|    fps                  | 83             |
|    iterations           | 299            |
|    time_elapsed         | 1841           |
|    total_timesteps      | 153088         |
| train/                  |                |
|    approx_kl            | 0.000111211324 |
|    clip_fraction        | 0              |
|    clip_range           | 0.2            |
|    entropy_loss         | -1.54          |
|    explained_variance   | 0.212          |
|    learning_rate        | 1e-06          |
|    loss                 | 0.169          |
|    n_updates            | 2980           |
|    policy_gradient_loss | 0.000123       |
|    value_loss           | 1.94           |
--------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 83           |
|    iterations           | 300          |
|    time_elapsed 

-------------------------------------------
| time/                   |               |
|    fps                  | 83            |
|    iterations           | 310           |
|    time_elapsed         | 1906          |
|    total_timesteps      | 158720        |
| train/                  |               |
|    approx_kl            | 0.00079291733 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.42         |
|    explained_variance   | 0.264         |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0494        |
|    n_updates            | 3090          |
|    policy_gradient_loss | -0.0011       |
|    value_loss           | 0.109         |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 83           |
|    iterations           | 311          |
|    time_elapsed         | 1912    

------------------------------------------
| time/                   |              |
|    fps                  | 83           |
|    iterations           | 321          |
|    time_elapsed         | 1973         |
|    total_timesteps      | 164352       |
| train/                  |              |
|    approx_kl            | 0.0005034901 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.19        |
|    explained_variance   | 0.00324      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.185        |
|    n_updates            | 3200         |
|    policy_gradient_loss | -0.000671    |
|    value_loss           | 1.9          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 83           |
|    iterations           | 322          |
|    time_elapsed         | 1979         |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 83           |
|    iterations           | 332          |
|    time_elapsed         | 2039         |
|    total_timesteps      | 169984       |
| train/                  |              |
|    approx_kl            | 0.0001846049 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.939       |
|    explained_variance   | 0.0363       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0839       |
|    n_updates            | 3310         |
|    policy_gradient_loss | 0.000536     |
|    value_loss           | 3.51         |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 83            |
|    iterations           | 333           |
|    time_elapsed         | 2045          |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 83           |
|    iterations           | 343          |
|    time_elapsed         | 2106         |
|    total_timesteps      | 175616       |
| train/                  |              |
|    approx_kl            | 0.0009342914 |
|    clip_fraction        | 0.00176      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.391       |
|    explained_variance   | 0.406        |
|    learning_rate        | 1e-06        |
|    loss                 | 106          |
|    n_updates            | 3420         |
|    policy_gradient_loss | 0.00125      |
|    value_loss           | 269          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 83            |
|    iterations           | 344           |
|    time_elapsed         | 2112          |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 83            |
|    iterations           | 354           |
|    time_elapsed         | 2175          |
|    total_timesteps      | 181248        |
| train/                  |               |
|    approx_kl            | 0.00013294746 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.247        |
|    explained_variance   | 0.667         |
|    learning_rate        | 1e-06         |
|    loss                 | 100           |
|    n_updates            | 3530          |
|    policy_gradient_loss | -0.000223     |
|    value_loss           | 222           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 83            |
|    iterations           | 355           |
|    time_elapsed         | 2181

-------------------------------------------
| time/                   |               |
|    fps                  | 83            |
|    iterations           | 365           |
|    time_elapsed         | 2242          |
|    total_timesteps      | 186880        |
| train/                  |               |
|    approx_kl            | 1.0254793e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.219        |
|    explained_variance   | 0.19          |
|    learning_rate        | 1e-06         |
|    loss                 | 360           |
|    n_updates            | 3640          |
|    policy_gradient_loss | -0.000199     |
|    value_loss           | 497           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 83           |
|    iterations           | 366          |
|    time_elapsed         | 2249    

-------------------------------------------
| time/                   |               |
|    fps                  | 83            |
|    iterations           | 376           |
|    time_elapsed         | 2310          |
|    total_timesteps      | 192512        |
| train/                  |               |
|    approx_kl            | 0.00014733081 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.218        |
|    explained_variance   | 0.0514        |
|    learning_rate        | 1e-06         |
|    loss                 | 489           |
|    n_updates            | 3750          |
|    policy_gradient_loss | -0.000796     |
|    value_loss           | 696           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 83           |
|    iterations           | 377          |
|    time_elapsed         | 2316    

-------------------------------------------
| time/                   |               |
|    fps                  | 83            |
|    iterations           | 387           |
|    time_elapsed         | 2376          |
|    total_timesteps      | 198144        |
| train/                  |               |
|    approx_kl            | 9.3373936e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.261        |
|    explained_variance   | 0.265         |
|    learning_rate        | 1e-06         |
|    loss                 | 264           |
|    n_updates            | 3860          |
|    policy_gradient_loss | -0.000293     |
|    value_loss           | 532           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 83            |
|    iterations           | 388           |
|    time_elapsed         | 2382

-------------------------------------------
| time/                   |               |
|    fps                  | 83            |
|    iterations           | 398           |
|    time_elapsed         | 2444          |
|    total_timesteps      | 203776        |
| train/                  |               |
|    approx_kl            | 0.00011613686 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.21         |
|    explained_variance   | 0.258         |
|    learning_rate        | 1e-06         |
|    loss                 | 229           |
|    n_updates            | 3970          |
|    policy_gradient_loss | -0.000176     |
|    value_loss           | 465           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 83            |
|    iterations           | 399           |
|    time_elapsed         | 2451

-------------------------------------------
| time/                   |               |
|    fps                  | 83            |
|    iterations           | 409           |
|    time_elapsed         | 2511          |
|    total_timesteps      | 209408        |
| train/                  |               |
|    approx_kl            | 0.00023770891 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.2          |
|    explained_variance   | 0.242         |
|    learning_rate        | 1e-06         |
|    loss                 | 73.4          |
|    n_updates            | 4080          |
|    policy_gradient_loss | -0.000697     |
|    value_loss           | 568           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 83            |
|    iterations           | 410           |
|    time_elapsed         | 2517

-------------------------------------------
| time/                   |               |
|    fps                  | 83            |
|    iterations           | 420           |
|    time_elapsed         | 2576          |
|    total_timesteps      | 215040        |
| train/                  |               |
|    approx_kl            | 0.00036483782 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.21         |
|    explained_variance   | 0.305         |
|    learning_rate        | 1e-06         |
|    loss                 | 489           |
|    n_updates            | 4190          |
|    policy_gradient_loss | -0.000166     |
|    value_loss           | 573           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 83            |
|    iterations           | 421           |
|    time_elapsed         | 2582

-----------------------------------------
| time/                   |             |
|    fps                  | 83          |
|    iterations           | 431         |
|    time_elapsed         | 2644        |
|    total_timesteps      | 220672      |
| train/                  |             |
|    approx_kl            | 0.000635157 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.427      |
|    explained_variance   | 0.76        |
|    learning_rate        | 1e-06       |
|    loss                 | 107         |
|    n_updates            | 4300        |
|    policy_gradient_loss | -0.0011     |
|    value_loss           | 235         |
-----------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 83           |
|    iterations           | 432          |
|    time_elapsed         | 2650         |
|    total_timesteps      | 2

------------------------------------------
| time/                   |              |
|    fps                  | 83           |
|    iterations           | 442          |
|    time_elapsed         | 2711         |
|    total_timesteps      | 226304       |
| train/                  |              |
|    approx_kl            | 0.0001517348 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.392       |
|    explained_variance   | 0.782        |
|    learning_rate        | 1e-06        |
|    loss                 | 93.6         |
|    n_updates            | 4410         |
|    policy_gradient_loss | -0.000734    |
|    value_loss           | 236          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 83           |
|    iterations           | 443          |
|    time_elapsed         | 2717         |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 83            |
|    iterations           | 453           |
|    time_elapsed         | 2777          |
|    total_timesteps      | 231936        |
| train/                  |               |
|    approx_kl            | 4.3641892e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.237        |
|    explained_variance   | 0.228         |
|    learning_rate        | 1e-06         |
|    loss                 | 420           |
|    n_updates            | 4520          |
|    policy_gradient_loss | 0.000548      |
|    value_loss           | 696           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 83            |
|    iterations           | 454           |
|    time_elapsed         | 2783

-------------------------------------------
| time/                   |               |
|    fps                  | 83            |
|    iterations           | 464           |
|    time_elapsed         | 2848          |
|    total_timesteps      | 237568        |
| train/                  |               |
|    approx_kl            | 0.00076896406 |
|    clip_fraction        | 0.000781      |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.353        |
|    explained_variance   | 0.583         |
|    learning_rate        | 1e-06         |
|    loss                 | 320           |
|    n_updates            | 4630          |
|    policy_gradient_loss | 4.75e-05      |
|    value_loss           | 517           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 83            |
|    iterations           | 465           |
|    time_elapsed         | 2854

-------------------------------------------
| time/                   |               |
|    fps                  | 83            |
|    iterations           | 475           |
|    time_elapsed         | 2916          |
|    total_timesteps      | 243200        |
| train/                  |               |
|    approx_kl            | 0.00023666548 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.301        |
|    explained_variance   | 0.489         |
|    learning_rate        | 1e-06         |
|    loss                 | 128           |
|    n_updates            | 4740          |
|    policy_gradient_loss | -0.000872     |
|    value_loss           | 283           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 83            |
|    iterations           | 476           |
|    time_elapsed         | 2922

-------------------------------------------
| time/                   |               |
|    fps                  | 83            |
|    iterations           | 486           |
|    time_elapsed         | 2983          |
|    total_timesteps      | 248832        |
| train/                  |               |
|    approx_kl            | 0.00021000498 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.25         |
|    explained_variance   | 0.417         |
|    learning_rate        | 1e-06         |
|    loss                 | 51            |
|    n_updates            | 4850          |
|    policy_gradient_loss | -0.00035      |
|    value_loss           | 136           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 83            |
|    iterations           | 487           |
|    time_elapsed         | 2990

-------------------------------------------
| time/                   |               |
|    fps                  | 83            |
|    iterations           | 497           |
|    time_elapsed         | 3051          |
|    total_timesteps      | 254464        |
| train/                  |               |
|    approx_kl            | 0.00046728575 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.344        |
|    explained_variance   | 0.613         |
|    learning_rate        | 1e-06         |
|    loss                 | 293           |
|    n_updates            | 4960          |
|    policy_gradient_loss | -0.000617     |
|    value_loss           | 520           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 83           |
|    iterations           | 498          |
|    time_elapsed         | 3056    

------------------------------------------
| time/                   |              |
|    fps                  | 83           |
|    iterations           | 508          |
|    time_elapsed         | 3120         |
|    total_timesteps      | 260096       |
| train/                  |              |
|    approx_kl            | 0.0047663767 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.77        |
|    explained_variance   | -4.04        |
|    learning_rate        | 1e-06        |
|    loss                 | 0.237        |
|    n_updates            | 5070         |
|    policy_gradient_loss | -0.00381     |
|    value_loss           | 1.22         |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 83           |
|    iterations           | 509          |
|    time_elapsed         | 3126         |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 83            |
|    iterations           | 519           |
|    time_elapsed         | 3186          |
|    total_timesteps      | 265728        |
| train/                  |               |
|    approx_kl            | 0.00030821806 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.86         |
|    explained_variance   | 0.00628       |
|    learning_rate        | 1e-06         |
|    loss                 | 0.0493        |
|    n_updates            | 5180          |
|    policy_gradient_loss | -0.000627     |
|    value_loss           | 0.417         |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 83            |
|    iterations           | 520           |
|    time_elapsed         | 3191

---------------------------------------
| time/                   |           |
|    fps                  | 83        |
|    iterations           | 530       |
|    time_elapsed         | 3255      |
|    total_timesteps      | 271360    |
| train/                  |           |
|    approx_kl            | 0.0120095 |
|    clip_fraction        | 0.00684   |
|    clip_range           | 0.2       |
|    entropy_loss         | -1.48     |
|    explained_variance   | -2.29     |
|    learning_rate        | 1e-06     |
|    loss                 | 0.21      |
|    n_updates            | 5290      |
|    policy_gradient_loss | -0.00906  |
|    value_loss           | 0.479     |
---------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 83           |
|    iterations           | 531          |
|    time_elapsed         | 3261         |
|    total_timesteps      | 271872       |
| train/              

-----------------------------------------
| time/                   |             |
|    fps                  | 83          |
|    iterations           | 541         |
|    time_elapsed         | 3328        |
|    total_timesteps      | 276992      |
| train/                  |             |
|    approx_kl            | 0.002111446 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -1.37       |
|    explained_variance   | -0.623      |
|    learning_rate        | 1e-06       |
|    loss                 | 0.258       |
|    n_updates            | 5400        |
|    policy_gradient_loss | -0.00307    |
|    value_loss           | 0.555       |
-----------------------------------------
-----------------------------------------
| time/                   |             |
|    fps                  | 83          |
|    iterations           | 542         |
|    time_elapsed         | 3334        |
|    total_timesteps      | 277504

-------------------------------------------
| time/                   |               |
|    fps                  | 83            |
|    iterations           | 552           |
|    time_elapsed         | 3403          |
|    total_timesteps      | 282624        |
| train/                  |               |
|    approx_kl            | 0.00062394154 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -1.2          |
|    explained_variance   | -0.956        |
|    learning_rate        | 1e-06         |
|    loss                 | 0.313         |
|    n_updates            | 5510          |
|    policy_gradient_loss | -0.000917     |
|    value_loss           | 0.429         |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 83           |
|    iterations           | 553          |
|    time_elapsed         | 3409    

------------------------------------------
| time/                   |              |
|    fps                  | 82           |
|    iterations           | 563          |
|    time_elapsed         | 3476         |
|    total_timesteps      | 288256       |
| train/                  |              |
|    approx_kl            | 0.0026426893 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.05        |
|    explained_variance   | -1.11        |
|    learning_rate        | 1e-06        |
|    loss                 | 0.211        |
|    n_updates            | 5620         |
|    policy_gradient_loss | -0.00164     |
|    value_loss           | 0.539        |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 82            |
|    iterations           | 564           |
|    time_elapsed         | 3483          |
|    t

-----------------------------------------
| time/                   |             |
|    fps                  | 82          |
|    iterations           | 574         |
|    time_elapsed         | 3552        |
|    total_timesteps      | 293888      |
| train/                  |             |
|    approx_kl            | 0.004189033 |
|    clip_fraction        | 0.0291      |
|    clip_range           | 0.2         |
|    entropy_loss         | -1.41       |
|    explained_variance   | -0.534      |
|    learning_rate        | 1e-06       |
|    loss                 | 0.0813      |
|    n_updates            | 5730        |
|    policy_gradient_loss | -0.0072     |
|    value_loss           | 0.207       |
-----------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 82           |
|    iterations           | 575          |
|    time_elapsed         | 3559         |
|    total_timesteps      | 2

------------------------------------------
| time/                   |              |
|    fps                  | 82           |
|    iterations           | 585          |
|    time_elapsed         | 3626         |
|    total_timesteps      | 299520       |
| train/                  |              |
|    approx_kl            | 0.0062944433 |
|    clip_fraction        | 0.0387       |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.36        |
|    explained_variance   | -0.296       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.077        |
|    n_updates            | 5840         |
|    policy_gradient_loss | -0.00631     |
|    value_loss           | 0.272        |
------------------------------------------
-----------------------------------------
| time/                   |             |
|    fps                  | 82          |
|    iterations           | 586         |
|    time_elapsed         | 3633        |
|    total_times

------------------------------------------
| time/                   |              |
|    fps                  | 82           |
|    iterations           | 596          |
|    time_elapsed         | 3699         |
|    total_timesteps      | 305152       |
| train/                  |              |
|    approx_kl            | 0.0005857118 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.34        |
|    explained_variance   | -0.314       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.176        |
|    n_updates            | 5950         |
|    policy_gradient_loss | -0.000684    |
|    value_loss           | 0.472        |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 82            |
|    iterations           | 597           |
|    time_elapsed         | 3706          |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 82           |
|    iterations           | 607          |
|    time_elapsed         | 3776         |
|    total_timesteps      | 310784       |
| train/                  |              |
|    approx_kl            | 0.0010008877 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.17        |
|    explained_variance   | -0.625       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.114        |
|    n_updates            | 6060         |
|    policy_gradient_loss | -0.00137     |
|    value_loss           | 0.31         |
------------------------------------------
-----------------------------------------
| time/                   |             |
|    fps                  | 82          |
|    iterations           | 608         |
|    time_elapsed         | 3783        |
|    total_times

-------------------------------------------
| time/                   |               |
|    fps                  | 82            |
|    iterations           | 618           |
|    time_elapsed         | 3853          |
|    total_timesteps      | 316416        |
| train/                  |               |
|    approx_kl            | 0.00041115202 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.784        |
|    explained_variance   | 0.878         |
|    learning_rate        | 1e-06         |
|    loss                 | 79.5          |
|    n_updates            | 6170          |
|    policy_gradient_loss | 0.000107      |
|    value_loss           | 199           |
-------------------------------------------
--------------------------------------------
| time/                   |                |
|    fps                  | 82             |
|    iterations           | 619            |
|    time_elapsed         | 

------------------------------------------
| time/                   |              |
|    fps                  | 81           |
|    iterations           | 629          |
|    time_elapsed         | 3935         |
|    total_timesteps      | 322048       |
| train/                  |              |
|    approx_kl            | 0.0009845768 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.725       |
|    explained_variance   | 0.87         |
|    learning_rate        | 1e-06        |
|    loss                 | 96.3         |
|    n_updates            | 6280         |
|    policy_gradient_loss | -0.00101     |
|    value_loss           | 146          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 81           |
|    iterations           | 630          |
|    time_elapsed         | 3942         |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 81            |
|    iterations           | 640           |
|    time_elapsed         | 4012          |
|    total_timesteps      | 327680        |
| train/                  |               |
|    approx_kl            | 0.00076231675 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.609        |
|    explained_variance   | 0.618         |
|    learning_rate        | 1e-06         |
|    loss                 | 90            |
|    n_updates            | 6390          |
|    policy_gradient_loss | -0.00122      |
|    value_loss           | 247           |
-------------------------------------------
-----------------------------------------
| time/                   |             |
|    fps                  | 81          |
|    iterations           | 641         |
|    time_elapsed         | 4018        

-------------------------------------------
| time/                   |               |
|    fps                  | 81            |
|    iterations           | 651           |
|    time_elapsed         | 4086          |
|    total_timesteps      | 333312        |
| train/                  |               |
|    approx_kl            | 0.00037525012 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.595        |
|    explained_variance   | 0.6           |
|    learning_rate        | 1e-06         |
|    loss                 | 369           |
|    n_updates            | 6500          |
|    policy_gradient_loss | -0.00114      |
|    value_loss           | 561           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 81            |
|    iterations           | 652           |
|    time_elapsed         | 4093

-------------------------------------------
| time/                   |               |
|    fps                  | 81            |
|    iterations           | 662           |
|    time_elapsed         | 4160          |
|    total_timesteps      | 338944        |
| train/                  |               |
|    approx_kl            | 9.8526245e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.471        |
|    explained_variance   | 0.716         |
|    learning_rate        | 1e-06         |
|    loss                 | 87.3          |
|    n_updates            | 6610          |
|    policy_gradient_loss | 0.000321      |
|    value_loss           | 227           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 81            |
|    iterations           | 663           |
|    time_elapsed         | 4167

-----------------------------------------
| time/                   |             |
|    fps                  | 81          |
|    iterations           | 673         |
|    time_elapsed         | 4235        |
|    total_timesteps      | 344576      |
| train/                  |             |
|    approx_kl            | 0.002671239 |
|    clip_fraction        | 0.0246      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.618      |
|    explained_variance   | 0.559       |
|    learning_rate        | 1e-06       |
|    loss                 | 135         |
|    n_updates            | 6720        |
|    policy_gradient_loss | -0.00205    |
|    value_loss           | 491         |
-----------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 81           |
|    iterations           | 674          |
|    time_elapsed         | 4241         |
|    total_timesteps      | 3

------------------------------------------
| time/                   |              |
|    fps                  | 81           |
|    iterations           | 684          |
|    time_elapsed         | 4311         |
|    total_timesteps      | 350208       |
| train/                  |              |
|    approx_kl            | 0.0017255587 |
|    clip_fraction        | 0.00918      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.667       |
|    explained_variance   | 0.784        |
|    learning_rate        | 1e-06        |
|    loss                 | 83.8         |
|    n_updates            | 6830         |
|    policy_gradient_loss | -0.00304     |
|    value_loss           | 263          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 81            |
|    iterations           | 685           |
|    time_elapsed         | 4318          |
|    t

---------------------------------------
| time/                   |           |
|    fps                  | 81        |
|    iterations           | 695       |
|    time_elapsed         | 4386      |
|    total_timesteps      | 355840    |
| train/                  |           |
|    approx_kl            | 0.0025533 |
|    clip_fraction        | 0.00156   |
|    clip_range           | 0.2       |
|    entropy_loss         | -0.417    |
|    explained_variance   | 0.246     |
|    learning_rate        | 1e-06     |
|    loss                 | 296       |
|    n_updates            | 6940      |
|    policy_gradient_loss | -0.000962 |
|    value_loss           | 555       |
---------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 81           |
|    iterations           | 696          |
|    time_elapsed         | 4393         |
|    total_timesteps      | 356352       |
| train/              

------------------------------------------
| time/                   |              |
|    fps                  | 80           |
|    iterations           | 706          |
|    time_elapsed         | 4463         |
|    total_timesteps      | 361472       |
| train/                  |              |
|    approx_kl            | 0.0005455656 |
|    clip_fraction        | 0.00859      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.471       |
|    explained_variance   | 0.878        |
|    learning_rate        | 1e-06        |
|    loss                 | 76.2         |
|    n_updates            | 7050         |
|    policy_gradient_loss | -0.00178     |
|    value_loss           | 155          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 80            |
|    iterations           | 707           |
|    time_elapsed         | 4470          |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 80           |
|    iterations           | 717          |
|    time_elapsed         | 4538         |
|    total_timesteps      | 367104       |
| train/                  |              |
|    approx_kl            | 0.0025983595 |
|    clip_fraction        | 0.00332      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.471       |
|    explained_variance   | 0.917        |
|    learning_rate        | 1e-06        |
|    loss                 | 52.8         |
|    n_updates            | 7160         |
|    policy_gradient_loss | -0.000661    |
|    value_loss           | 112          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 80            |
|    iterations           | 718           |
|    time_elapsed         | 4545          |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 80            |
|    iterations           | 728           |
|    time_elapsed         | 4612          |
|    total_timesteps      | 372736        |
| train/                  |               |
|    approx_kl            | 0.00087025994 |
|    clip_fraction        | 0.00527       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.578        |
|    explained_variance   | 0.716         |
|    learning_rate        | 1e-06         |
|    loss                 | 102           |
|    n_updates            | 7270          |
|    policy_gradient_loss | -0.00147      |
|    value_loss           | 206           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 80           |
|    iterations           | 729          |
|    time_elapsed         | 4619    

-------------------------------------------
| time/                   |               |
|    fps                  | 80            |
|    iterations           | 739           |
|    time_elapsed         | 4686          |
|    total_timesteps      | 378368        |
| train/                  |               |
|    approx_kl            | 0.00039434107 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.491        |
|    explained_variance   | 0.175         |
|    learning_rate        | 1e-06         |
|    loss                 | 345           |
|    n_updates            | 7380          |
|    policy_gradient_loss | -0.00104      |
|    value_loss           | 573           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 80           |
|    iterations           | 740          |
|    time_elapsed         | 4692    

------------------------------------------
| time/                   |              |
|    fps                  | 80           |
|    iterations           | 750          |
|    time_elapsed         | 4761         |
|    total_timesteps      | 384000       |
| train/                  |              |
|    approx_kl            | 0.0012853784 |
|    clip_fraction        | 0.00391      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.594       |
|    explained_variance   | 0.23         |
|    learning_rate        | 1e-06        |
|    loss                 | 137          |
|    n_updates            | 7490         |
|    policy_gradient_loss | -0.00274     |
|    value_loss           | 339          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 80           |
|    iterations           | 751          |
|    time_elapsed         | 4768         |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 80           |
|    iterations           | 761          |
|    time_elapsed         | 4834         |
|    total_timesteps      | 389632       |
| train/                  |              |
|    approx_kl            | 0.0010924092 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.458       |
|    explained_variance   | 0.77         |
|    learning_rate        | 1e-06        |
|    loss                 | 50.1         |
|    n_updates            | 7600         |
|    policy_gradient_loss | 0.0001       |
|    value_loss           | 124          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 80           |
|    iterations           | 762          |
|    time_elapsed         | 4841         |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 80           |
|    iterations           | 772          |
|    time_elapsed         | 4909         |
|    total_timesteps      | 395264       |
| train/                  |              |
|    approx_kl            | 3.084296e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.29        |
|    explained_variance   | 0.79         |
|    learning_rate        | 1e-06        |
|    loss                 | 167          |
|    n_updates            | 7710         |
|    policy_gradient_loss | -5.12e-05    |
|    value_loss           | 346          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 80            |
|    iterations           | 773           |
|    time_elapsed         | 4916          |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 80           |
|    iterations           | 783          |
|    time_elapsed         | 4983         |
|    total_timesteps      | 400896       |
| train/                  |              |
|    approx_kl            | 8.021074e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.19        |
|    explained_variance   | 0.376        |
|    learning_rate        | 1e-06        |
|    loss                 | 402          |
|    n_updates            | 7820         |
|    policy_gradient_loss | -0.000523    |
|    value_loss           | 461          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 80           |
|    iterations           | 784          |
|    time_elapsed         | 4990         |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 80            |
|    iterations           | 794           |
|    time_elapsed         | 5057          |
|    total_timesteps      | 406528        |
| train/                  |               |
|    approx_kl            | 0.00011369854 |
|    clip_fraction        | 0.000195      |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.192        |
|    explained_variance   | 0.885         |
|    learning_rate        | 1e-06         |
|    loss                 | 55.6          |
|    n_updates            | 7930          |
|    policy_gradient_loss | -0.000355     |
|    value_loss           | 120           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 80           |
|    iterations           | 795          |
|    time_elapsed         | 5063    

-------------------------------------------
| time/                   |               |
|    fps                  | 80            |
|    iterations           | 805           |
|    time_elapsed         | 5132          |
|    total_timesteps      | 412160        |
| train/                  |               |
|    approx_kl            | 0.00010541978 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.239        |
|    explained_variance   | -0.516        |
|    learning_rate        | 1e-06         |
|    loss                 | 405           |
|    n_updates            | 8040          |
|    policy_gradient_loss | -6e-05        |
|    value_loss           | 913           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 80            |
|    iterations           | 806           |
|    time_elapsed         | 5138

-------------------------------------------
| time/                   |               |
|    fps                  | 80            |
|    iterations           | 816           |
|    time_elapsed         | 5208          |
|    total_timesteps      | 417792        |
| train/                  |               |
|    approx_kl            | 0.00050899154 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.397        |
|    explained_variance   | 0.684         |
|    learning_rate        | 1e-06         |
|    loss                 | 127           |
|    n_updates            | 8150          |
|    policy_gradient_loss | -0.00047      |
|    value_loss           | 259           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 80            |
|    iterations           | 817           |
|    time_elapsed         | 5215

------------------------------------------
| time/                   |              |
|    fps                  | 80           |
|    iterations           | 827          |
|    time_elapsed         | 5285         |
|    total_timesteps      | 423424       |
| train/                  |              |
|    approx_kl            | 0.0015512098 |
|    clip_fraction        | 0.0105       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.326       |
|    explained_variance   | 0.523        |
|    learning_rate        | 1e-06        |
|    loss                 | 276          |
|    n_updates            | 8260         |
|    policy_gradient_loss | -0.0021      |
|    value_loss           | 487          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 80           |
|    iterations           | 828          |
|    time_elapsed         | 5292         |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 80           |
|    iterations           | 838          |
|    time_elapsed         | 5361         |
|    total_timesteps      | 429056       |
| train/                  |              |
|    approx_kl            | 0.0009797598 |
|    clip_fraction        | 0.00508      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.31        |
|    explained_variance   | 0.638        |
|    learning_rate        | 1e-06        |
|    loss                 | 254          |
|    n_updates            | 8370         |
|    policy_gradient_loss | -0.00176     |
|    value_loss           | 369          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 80           |
|    iterations           | 839          |
|    time_elapsed         | 5368         |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 79           |
|    iterations           | 849          |
|    time_elapsed         | 5435         |
|    total_timesteps      | 434688       |
| train/                  |              |
|    approx_kl            | 0.0013429945 |
|    clip_fraction        | 0.00234      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.309       |
|    explained_variance   | 0.91         |
|    learning_rate        | 1e-06        |
|    loss                 | 52.1         |
|    n_updates            | 8480         |
|    policy_gradient_loss | -0.00164     |
|    value_loss           | 96.7         |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 79           |
|    iterations           | 850          |
|    time_elapsed         | 5443         |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 79            |
|    iterations           | 860           |
|    time_elapsed         | 5512          |
|    total_timesteps      | 440320        |
| train/                  |               |
|    approx_kl            | 0.00018197775 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.314        |
|    explained_variance   | 0.651         |
|    learning_rate        | 1e-06         |
|    loss                 | 103           |
|    n_updates            | 8590          |
|    policy_gradient_loss | 0.000116      |
|    value_loss           | 212           |
-------------------------------------------
-----------------------------------------
| time/                   |             |
|    fps                  | 79          |
|    iterations           | 861         |
|    time_elapsed         | 5519        

-------------------------------------------
| time/                   |               |
|    fps                  | 79            |
|    iterations           | 871           |
|    time_elapsed         | 5588          |
|    total_timesteps      | 445952        |
| train/                  |               |
|    approx_kl            | 0.00095472776 |
|    clip_fraction        | 0.024         |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.316        |
|    explained_variance   | 0.733         |
|    learning_rate        | 1e-06         |
|    loss                 | 55.1          |
|    n_updates            | 8700          |
|    policy_gradient_loss | -0.00192      |
|    value_loss           | 137           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 79            |
|    iterations           | 872           |
|    time_elapsed         | 5595

------------------------------------------
| time/                   |              |
|    fps                  | 79           |
|    iterations           | 882          |
|    time_elapsed         | 5662         |
|    total_timesteps      | 451584       |
| train/                  |              |
|    approx_kl            | 0.0020447061 |
|    clip_fraction        | 0.0166       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.499       |
|    explained_variance   | 0.797        |
|    learning_rate        | 1e-06        |
|    loss                 | 87.5         |
|    n_updates            | 8810         |
|    policy_gradient_loss | -0.00239     |
|    value_loss           | 158          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 79            |
|    iterations           | 883           |
|    time_elapsed         | 5669          |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 79           |
|    iterations           | 893          |
|    time_elapsed         | 5737         |
|    total_timesteps      | 457216       |
| train/                  |              |
|    approx_kl            | 0.0004251767 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.778       |
|    explained_variance   | 0.716        |
|    learning_rate        | 1e-06        |
|    loss                 | 113          |
|    n_updates            | 8920         |
|    policy_gradient_loss | 0.00018      |
|    value_loss           | 184          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 79            |
|    iterations           | 894           |
|    time_elapsed         | 5744          |
|    t

-----------------------------------------
| time/                   |             |
|    fps                  | 79          |
|    iterations           | 904         |
|    time_elapsed         | 5812        |
|    total_timesteps      | 462848      |
| train/                  |             |
|    approx_kl            | 0.003743987 |
|    clip_fraction        | 0.0043      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.835      |
|    explained_variance   | 0.759       |
|    learning_rate        | 1e-06       |
|    loss                 | 97.5        |
|    n_updates            | 9030        |
|    policy_gradient_loss | -0.00322    |
|    value_loss           | 216         |
-----------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 79           |
|    iterations           | 905          |
|    time_elapsed         | 5818         |
|    total_timesteps      | 4

-------------------------------------------
| time/                   |               |
|    fps                  | 79            |
|    iterations           | 915           |
|    time_elapsed         | 5887          |
|    total_timesteps      | 468480        |
| train/                  |               |
|    approx_kl            | 0.00018767256 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.787        |
|    explained_variance   | 0.668         |
|    learning_rate        | 1e-06         |
|    loss                 | 46.5          |
|    n_updates            | 9140          |
|    policy_gradient_loss | -6.95e-05     |
|    value_loss           | 128           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 79           |
|    iterations           | 916          |
|    time_elapsed         | 5893    

------------------------------------------
| time/                   |              |
|    fps                  | 79           |
|    iterations           | 926          |
|    time_elapsed         | 5960         |
|    total_timesteps      | 474112       |
| train/                  |              |
|    approx_kl            | 0.0052830945 |
|    clip_fraction        | 0.0127       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.68        |
|    explained_variance   | 0.541        |
|    learning_rate        | 1e-06        |
|    loss                 | 36.9         |
|    n_updates            | 9250         |
|    policy_gradient_loss | -0.00264     |
|    value_loss           | 314          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 79            |
|    iterations           | 927           |
|    time_elapsed         | 5966          |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 79            |
|    iterations           | 937           |
|    time_elapsed         | 6034          |
|    total_timesteps      | 479744        |
| train/                  |               |
|    approx_kl            | 0.00020378479 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.677        |
|    explained_variance   | 0.464         |
|    learning_rate        | 1e-06         |
|    loss                 | 212           |
|    n_updates            | 9360          |
|    policy_gradient_loss | 0.000228      |
|    value_loss           | 617           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 79            |
|    iterations           | 938           |
|    time_elapsed         | 6041

-----------------------------------------
| time/                   |             |
|    fps                  | 79          |
|    iterations           | 948         |
|    time_elapsed         | 6113        |
|    total_timesteps      | 485376      |
| train/                  |             |
|    approx_kl            | 0.003089203 |
|    clip_fraction        | 0.00645     |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.661      |
|    explained_variance   | 0.675       |
|    learning_rate        | 1e-06       |
|    loss                 | 101         |
|    n_updates            | 9470        |
|    policy_gradient_loss | -0.00269    |
|    value_loss           | 323         |
-----------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 79           |
|    iterations           | 949          |
|    time_elapsed         | 6120         |
|    total_timesteps      | 4

------------------------------------------
| time/                   |              |
|    fps                  | 79           |
|    iterations           | 959          |
|    time_elapsed         | 6189         |
|    total_timesteps      | 491008       |
| train/                  |              |
|    approx_kl            | 0.0011713316 |
|    clip_fraction        | 0.0191       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.535       |
|    explained_variance   | 0.177        |
|    learning_rate        | 1e-06        |
|    loss                 | 130          |
|    n_updates            | 9580         |
|    policy_gradient_loss | -0.000311    |
|    value_loss           | 207          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 79            |
|    iterations           | 960           |
|    time_elapsed         | 6196          |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 79            |
|    iterations           | 970           |
|    time_elapsed         | 6265          |
|    total_timesteps      | 496640        |
| train/                  |               |
|    approx_kl            | 0.00022472546 |
|    clip_fraction        | 0.00137       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.346        |
|    explained_variance   | 0.687         |
|    learning_rate        | 1e-06         |
|    loss                 | 60.8          |
|    n_updates            | 9690          |
|    policy_gradient_loss | -3.2e-05      |
|    value_loss           | 123           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 79           |
|    iterations           | 971          |
|    time_elapsed         | 6272    

------------------------------------------
| time/                   |              |
|    fps                  | 79           |
|    iterations           | 981          |
|    time_elapsed         | 6340         |
|    total_timesteps      | 502272       |
| train/                  |              |
|    approx_kl            | 5.244941e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.26        |
|    explained_variance   | 0.526        |
|    learning_rate        | 1e-06        |
|    loss                 | 431          |
|    n_updates            | 9800         |
|    policy_gradient_loss | 9.88e-05     |
|    value_loss           | 706          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 79           |
|    iterations           | 982          |
|    time_elapsed         | 6347         |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 79            |
|    iterations           | 992           |
|    time_elapsed         | 6413          |
|    total_timesteps      | 507904        |
| train/                  |               |
|    approx_kl            | 0.00023169233 |
|    clip_fraction        | 0.00391       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.188        |
|    explained_variance   | 0.776         |
|    learning_rate        | 1e-06         |
|    loss                 | 68.1          |
|    n_updates            | 9910          |
|    policy_gradient_loss | -0.00169      |
|    value_loss           | 179           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 79            |
|    iterations           | 993           |
|    time_elapsed         | 6420

------------------------------------------
| time/                   |              |
|    fps                  | 79           |
|    iterations           | 1003         |
|    time_elapsed         | 6492         |
|    total_timesteps      | 513536       |
| train/                  |              |
|    approx_kl            | 0.0015788905 |
|    clip_fraction        | 0.0154       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.275       |
|    explained_variance   | 0.867        |
|    learning_rate        | 1e-06        |
|    loss                 | 58.8         |
|    n_updates            | 10020        |
|    policy_gradient_loss | -0.00209     |
|    value_loss           | 165          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 79           |
|    iterations           | 1004         |
|    time_elapsed         | 6499         |
|    total_

-----------------------------------------
| time/                   |             |
|    fps                  | 79          |
|    iterations           | 1014        |
|    time_elapsed         | 6569        |
|    total_timesteps      | 519168      |
| train/                  |             |
|    approx_kl            | 0.001949615 |
|    clip_fraction        | 0.0127      |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.335      |
|    explained_variance   | 0.873       |
|    learning_rate        | 1e-06       |
|    loss                 | 92.7        |
|    n_updates            | 10130       |
|    policy_gradient_loss | -0.000874   |
|    value_loss           | 223         |
-----------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 79            |
|    iterations           | 1015          |
|    time_elapsed         | 6576          |
|    total_timesteps    

-------------------------------------------
| time/                   |               |
|    fps                  | 78            |
|    iterations           | 1025          |
|    time_elapsed         | 6646          |
|    total_timesteps      | 524800        |
| train/                  |               |
|    approx_kl            | 0.00082924066 |
|    clip_fraction        | 0.00605       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.364        |
|    explained_variance   | 0.921         |
|    learning_rate        | 1e-06         |
|    loss                 | 31.7          |
|    n_updates            | 10240         |
|    policy_gradient_loss | -0.00153      |
|    value_loss           | 79.9          |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 78           |
|    iterations           | 1026         |
|    time_elapsed         | 6653    

------------------------------------------
| time/                   |              |
|    fps                  | 78           |
|    iterations           | 1036         |
|    time_elapsed         | 6722         |
|    total_timesteps      | 530432       |
| train/                  |              |
|    approx_kl            | 0.0026651323 |
|    clip_fraction        | 0.023        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.362       |
|    explained_variance   | -0.239       |
|    learning_rate        | 1e-06        |
|    loss                 | 143          |
|    n_updates            | 10350        |
|    policy_gradient_loss | -0.00264     |
|    value_loss           | 291          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 78           |
|    iterations           | 1037         |
|    time_elapsed         | 6730         |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 78            |
|    iterations           | 1047          |
|    time_elapsed         | 6801          |
|    total_timesteps      | 536064        |
| train/                  |               |
|    approx_kl            | 0.00038500794 |
|    clip_fraction        | 0.00605       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.207        |
|    explained_variance   | 0.681         |
|    learning_rate        | 1e-06         |
|    loss                 | 353           |
|    n_updates            | 10460         |
|    policy_gradient_loss | -0.000513     |
|    value_loss           | 522           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 78            |
|    iterations           | 1048          |
|    time_elapsed         | 6808

-------------------------------------------
| time/                   |               |
|    fps                  | 78            |
|    iterations           | 1058          |
|    time_elapsed         | 6879          |
|    total_timesteps      | 541696        |
| train/                  |               |
|    approx_kl            | 1.9541243e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.184        |
|    explained_variance   | 0.852         |
|    learning_rate        | 1e-06         |
|    loss                 | 69.6          |
|    n_updates            | 10570         |
|    policy_gradient_loss | -8.42e-05     |
|    value_loss           | 156           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 78           |
|    iterations           | 1059         |
|    time_elapsed         | 6886    

------------------------------------------
| time/                   |              |
|    fps                  | 78           |
|    iterations           | 1069         |
|    time_elapsed         | 6954         |
|    total_timesteps      | 547328       |
| train/                  |              |
|    approx_kl            | 0.0013917709 |
|    clip_fraction        | 0.0041       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.366       |
|    explained_variance   | 0.768        |
|    learning_rate        | 1e-06        |
|    loss                 | 112          |
|    n_updates            | 10680        |
|    policy_gradient_loss | -0.00318     |
|    value_loss           | 374          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 78            |
|    iterations           | 1070          |
|    time_elapsed         | 6961          |
|    t

-----------------------------------------
| time/                   |             |
|    fps                  | 78          |
|    iterations           | 1080        |
|    time_elapsed         | 7032        |
|    total_timesteps      | 552960      |
| train/                  |             |
|    approx_kl            | 0.011526136 |
|    clip_fraction        | 0.0193      |
|    clip_range           | 0.2         |
|    entropy_loss         | -1.6        |
|    explained_variance   | -0.66       |
|    learning_rate        | 1e-06       |
|    loss                 | 1.3         |
|    n_updates            | 10790       |
|    policy_gradient_loss | -0.00481    |
|    value_loss           | 6.62        |
-----------------------------------------
-----------------------------------------
| time/                   |             |
|    fps                  | 78          |
|    iterations           | 1081        |
|    time_elapsed         | 7039        |
|    total_timesteps      | 553472

------------------------------------------
| time/                   |              |
|    fps                  | 78           |
|    iterations           | 1091         |
|    time_elapsed         | 7106         |
|    total_timesteps      | 558592       |
| train/                  |              |
|    approx_kl            | 0.0024206708 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.64        |
|    explained_variance   | -0.163       |
|    learning_rate        | 1e-06        |
|    loss                 | 0.145        |
|    n_updates            | 10900        |
|    policy_gradient_loss | -0.00306     |
|    value_loss           | 0.474        |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 78           |
|    iterations           | 1092         |
|    time_elapsed         | 7113         |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 78            |
|    iterations           | 1102          |
|    time_elapsed         | 7181          |
|    total_timesteps      | 564224        |
| train/                  |               |
|    approx_kl            | 0.00014581054 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.351        |
|    explained_variance   | 0.804         |
|    learning_rate        | 1e-06         |
|    loss                 | 67.8          |
|    n_updates            | 11010         |
|    policy_gradient_loss | 5.65e-05      |
|    value_loss           | 111           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 78            |
|    iterations           | 1103          |
|    time_elapsed         | 7188

-------------------------------------------
| time/                   |               |
|    fps                  | 78            |
|    iterations           | 1113          |
|    time_elapsed         | 7259          |
|    total_timesteps      | 569856        |
| train/                  |               |
|    approx_kl            | 0.00046258897 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.458        |
|    explained_variance   | 0.634         |
|    learning_rate        | 1e-06         |
|    loss                 | 130           |
|    n_updates            | 11120         |
|    policy_gradient_loss | -0.000586     |
|    value_loss           | 338           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 78            |
|    iterations           | 1114          |
|    time_elapsed         | 7265

--------------------------------------------
| time/                   |                |
|    fps                  | 78             |
|    iterations           | 1124           |
|    time_elapsed         | 7334           |
|    total_timesteps      | 575488         |
| train/                  |                |
|    approx_kl            | 1.40634365e-05 |
|    clip_fraction        | 0              |
|    clip_range           | 0.2            |
|    entropy_loss         | -0.29          |
|    explained_variance   | 0.755          |
|    learning_rate        | 1e-06          |
|    loss                 | 41.3           |
|    n_updates            | 11230          |
|    policy_gradient_loss | 5.41e-05       |
|    value_loss           | 93.8           |
--------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 78            |
|    iterations           | 1125          |
|    time_elap

------------------------------------------
| time/                   |              |
|    fps                  | 78           |
|    iterations           | 1135         |
|    time_elapsed         | 7411         |
|    total_timesteps      | 581120       |
| train/                  |              |
|    approx_kl            | 0.0006318453 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.42        |
|    explained_variance   | 0.766        |
|    learning_rate        | 1e-06        |
|    loss                 | 82.9         |
|    n_updates            | 11340        |
|    policy_gradient_loss | -0.000322    |
|    value_loss           | 160          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 78            |
|    iterations           | 1136          |
|    time_elapsed         | 7419          |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 78            |
|    iterations           | 1146          |
|    time_elapsed         | 7486          |
|    total_timesteps      | 586752        |
| train/                  |               |
|    approx_kl            | 0.00074760383 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.412        |
|    explained_variance   | 0.839         |
|    learning_rate        | 1e-06         |
|    loss                 | 60.1          |
|    n_updates            | 11450         |
|    policy_gradient_loss | -0.000324     |
|    value_loss           | 145           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 78           |
|    iterations           | 1147         |
|    time_elapsed         | 7493    

------------------------------------------
| time/                   |              |
|    fps                  | 78           |
|    iterations           | 1157         |
|    time_elapsed         | 7560         |
|    total_timesteps      | 592384       |
| train/                  |              |
|    approx_kl            | 0.0013638558 |
|    clip_fraction        | 0.0109       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.368       |
|    explained_variance   | 0.613        |
|    learning_rate        | 1e-06        |
|    loss                 | 170          |
|    n_updates            | 11560        |
|    policy_gradient_loss | -0.00181     |
|    value_loss           | 291          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 78            |
|    iterations           | 1158          |
|    time_elapsed         | 7567          |
|    t

--------------------------------------------
| time/                   |                |
|    fps                  | 78             |
|    iterations           | 1168           |
|    time_elapsed         | 7635           |
|    total_timesteps      | 598016         |
| train/                  |                |
|    approx_kl            | 0.000105767045 |
|    clip_fraction        | 0              |
|    clip_range           | 0.2            |
|    entropy_loss         | -0.198         |
|    explained_variance   | 0.903          |
|    learning_rate        | 1e-06          |
|    loss                 | 87             |
|    n_updates            | 11670          |
|    policy_gradient_loss | -0.00018       |
|    value_loss           | 152            |
--------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 78           |
|    iterations           | 1169         |
|    time_elapsed 

-------------------------------------------
| time/                   |               |
|    fps                  | 78            |
|    iterations           | 1179          |
|    time_elapsed         | 7709          |
|    total_timesteps      | 603648        |
| train/                  |               |
|    approx_kl            | 0.00035934534 |
|    clip_fraction        | 0.000586      |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.135        |
|    explained_variance   | 0.804         |
|    learning_rate        | 1e-06         |
|    loss                 | 72.2          |
|    n_updates            | 11780         |
|    policy_gradient_loss | -0.000485     |
|    value_loss           | 172           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 78            |
|    iterations           | 1180          |
|    time_elapsed         | 7716

-------------------------------------------
| time/                   |               |
|    fps                  | 78            |
|    iterations           | 1190          |
|    time_elapsed         | 7783          |
|    total_timesteps      | 609280        |
| train/                  |               |
|    approx_kl            | 0.00046491716 |
|    clip_fraction        | 0.00293       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.111        |
|    explained_variance   | 0.902         |
|    learning_rate        | 1e-06         |
|    loss                 | 63.1          |
|    n_updates            | 11890         |
|    policy_gradient_loss | -0.000682     |
|    value_loss           | 145           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 78            |
|    iterations           | 1191          |
|    time_elapsed         | 7789

------------------------------------------
| time/                   |              |
|    fps                  | 78           |
|    iterations           | 1201         |
|    time_elapsed         | 7856         |
|    total_timesteps      | 614912       |
| train/                  |              |
|    approx_kl            | 0.0005330398 |
|    clip_fraction        | 0.00332      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.0956      |
|    explained_variance   | 0.898        |
|    learning_rate        | 1e-06        |
|    loss                 | 53.3         |
|    n_updates            | 12000        |
|    policy_gradient_loss | -0.000941    |
|    value_loss           | 114          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 78            |
|    iterations           | 1202          |
|    time_elapsed         | 7863          |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 78            |
|    iterations           | 1212          |
|    time_elapsed         | 7934          |
|    total_timesteps      | 620544        |
| train/                  |               |
|    approx_kl            | 4.8801303e-07 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.0723       |
|    explained_variance   | 0.465         |
|    learning_rate        | 1e-06         |
|    loss                 | 148           |
|    n_updates            | 12110         |
|    policy_gradient_loss | 3.43e-05      |
|    value_loss           | 433           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 78            |
|    iterations           | 1213          |
|    time_elapsed         | 7941

------------------------------------------
| time/                   |              |
|    fps                  | 78           |
|    iterations           | 1223         |
|    time_elapsed         | 8011         |
|    total_timesteps      | 626176       |
| train/                  |              |
|    approx_kl            | 0.0005622783 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.212       |
|    explained_variance   | 0.839        |
|    learning_rate        | 1e-06        |
|    loss                 | 198          |
|    n_updates            | 12220        |
|    policy_gradient_loss | -0.000169    |
|    value_loss           | 361          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 78            |
|    iterations           | 1224          |
|    time_elapsed         | 8018          |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 78           |
|    iterations           | 1234         |
|    time_elapsed         | 8088         |
|    total_timesteps      | 631808       |
| train/                  |              |
|    approx_kl            | 0.0010541026 |
|    clip_fraction        | 0.0252       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.243       |
|    explained_variance   | 0.885        |
|    learning_rate        | 1e-06        |
|    loss                 | 43.1         |
|    n_updates            | 12330        |
|    policy_gradient_loss | -0.00224     |
|    value_loss           | 109          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 78           |
|    iterations           | 1235         |
|    time_elapsed         | 8095         |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 78           |
|    iterations           | 1245         |
|    time_elapsed         | 8165         |
|    total_timesteps      | 637440       |
| train/                  |              |
|    approx_kl            | 0.0008473715 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.471       |
|    explained_variance   | 0.784        |
|    learning_rate        | 1e-06        |
|    loss                 | 172          |
|    n_updates            | 12440        |
|    policy_gradient_loss | -0.000703    |
|    value_loss           | 250          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 78           |
|    iterations           | 1246         |
|    time_elapsed         | 8172         |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 78            |
|    iterations           | 1256          |
|    time_elapsed         | 8243          |
|    total_timesteps      | 643072        |
| train/                  |               |
|    approx_kl            | 0.00027170847 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.239        |
|    explained_variance   | 0.892         |
|    learning_rate        | 1e-06         |
|    loss                 | 32.1          |
|    n_updates            | 12550         |
|    policy_gradient_loss | -0.000102     |
|    value_loss           | 109           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 78            |
|    iterations           | 1257          |
|    time_elapsed         | 8250

-------------------------------------------
| time/                   |               |
|    fps                  | 77            |
|    iterations           | 1267          |
|    time_elapsed         | 8319          |
|    total_timesteps      | 648704        |
| train/                  |               |
|    approx_kl            | 0.00035866187 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.174        |
|    explained_variance   | 0.67          |
|    learning_rate        | 1e-06         |
|    loss                 | 234           |
|    n_updates            | 12660         |
|    policy_gradient_loss | -0.000415     |
|    value_loss           | 278           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 77            |
|    iterations           | 1268          |
|    time_elapsed         | 8327

------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1278         |
|    time_elapsed         | 8397         |
|    total_timesteps      | 654336       |
| train/                  |              |
|    approx_kl            | 0.0018062589 |
|    clip_fraction        | 0.00527      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.333       |
|    explained_variance   | 0.921        |
|    learning_rate        | 1e-06        |
|    loss                 | 47.6         |
|    n_updates            | 12770        |
|    policy_gradient_loss | -0.00088     |
|    value_loss           | 118          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 77            |
|    iterations           | 1279          |
|    time_elapsed         | 8405          |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1289         |
|    time_elapsed         | 8477         |
|    total_timesteps      | 659968       |
| train/                  |              |
|    approx_kl            | 0.0001268289 |
|    clip_fraction        | 0.000977     |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.327       |
|    explained_variance   | 0.568        |
|    learning_rate        | 1e-06        |
|    loss                 | 8.04         |
|    n_updates            | 12880        |
|    policy_gradient_loss | -0.000306    |
|    value_loss           | 30.6         |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1290         |
|    time_elapsed         | 8484         |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1300         |
|    time_elapsed         | 8554         |
|    total_timesteps      | 665600       |
| train/                  |              |
|    approx_kl            | 0.0022134176 |
|    clip_fraction        | 0.0107       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.38        |
|    explained_variance   | 0.574        |
|    learning_rate        | 1e-06        |
|    loss                 | 185          |
|    n_updates            | 12990        |
|    policy_gradient_loss | -0.00206     |
|    value_loss           | 542          |
------------------------------------------
-----------------------------------------
| time/                   |             |
|    fps                  | 77          |
|    iterations           | 1301        |
|    time_elapsed         | 8562        |
|    total_times

-----------------------------------------
| time/                   |             |
|    fps                  | 77          |
|    iterations           | 1311        |
|    time_elapsed         | 8630        |
|    total_timesteps      | 671232      |
| train/                  |             |
|    approx_kl            | 0.003440625 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.426      |
|    explained_variance   | 0.908       |
|    learning_rate        | 1e-06       |
|    loss                 | 77.1        |
|    n_updates            | 13100       |
|    policy_gradient_loss | -0.0012     |
|    value_loss           | 141         |
-----------------------------------------
-----------------------------------------
| time/                   |             |
|    fps                  | 77          |
|    iterations           | 1312        |
|    time_elapsed         | 8637        |
|    total_timesteps      | 671744

------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1322         |
|    time_elapsed         | 8707         |
|    total_timesteps      | 676864       |
| train/                  |              |
|    approx_kl            | 9.800657e-06 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.382       |
|    explained_variance   | -0.203       |
|    learning_rate        | 1e-06        |
|    loss                 | 381          |
|    n_updates            | 13210        |
|    policy_gradient_loss | 2.92e-05     |
|    value_loss           | 861          |
------------------------------------------
----------------------------------------
| time/                   |            |
|    fps                  | 77         |
|    iterations           | 1323       |
|    time_elapsed         | 8715       |
|    total_timesteps 

-------------------------------------------
| time/                   |               |
|    fps                  | 77            |
|    iterations           | 1333          |
|    time_elapsed         | 8784          |
|    total_timesteps      | 682496        |
| train/                  |               |
|    approx_kl            | 0.00026175322 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.358        |
|    explained_variance   | 0.818         |
|    learning_rate        | 1e-06         |
|    loss                 | 237           |
|    n_updates            | 13320         |
|    policy_gradient_loss | -0.000304     |
|    value_loss           | 291           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 77            |
|    iterations           | 1334          |
|    time_elapsed         | 8791

---------------------------------------
| time/                   |           |
|    fps                  | 77        |
|    iterations           | 1344      |
|    time_elapsed         | 8860      |
|    total_timesteps      | 688128    |
| train/                  |           |
|    approx_kl            | 0.0019786 |
|    clip_fraction        | 0.0219    |
|    clip_range           | 0.2       |
|    entropy_loss         | -0.251    |
|    explained_variance   | 0.885     |
|    learning_rate        | 1e-06     |
|    loss                 | 51.4      |
|    n_updates            | 13430     |
|    policy_gradient_loss | -0.00242  |
|    value_loss           | 142       |
---------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 77            |
|    iterations           | 1345          |
|    time_elapsed         | 8867          |
|    total_timesteps      | 688640        |
| train/        

------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1355         |
|    time_elapsed         | 8935         |
|    total_timesteps      | 693760       |
| train/                  |              |
|    approx_kl            | 0.0013879648 |
|    clip_fraction        | 0.0152       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.19        |
|    explained_variance   | 0.766        |
|    learning_rate        | 1e-06        |
|    loss                 | 74.9         |
|    n_updates            | 13540        |
|    policy_gradient_loss | -0.00131     |
|    value_loss           | 145          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1356         |
|    time_elapsed         | 8941         |
|    total_

-----------------------------------------
| time/                   |             |
|    fps                  | 77          |
|    iterations           | 1366        |
|    time_elapsed         | 9011        |
|    total_timesteps      | 699392      |
| train/                  |             |
|    approx_kl            | 5.35571e-05 |
|    clip_fraction        | 0           |
|    clip_range           | 0.2         |
|    entropy_loss         | -0.19       |
|    explained_variance   | 0.85        |
|    learning_rate        | 1e-06       |
|    loss                 | 185         |
|    n_updates            | 13650       |
|    policy_gradient_loss | -6.18e-05   |
|    value_loss           | 374         |
-----------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1367         |
|    time_elapsed         | 9018         |
|    total_timesteps      | 6

-------------------------------------------
| time/                   |               |
|    fps                  | 77            |
|    iterations           | 1377          |
|    time_elapsed         | 9088          |
|    total_timesteps      | 705024        |
| train/                  |               |
|    approx_kl            | 5.5882847e-06 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.143        |
|    explained_variance   | 0.651         |
|    learning_rate        | 1e-06         |
|    loss                 | 415           |
|    n_updates            | 13760         |
|    policy_gradient_loss | -1.29e-05     |
|    value_loss           | 535           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 77            |
|    iterations           | 1378          |
|    time_elapsed         | 9095

------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1388         |
|    time_elapsed         | 9164         |
|    total_timesteps      | 710656       |
| train/                  |              |
|    approx_kl            | 0.0009466553 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.22        |
|    explained_variance   | 0.768        |
|    learning_rate        | 1e-06        |
|    loss                 | 143          |
|    n_updates            | 13870        |
|    policy_gradient_loss | -0.000301    |
|    value_loss           | 399          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 77            |
|    iterations           | 1389          |
|    time_elapsed         | 9171          |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1399         |
|    time_elapsed         | 9238         |
|    total_timesteps      | 716288       |
| train/                  |              |
|    approx_kl            | 0.0013167929 |
|    clip_fraction        | 0.0254       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.154       |
|    explained_variance   | 0.82         |
|    learning_rate        | 1e-06        |
|    loss                 | 77.2         |
|    n_updates            | 13980        |
|    policy_gradient_loss | -0.00269     |
|    value_loss           | 186          |
------------------------------------------
-----------------------------------------
| time/                   |             |
|    fps                  | 77          |
|    iterations           | 1400        |
|    time_elapsed         | 9245        |
|    total_times

-------------------------------------------
| time/                   |               |
|    fps                  | 77            |
|    iterations           | 1410          |
|    time_elapsed         | 9312          |
|    total_timesteps      | 721920        |
| train/                  |               |
|    approx_kl            | 3.7518214e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.177        |
|    explained_variance   | 0.772         |
|    learning_rate        | 1e-06         |
|    loss                 | 89.6          |
|    n_updates            | 14090         |
|    policy_gradient_loss | 1.87e-05      |
|    value_loss           | 205           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 77            |
|    iterations           | 1411          |
|    time_elapsed         | 9319

-------------------------------------------
| time/                   |               |
|    fps                  | 77            |
|    iterations           | 1421          |
|    time_elapsed         | 9387          |
|    total_timesteps      | 727552        |
| train/                  |               |
|    approx_kl            | 2.9161107e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.171        |
|    explained_variance   | 0.747         |
|    learning_rate        | 1e-06         |
|    loss                 | 117           |
|    n_updates            | 14200         |
|    policy_gradient_loss | 0.000101      |
|    value_loss           | 242           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 77            |
|    iterations           | 1422          |
|    time_elapsed         | 9394

------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1432         |
|    time_elapsed         | 9465         |
|    total_timesteps      | 733184       |
| train/                  |              |
|    approx_kl            | 0.0014415476 |
|    clip_fraction        | 0.0193       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.166       |
|    explained_variance   | 0.447        |
|    learning_rate        | 1e-06        |
|    loss                 | 358          |
|    n_updates            | 14310        |
|    policy_gradient_loss | -0.00156     |
|    value_loss           | 639          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 77            |
|    iterations           | 1433          |
|    time_elapsed         | 9473          |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1443         |
|    time_elapsed         | 9542         |
|    total_timesteps      | 738816       |
| train/                  |              |
|    approx_kl            | 0.0005559431 |
|    clip_fraction        | 0.0113       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.188       |
|    explained_variance   | 0.761        |
|    learning_rate        | 1e-06        |
|    loss                 | 282          |
|    n_updates            | 14420        |
|    policy_gradient_loss | -0.00102     |
|    value_loss           | 410          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1444         |
|    time_elapsed         | 9549         |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1454         |
|    time_elapsed         | 9619         |
|    total_timesteps      | 744448       |
| train/                  |              |
|    approx_kl            | 0.0008360428 |
|    clip_fraction        | 0.0043       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.206       |
|    explained_variance   | 0.812        |
|    learning_rate        | 1e-06        |
|    loss                 | 119          |
|    n_updates            | 14530        |
|    policy_gradient_loss | -0.000171    |
|    value_loss           | 262          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1455         |
|    time_elapsed         | 9625         |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1465         |
|    time_elapsed         | 9692         |
|    total_timesteps      | 750080       |
| train/                  |              |
|    approx_kl            | 0.0034054038 |
|    clip_fraction        | 0.0385       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.273       |
|    explained_variance   | 0.925        |
|    learning_rate        | 1e-06        |
|    loss                 | 83.7         |
|    n_updates            | 14640        |
|    policy_gradient_loss | -0.00227     |
|    value_loss           | 208          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1466         |
|    time_elapsed         | 9698         |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1476         |
|    time_elapsed         | 9765         |
|    total_timesteps      | 755712       |
| train/                  |              |
|    approx_kl            | 0.0024265395 |
|    clip_fraction        | 0.0084       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.389       |
|    explained_variance   | 0.579        |
|    learning_rate        | 1e-06        |
|    loss                 | 260          |
|    n_updates            | 14750        |
|    policy_gradient_loss | -0.00131     |
|    value_loss           | 653          |
------------------------------------------
-----------------------------------------
| time/                   |             |
|    fps                  | 77          |
|    iterations           | 1477        |
|    time_elapsed         | 9771        |
|    total_times

-------------------------------------------
| time/                   |               |
|    fps                  | 77            |
|    iterations           | 1487          |
|    time_elapsed         | 9839          |
|    total_timesteps      | 761344        |
| train/                  |               |
|    approx_kl            | 0.00010676938 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.248        |
|    explained_variance   | 0.744         |
|    learning_rate        | 1e-06         |
|    loss                 | 92.3          |
|    n_updates            | 14860         |
|    policy_gradient_loss | 7.19e-05      |
|    value_loss           | 163           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1488         |
|    time_elapsed         | 9846    

------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1498         |
|    time_elapsed         | 9915         |
|    total_timesteps      | 766976       |
| train/                  |              |
|    approx_kl            | 0.0015971405 |
|    clip_fraction        | 0.0164       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.238       |
|    explained_variance   | 0.819        |
|    learning_rate        | 1e-06        |
|    loss                 | 51           |
|    n_updates            | 14970        |
|    policy_gradient_loss | -0.00264     |
|    value_loss           | 158          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1499         |
|    time_elapsed         | 9922         |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 77            |
|    iterations           | 1509          |
|    time_elapsed         | 9991          |
|    total_timesteps      | 772608        |
| train/                  |               |
|    approx_kl            | 0.00015297101 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.18         |
|    explained_variance   | 0.365         |
|    learning_rate        | 1e-06         |
|    loss                 | 94.8          |
|    n_updates            | 15080         |
|    policy_gradient_loss | 7.64e-05      |
|    value_loss           | 661           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1510         |
|    time_elapsed         | 9998    

------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1520         |
|    time_elapsed         | 10067        |
|    total_timesteps      | 778240       |
| train/                  |              |
|    approx_kl            | 0.0008822117 |
|    clip_fraction        | 0.0195       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.211       |
|    explained_variance   | 0.729        |
|    learning_rate        | 1e-06        |
|    loss                 | 80.8         |
|    n_updates            | 15190        |
|    policy_gradient_loss | -0.00271     |
|    value_loss           | 157          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1521         |
|    time_elapsed         | 10073        |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 77            |
|    iterations           | 1531          |
|    time_elapsed         | 10141         |
|    total_timesteps      | 783872        |
| train/                  |               |
|    approx_kl            | 0.00032706955 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.226        |
|    explained_variance   | 0.847         |
|    learning_rate        | 1e-06         |
|    loss                 | 76.4          |
|    n_updates            | 15300         |
|    policy_gradient_loss | -0.000551     |
|    value_loss           | 134           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1532         |
|    time_elapsed         | 10148   

-------------------------------------------
| time/                   |               |
|    fps                  | 77            |
|    iterations           | 1542          |
|    time_elapsed         | 10218         |
|    total_timesteps      | 789504        |
| train/                  |               |
|    approx_kl            | 0.00028577528 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.217        |
|    explained_variance   | 0.816         |
|    learning_rate        | 1e-06         |
|    loss                 | 72.3          |
|    n_updates            | 15410         |
|    policy_gradient_loss | -0.000208     |
|    value_loss           | 145           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1543         |
|    time_elapsed         | 10225   

-------------------------------------------
| time/                   |               |
|    fps                  | 77            |
|    iterations           | 1553          |
|    time_elapsed         | 10293         |
|    total_timesteps      | 795136        |
| train/                  |               |
|    approx_kl            | 0.00050752447 |
|    clip_fraction        | 0.00664       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.191        |
|    explained_variance   | 0.886         |
|    learning_rate        | 1e-06         |
|    loss                 | 55.5          |
|    n_updates            | 15520         |
|    policy_gradient_loss | -0.000936     |
|    value_loss           | 128           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 77            |
|    iterations           | 1554          |
|    time_elapsed         | 1030

------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1564         |
|    time_elapsed         | 10369        |
|    total_timesteps      | 800768       |
| train/                  |              |
|    approx_kl            | 0.0011708979 |
|    clip_fraction        | 0.00547      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.241       |
|    explained_variance   | 0.862        |
|    learning_rate        | 1e-06        |
|    loss                 | 20.1         |
|    n_updates            | 15630        |
|    policy_gradient_loss | -0.00092     |
|    value_loss           | 55.3         |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 77            |
|    iterations           | 1565          |
|    time_elapsed         | 10376         |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1575         |
|    time_elapsed         | 10444        |
|    total_timesteps      | 806400       |
| train/                  |              |
|    approx_kl            | 0.0017814375 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.38        |
|    explained_variance   | -0.585       |
|    learning_rate        | 1e-06        |
|    loss                 | 8.5          |
|    n_updates            | 15740        |
|    policy_gradient_loss | -0.000576    |
|    value_loss           | 43.3         |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1576         |
|    time_elapsed         | 10451        |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1586         |
|    time_elapsed         | 10518        |
|    total_timesteps      | 812032       |
| train/                  |              |
|    approx_kl            | 0.0026202146 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.52        |
|    explained_variance   | 0.109        |
|    learning_rate        | 1e-06        |
|    loss                 | 0.158        |
|    n_updates            | 15850        |
|    policy_gradient_loss | -0.00197     |
|    value_loss           | 0.841        |
------------------------------------------
-----------------------------------------
| time/                   |             |
|    fps                  | 77          |
|    iterations           | 1587        |
|    time_elapsed         | 10525       |
|    total_times

------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1597         |
|    time_elapsed         | 10592        |
|    total_timesteps      | 817664       |
| train/                  |              |
|    approx_kl            | 0.0039905324 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.55        |
|    explained_variance   | -0.0648      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0509       |
|    n_updates            | 15960        |
|    policy_gradient_loss | -0.00371     |
|    value_loss           | 0.116        |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 77            |
|    iterations           | 1598          |
|    time_elapsed         | 10599         |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1608         |
|    time_elapsed         | 10666        |
|    total_timesteps      | 823296       |
| train/                  |              |
|    approx_kl            | 8.988334e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.186       |
|    explained_variance   | 0.133        |
|    learning_rate        | 1e-06        |
|    loss                 | 248          |
|    n_updates            | 16070        |
|    policy_gradient_loss | -0.000317    |
|    value_loss           | 624          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 77            |
|    iterations           | 1609          |
|    time_elapsed         | 10673         |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 77            |
|    iterations           | 1619          |
|    time_elapsed         | 10740         |
|    total_timesteps      | 828928        |
| train/                  |               |
|    approx_kl            | 4.3341075e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.187        |
|    explained_variance   | 0.396         |
|    learning_rate        | 1e-06         |
|    loss                 | 498           |
|    n_updates            | 16180         |
|    policy_gradient_loss | -0.000127     |
|    value_loss           | 605           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 77            |
|    iterations           | 1620          |
|    time_elapsed         | 1074

-------------------------------------------
| time/                   |               |
|    fps                  | 77            |
|    iterations           | 1630          |
|    time_elapsed         | 10814         |
|    total_timesteps      | 834560        |
| train/                  |               |
|    approx_kl            | 0.00040464592 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.199        |
|    explained_variance   | 0.644         |
|    learning_rate        | 1e-06         |
|    loss                 | 124           |
|    n_updates            | 16290         |
|    policy_gradient_loss | -0.000122     |
|    value_loss           | 270           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 77            |
|    iterations           | 1631          |
|    time_elapsed         | 1082

------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1641         |
|    time_elapsed         | 10895        |
|    total_timesteps      | 840192       |
| train/                  |              |
|    approx_kl            | 3.181584e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.133       |
|    explained_variance   | 0.648        |
|    learning_rate        | 1e-06        |
|    loss                 | 520          |
|    n_updates            | 16400        |
|    policy_gradient_loss | -0.000166    |
|    value_loss           | 518          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 77            |
|    iterations           | 1642          |
|    time_elapsed         | 10902         |
|    t

----------------------------------------
| time/                   |            |
|    fps                  | 77         |
|    iterations           | 1652       |
|    time_elapsed         | 10970      |
|    total_timesteps      | 845824     |
| train/                  |            |
|    approx_kl            | 0.00019572 |
|    clip_fraction        | 0          |
|    clip_range           | 0.2        |
|    entropy_loss         | -0.162     |
|    explained_variance   | 0.858      |
|    learning_rate        | 1e-06      |
|    loss                 | 140        |
|    n_updates            | 16510      |
|    policy_gradient_loss | 1.51e-05   |
|    value_loss           | 196        |
----------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 77            |
|    iterations           | 1653          |
|    time_elapsed         | 10977         |
|    total_timesteps      | 846336        

------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1663         |
|    time_elapsed         | 11047        |
|    total_timesteps      | 851456       |
| train/                  |              |
|    approx_kl            | 0.0002116703 |
|    clip_fraction        | 0.000391     |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.139       |
|    explained_variance   | 0.772        |
|    learning_rate        | 1e-06        |
|    loss                 | 54.3         |
|    n_updates            | 16620        |
|    policy_gradient_loss | -0.000347    |
|    value_loss           | 150          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1664         |
|    time_elapsed         | 11054        |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1674         |
|    time_elapsed         | 11120        |
|    total_timesteps      | 857088       |
| train/                  |              |
|    approx_kl            | 6.346498e-05 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.185       |
|    explained_variance   | 0.598        |
|    learning_rate        | 1e-06        |
|    loss                 | 61.9         |
|    n_updates            | 16730        |
|    policy_gradient_loss | -0.00013     |
|    value_loss           | 168          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1675         |
|    time_elapsed         | 11127        |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 77            |
|    iterations           | 1685          |
|    time_elapsed         | 11194         |
|    total_timesteps      | 862720        |
| train/                  |               |
|    approx_kl            | 0.00082932133 |
|    clip_fraction        | 0.00742       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.183        |
|    explained_variance   | 0.861         |
|    learning_rate        | 1e-06         |
|    loss                 | 49.1          |
|    n_updates            | 16840         |
|    policy_gradient_loss | -0.000135     |
|    value_loss           | 129           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 77            |
|    iterations           | 1686          |
|    time_elapsed         | 1120

------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1696         |
|    time_elapsed         | 11267        |
|    total_timesteps      | 868352       |
| train/                  |              |
|    approx_kl            | 0.0008046264 |
|    clip_fraction        | 0.00488      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.188       |
|    explained_variance   | 0.931        |
|    learning_rate        | 1e-06        |
|    loss                 | 41           |
|    n_updates            | 16950        |
|    policy_gradient_loss | -0.000459    |
|    value_loss           | 93.6         |
------------------------------------------
-----------------------------------------
| time/                   |             |
|    fps                  | 77          |
|    iterations           | 1697        |
|    time_elapsed         | 11274       |
|    total_times

-------------------------------------------
| time/                   |               |
|    fps                  | 77            |
|    iterations           | 1707          |
|    time_elapsed         | 11343         |
|    total_timesteps      | 873984        |
| train/                  |               |
|    approx_kl            | 4.5025605e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.108        |
|    explained_variance   | 0.901         |
|    learning_rate        | 1e-06         |
|    loss                 | 158           |
|    n_updates            | 17060         |
|    policy_gradient_loss | -0.000233     |
|    value_loss           | 200           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1708         |
|    time_elapsed         | 11350   

------------------------------------------
| time/                   |              |
|    fps                  | 77           |
|    iterations           | 1718         |
|    time_elapsed         | 11419        |
|    total_timesteps      | 879616       |
| train/                  |              |
|    approx_kl            | 0.0012278231 |
|    clip_fraction        | 0.0104       |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.15        |
|    explained_variance   | 0.874        |
|    learning_rate        | 1e-06        |
|    loss                 | 24.5         |
|    n_updates            | 17170        |
|    policy_gradient_loss | -0.00046     |
|    value_loss           | 79           |
------------------------------------------
-----------------------------------------
| time/                   |             |
|    fps                  | 77          |
|    iterations           | 1719        |
|    time_elapsed         | 11427       |
|    total_times

------------------------------------------
| time/                   |              |
|    fps                  | 76           |
|    iterations           | 1729         |
|    time_elapsed         | 11496        |
|    total_timesteps      | 885248       |
| train/                  |              |
|    approx_kl            | 0.0002473205 |
|    clip_fraction        | 0.000586     |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.193       |
|    explained_variance   | 0.893        |
|    learning_rate        | 1e-06        |
|    loss                 | 92           |
|    n_updates            | 17280        |
|    policy_gradient_loss | -0.000267    |
|    value_loss           | 160          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 76           |
|    iterations           | 1730         |
|    time_elapsed         | 11503        |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 76           |
|    iterations           | 1740         |
|    time_elapsed         | 11573        |
|    total_timesteps      | 890880       |
| train/                  |              |
|    approx_kl            | 0.0015559227 |
|    clip_fraction        | 0.016        |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.192       |
|    explained_variance   | 0.819        |
|    learning_rate        | 1e-06        |
|    loss                 | 59.7         |
|    n_updates            | 17390        |
|    policy_gradient_loss | -0.00125     |
|    value_loss           | 195          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 76            |
|    iterations           | 1741          |
|    time_elapsed         | 11580         |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 76           |
|    iterations           | 1751         |
|    time_elapsed         | 11650        |
|    total_timesteps      | 896512       |
| train/                  |              |
|    approx_kl            | 0.0001531206 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.242       |
|    explained_variance   | 0.364        |
|    learning_rate        | 1e-06        |
|    loss                 | 779          |
|    n_updates            | 17500        |
|    policy_gradient_loss | -0.000246    |
|    value_loss           | 608          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 76           |
|    iterations           | 1752         |
|    time_elapsed         | 11657        |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 76            |
|    iterations           | 1762          |
|    time_elapsed         | 11727         |
|    total_timesteps      | 902144        |
| train/                  |               |
|    approx_kl            | 3.0749827e-05 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.256        |
|    explained_variance   | 0.798         |
|    learning_rate        | 1e-06         |
|    loss                 | 42.3          |
|    n_updates            | 17610         |
|    policy_gradient_loss | 0.000122      |
|    value_loss           | 132           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 76            |
|    iterations           | 1763          |
|    time_elapsed         | 1173

------------------------------------------
| time/                   |              |
|    fps                  | 76           |
|    iterations           | 1773         |
|    time_elapsed         | 11803        |
|    total_timesteps      | 907776       |
| train/                  |              |
|    approx_kl            | 0.0008592156 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.194       |
|    explained_variance   | 0.498        |
|    learning_rate        | 1e-06        |
|    loss                 | 218          |
|    n_updates            | 17720        |
|    policy_gradient_loss | -0.000807    |
|    value_loss           | 555          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 76            |
|    iterations           | 1774          |
|    time_elapsed         | 11810         |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 76            |
|    iterations           | 1784          |
|    time_elapsed         | 11879         |
|    total_timesteps      | 913408        |
| train/                  |               |
|    approx_kl            | 0.00042767427 |
|    clip_fraction        | 0.00313       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.264        |
|    explained_variance   | 0.804         |
|    learning_rate        | 1e-06         |
|    loss                 | 159           |
|    n_updates            | 17830         |
|    policy_gradient_loss | -0.000428     |
|    value_loss           | 310           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 76           |
|    iterations           | 1785         |
|    time_elapsed         | 11886   

-------------------------------------------
| time/                   |               |
|    fps                  | 76            |
|    iterations           | 1795          |
|    time_elapsed         | 11956         |
|    total_timesteps      | 919040        |
| train/                  |               |
|    approx_kl            | 0.00068331684 |
|    clip_fraction        | 0.0125        |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.309        |
|    explained_variance   | 0.671         |
|    learning_rate        | 1e-06         |
|    loss                 | 81.5          |
|    n_updates            | 17940         |
|    policy_gradient_loss | -0.000969     |
|    value_loss           | 172           |
-------------------------------------------
-----------------------------------------
| time/                   |             |
|    fps                  | 76          |
|    iterations           | 1796        |
|    time_elapsed         | 11963       

------------------------------------------
| time/                   |              |
|    fps                  | 76           |
|    iterations           | 1806         |
|    time_elapsed         | 12033        |
|    total_timesteps      | 924672       |
| train/                  |              |
|    approx_kl            | 0.0016014678 |
|    clip_fraction        | 0.000391     |
|    clip_range           | 0.2          |
|    entropy_loss         | -1.53        |
|    explained_variance   | -0.0212      |
|    learning_rate        | 1e-06        |
|    loss                 | 0.0896       |
|    n_updates            | 18050        |
|    policy_gradient_loss | -0.00172     |
|    value_loss           | 0.26         |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 76           |
|    iterations           | 1807         |
|    time_elapsed         | 12039        |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 76           |
|    iterations           | 1817         |
|    time_elapsed         | 12108        |
|    total_timesteps      | 930304       |
| train/                  |              |
|    approx_kl            | 0.0005181893 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.382       |
|    explained_variance   | 0.403        |
|    learning_rate        | 1e-06        |
|    loss                 | 334          |
|    n_updates            | 18160        |
|    policy_gradient_loss | -0.00154     |
|    value_loss           | 540          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 76            |
|    iterations           | 1818          |
|    time_elapsed         | 12115         |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 76           |
|    iterations           | 1828         |
|    time_elapsed         | 12184        |
|    total_timesteps      | 935936       |
| train/                  |              |
|    approx_kl            | 0.0020000376 |
|    clip_fraction        | 0.00508      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.287       |
|    explained_variance   | 0.792        |
|    learning_rate        | 1e-06        |
|    loss                 | 80           |
|    n_updates            | 18270        |
|    policy_gradient_loss | -0.00186     |
|    value_loss           | 172          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 76            |
|    iterations           | 1829          |
|    time_elapsed         | 12191         |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 76            |
|    iterations           | 1839          |
|    time_elapsed         | 12261         |
|    total_timesteps      | 941568        |
| train/                  |               |
|    approx_kl            | 0.00035487092 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.361        |
|    explained_variance   | 0.901         |
|    learning_rate        | 1e-06         |
|    loss                 | 79.6          |
|    n_updates            | 18380         |
|    policy_gradient_loss | -0.000296     |
|    value_loss           | 171           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 76            |
|    iterations           | 1840          |
|    time_elapsed         | 1226

-------------------------------------------
| time/                   |               |
|    fps                  | 76            |
|    iterations           | 1850          |
|    time_elapsed         | 12336         |
|    total_timesteps      | 947200        |
| train/                  |               |
|    approx_kl            | 0.00035235623 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.411        |
|    explained_variance   | 0.715         |
|    learning_rate        | 1e-06         |
|    loss                 | 85            |
|    n_updates            | 18490         |
|    policy_gradient_loss | -0.000518     |
|    value_loss           | 233           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 76           |
|    iterations           | 1851         |
|    time_elapsed         | 12343   

-----------------------------------------
| time/                   |             |
|    fps                  | 76          |
|    iterations           | 1861        |
|    time_elapsed         | 12410       |
|    total_timesteps      | 952832      |
| train/                  |             |
|    approx_kl            | 0.013083307 |
|    clip_fraction        | 0.0826      |
|    clip_range           | 0.2         |
|    entropy_loss         | -1.49       |
|    explained_variance   | 0.816       |
|    learning_rate        | 1e-06       |
|    loss                 | 46.1        |
|    n_updates            | 18600       |
|    policy_gradient_loss | -0.00876    |
|    value_loss           | 194         |
-----------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 76           |
|    iterations           | 1862         |
|    time_elapsed         | 12417        |
|    total_timesteps      | 9

-------------------------------------------
| time/                   |               |
|    fps                  | 76            |
|    iterations           | 1872          |
|    time_elapsed         | 12483         |
|    total_timesteps      | 958464        |
| train/                  |               |
|    approx_kl            | 0.00088847615 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.294        |
|    explained_variance   | 0.745         |
|    learning_rate        | 1e-06         |
|    loss                 | 56.8          |
|    n_updates            | 18710         |
|    policy_gradient_loss | -0.00195      |
|    value_loss           | 161           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 76           |
|    iterations           | 1873         |
|    time_elapsed         | 12490   

------------------------------------------
| time/                   |              |
|    fps                  | 76           |
|    iterations           | 1883         |
|    time_elapsed         | 12557        |
|    total_timesteps      | 964096       |
| train/                  |              |
|    approx_kl            | 0.0001313258 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.214       |
|    explained_variance   | 0.776        |
|    learning_rate        | 1e-06        |
|    loss                 | 96.2         |
|    n_updates            | 18820        |
|    policy_gradient_loss | -0.000263    |
|    value_loss           | 154          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 76           |
|    iterations           | 1884         |
|    time_elapsed         | 12563        |
|    total_

-------------------------------------------
| time/                   |               |
|    fps                  | 76            |
|    iterations           | 1894          |
|    time_elapsed         | 12630         |
|    total_timesteps      | 969728        |
| train/                  |               |
|    approx_kl            | 0.00031122263 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.252        |
|    explained_variance   | 0.844         |
|    learning_rate        | 1e-06         |
|    loss                 | 169           |
|    n_updates            | 18930         |
|    policy_gradient_loss | -0.000721     |
|    value_loss           | 358           |
-------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 76            |
|    iterations           | 1895          |
|    time_elapsed         | 1263

------------------------------------------
| time/                   |              |
|    fps                  | 76           |
|    iterations           | 1905         |
|    time_elapsed         | 12702        |
|    total_timesteps      | 975360       |
| train/                  |              |
|    approx_kl            | 0.0009789452 |
|    clip_fraction        | 0            |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.319       |
|    explained_variance   | 0.545        |
|    learning_rate        | 1e-06        |
|    loss                 | 270          |
|    n_updates            | 19040        |
|    policy_gradient_loss | -0.00117     |
|    value_loss           | 640          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 76            |
|    iterations           | 1906          |
|    time_elapsed         | 12709         |
|    t

------------------------------------------
| time/                   |              |
|    fps                  | 76           |
|    iterations           | 1916         |
|    time_elapsed         | 12776        |
|    total_timesteps      | 980992       |
| train/                  |              |
|    approx_kl            | 0.0028122165 |
|    clip_fraction        | 0.00684      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.433       |
|    explained_variance   | 0.725        |
|    learning_rate        | 1e-06        |
|    loss                 | 168          |
|    n_updates            | 19150        |
|    policy_gradient_loss | -0.00148     |
|    value_loss           | 414          |
------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 76           |
|    iterations           | 1917         |
|    time_elapsed         | 12783        |
|    total_

------------------------------------------
| time/                   |              |
|    fps                  | 76           |
|    iterations           | 1927         |
|    time_elapsed         | 12851        |
|    total_timesteps      | 986624       |
| train/                  |              |
|    approx_kl            | 0.0016918876 |
|    clip_fraction        | 0.00352      |
|    clip_range           | 0.2          |
|    entropy_loss         | -0.294       |
|    explained_variance   | 0.688        |
|    learning_rate        | 1e-06        |
|    loss                 | 90.8         |
|    n_updates            | 19260        |
|    policy_gradient_loss | -0.000974    |
|    value_loss           | 194          |
------------------------------------------
-------------------------------------------
| time/                   |               |
|    fps                  | 76            |
|    iterations           | 1928          |
|    time_elapsed         | 12858         |
|    t

-------------------------------------------
| time/                   |               |
|    fps                  | 76            |
|    iterations           | 1938          |
|    time_elapsed         | 12924         |
|    total_timesteps      | 992256        |
| train/                  |               |
|    approx_kl            | 0.00080803444 |
|    clip_fraction        | 0.00762       |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.195        |
|    explained_variance   | 0.881         |
|    learning_rate        | 1e-06         |
|    loss                 | 57.5          |
|    n_updates            | 19370         |
|    policy_gradient_loss | -0.000569     |
|    value_loss           | 129           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 76           |
|    iterations           | 1939         |
|    time_elapsed         | 12931   

-------------------------------------------
| time/                   |               |
|    fps                  | 76            |
|    iterations           | 1949          |
|    time_elapsed         | 12997         |
|    total_timesteps      | 997888        |
| train/                  |               |
|    approx_kl            | 0.00036129565 |
|    clip_fraction        | 0             |
|    clip_range           | 0.2           |
|    entropy_loss         | -0.298        |
|    explained_variance   | 0.803         |
|    learning_rate        | 1e-06         |
|    loss                 | 57.9          |
|    n_updates            | 19480         |
|    policy_gradient_loss | -0.000265     |
|    value_loss           | 144           |
-------------------------------------------
------------------------------------------
| time/                   |              |
|    fps                  | 76           |
|    iterations           | 1950         |
|    time_elapsed         | 13004   

<stable_baselines3.ppo.ppo.PPO at 0x269a3a744c0>

In [12]:
# Persist the current model to disk under the name 'thisisatestmodel'
model.save('thisisatestmodel')

In [9]:
# Load a saved PPO checkpoint from the ./train directory.
# NOTE(review): presumably this file was written by TrainAndLoggingCallback
# ('best_model_{n_calls}') at step 1,000,000 - confirm it exists before running.
model = PPO.load('./train/best_model_1000000')
# Bare expression so the notebook displays the loaded model object
model

<stable_baselines3.ppo.ppo.PPO at 0x1df2f4b8760>

In [10]:
# Reset the environment and keep the initial observation in `state`.
# The playback cell that follows calls env.reset() again before its loop.
state = env.reset()

In [11]:
# Play the game with the loaded model until the kernel is interrupted.
# Start the game: fetch the initial observation
state = env.reset()
try:
    # Loop through the game. There is no exit condition in the loop itself,
    # so stop it with Kernel -> Interrupt.
    # `done` is not checked here.
    # NOTE(review): SB3 vectorized envs are documented to reset automatically
    # when an episode ends - confirm for this wrapper stack.
    while True:
        # Ask the model which action to take for the current observation
        action, _ = model.predict(state)
        # Apply the action and advance the environment by one step
        state, reward, done, info = env.step(action)
        # Draw the current frame
        env.render()
except KeyboardInterrupt:
    # Interrupting the kernel is the intended way to end playback,
    # so do not surface it as an error.
    pass
finally:
    # Always close the environment so the render window is not left open.
    # `env` must be recreated (re-run the environment setup cell) before
    # running this cell again.
    env.close()

