# Stable-baselines algorithms experiment iteration

Algorithms available in stable-baselines:
* A2C (no replay memory)
* ACER
* ACKTR
* DDPG (continuous only)
* DQN
* HER
* GAIL
* PPO
* SAC (continuous only)
* TD3 (continuous only)
* TRPO

In [1]:
import base64
import IPython
import imageio

def embed_mp4(filename):
    """Embeds an mp4 file in the notebook.

    Args:
        filename: Path of the mp4 file to read.

    Returns:
        The result of ``IPython.display.HTML`` applied to a ``<video>`` tag
        whose source is the file's bytes inlined as a base64 data URI.
    """
    # Read through a context manager so the file handle is always closed,
    # instead of leaving it to the garbage collector.
    with open(filename, 'rb') as video_file:
        video = video_file.read()
    b64 = base64.b64encode(video)
    tag = '''
    <video width="640" height="480" controls>
    <source src="data:video/mp4;base64,{0}" type="video/mp4">
    Your browser does not support the video tag.
    </video>'''.format(b64.decode())

    return IPython.display.HTML(tag)

def record_game(model, env, num_episodes=5, video_filename='video.mp4'):
    """Plays episodes with `model` in `env` and records every rendered frame.

    Args:
        model: Object whose ``predict(obs)`` returns an ``(action, state)`` pair.
        env: Environment exposing ``reset()``, ``step(action)`` and
            ``render('rgb_array')``.
        num_episodes: Number of episodes to play.
        video_filename: Output path handed to ``imageio.get_writer``.

    The video is written at 60 fps, and the summed reward of each episode is
    printed as ``score: <total>`` once that episode ends.
    """
    with imageio.get_writer(video_filename, fps=60) as writer:

        def capture_frame():
            # Render the current state and append it to the video.
            writer.append_data(env.render('rgb_array'))

        for _episode in range(num_episodes):
            obs = env.reset()
            total_reward = 0
            capture_frame()  # frame for the freshly reset state

            # At least one step is always taken; stop once the env reports done.
            while True:
                action, _state = model.predict(obs)
                obs, reward, done, _info = env.step(action)
                total_reward += reward
                capture_frame()
                if done:
                    break

            print("score:", total_reward)

In [2]:
import os
import gym
import slimevolleygym
from slimevolleygym import SurvivalRewardEnv

from stable_baselines.common.policies import MlpPolicy
from stable_baselines import logger
from stable_baselines.common.callbacks import EvalCallback

from stable_baselines.ppo1 import PPO1
from stable_baselines import A2C, ACER, ACKTR, DQN, HER, GAIL, TRPO

# Registry mapping the short names accepted by `experiment` to stable-baselines
# algorithm classes. Every entry is built by `experiment` with the shared
# `MlpPolicy` imported above.
# NOTE(review): DQN, HER and GAIL normally need different or extra constructor
# arguments (DQN-specific policy class, `model_class`, `expert_dataset`) --
# confirm these entries actually run before relying on them.
algo = {
    'a2c': A2C,
    'acer': ACER,
    'acktr': ACKTR,
    'dqn': DQN,
    'her': HER,
    'gail': GAIL,
    'ppo': PPO1,  # PPO1 was imported and PPO is listed in the intro, but it was never registered
    'trpo': TRPO,
}
# Models produced by `experiment`, keyed by the same short names as `algo`.
trained_model = {}

The TensorFlow contrib module will not be included in TensorFlow 2.0.
For more information, please see:
  * https://github.com/tensorflow/community/blob/master/rfcs/20180907-contrib-sunset.md
  * https://github.com/tensorflow/addons
  * https://github.com/tensorflow/io (for I/O related ops)
If you depend on functionality not listed there, please file an issue.



In [3]:
def experiment(model_str, timesteps=50_000_000, seed=721, eval_freq=25000, eval_episodes=10):
    """Trains one registered algorithm on SlimeVolley-v0 with periodic evaluation.

    Args:
        model_str: Key into the module-level ``algo`` registry (e.g. ``'a2c'``).
        timesteps: Total number of training timesteps; coerced with ``int``.
        seed: Seed for the training env and the model. The evaluation env is
            seeded with ``seed + 1``.
        eval_freq: Passed to ``EvalCallback`` as ``eval_freq``.
        eval_episodes: Passed to ``EvalCallback`` as ``n_eval_episodes``
            (was 1000 in an earlier version of this notebook).

    Raises:
        KeyError: If ``model_str`` is not a key of ``algo``.

    Side effects:
        Configures the stable-baselines logger to write to ``"sb-" + model_str``,
        saves ``final_model`` in that folder when training completes, and stores
        the model in ``trained_model[model_str]``.
    """
    # Fail before touching the logger so a typo does not create a log folder.
    if model_str not in algo:
        raise KeyError(f"unknown algorithm {model_str!r}; choose one of {sorted(algo)}")

    num_timesteps = int(timesteps)
    logdir = "sb-" + model_str

    logger.configure(folder=logdir)
    env = gym.make("SlimeVolley-v0")
    # Evaluate on a separate env: reusing the training env would let each
    # evaluation reset it in the middle of a training rollout.
    eval_env = gym.make("SlimeVolley-v0")
    try:
        env.seed(seed)
        eval_env.seed(seed + 1)

        # Seed the model as well as the env so runs are repeatable.
        model = algo[model_str](MlpPolicy, env, verbose=2, seed=seed)
        # Register right away: long runs are usually interrupted by hand, and
        # the partially trained model should still be reachable afterwards.
        trained_model[model_str] = model

        eval_callback = EvalCallback(
            eval_env,
            best_model_save_path=logdir,
            log_path=logdir,
            eval_freq=eval_freq,
            n_eval_episodes=eval_episodes,
        )
        model.learn(total_timesteps=num_timesteps, callback=eval_callback)
        # With the default budget this is rarely reached; the best model saved
        # by EvalCallback is the usual artifact.
        model.save(os.path.join(logdir, "final_model"))
    finally:
        # Release both envs even when training raises or is interrupted.
        env.close()
        eval_env.close()

In [None]:
# Train A2C with experiment's default budget (timesteps=50_000_000); expect a
# long-running cell that prints training and evaluation logs below.
experiment('a2c')

Logging to sb-a2c
Wrapping the env in a DummyVecEnv.




Instructions for updating:
Use keras.layers.flatten instead.
Instructions for updating:
Please use `layer.__call__` method instead.


Instructions for updating:
Use tf.where in 2.0, which has the same broadcast rule as np.where




Instructions for updating:
Call initializer instance with the dtype argument instead of passing it to the constructor


----------------------------------
| explained_variance | -1.41e+04 |
| fps                | 28        |
| nupdates           | 1         |
| policy_entropy     | 2.08      |
| total_timesteps    | 5         |
| value_loss         | 0.0281    |
----------------------------------
---------------------------------
| explained_variance | -372     |
| fps                | 625      |
| nupdates           | 100      |
| policy_entropy     | 2.08     |
| total_timesteps    | 500      |
| value_loss         | 0.0896   |
---------------------------------
----------------------------------
| ex

---------------------------------
| explained_variance | -7.05    |
| fps                | 854      |
| nupdates           | 1600     |
| policy_entropy     | 2.06     |
| total_timesteps    | 8000     |
| value_loss         | 0.00383  |
---------------------------------
---------------------------------
| explained_variance | -9.28    |
| fps                | 850      |
| nupdates           | 1700     |
| policy_entropy     | 2.04     |
| total_timesteps    | 8500     |
| value_loss         | 0.0041   |
---------------------------------
---------------------------------
| explained_variance | -49.1    |
| fps                | 833      |
| nupdates           | 1800     |
| policy_entropy     | 2.07     |
| total_timesteps    | 9000     |
| value_loss         | 0.00476  |
---------------------------------
---------------------------------
| explained_variance | -17.2    |
| fps                | 804      |
| nupdates           | 1900     |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.706    |
| fps                | 898      |
| nupdates           | 4700     |
| policy_entropy     | 2.05     |
| total_timesteps    | 23500    |
| value_loss         | 4.88e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.21    |
| fps                | 901      |
| nupdates           | 4800     |
| policy_entropy     | 2.05     |
| total_timesteps    | 24000    |
| value_loss         | 0.000164 |
---------------------------------
---------------------------------
| explained_variance | -27.1    |
| fps                | 901      |
| nupdates           | 4900     |
| policy_entropy     | 2.07     |
| total_timesteps    | 24500    |
| value_loss         | 0.000281 |
---------------------------------
Eval num_timesteps=25000, episode_reward=-4.80 +/- 0.40
Episode length: 572.20 +/- 66.50
New best mean reward!
---------------------------------
| explained_variance | -6.44    |
| fps

---------------------------------
| explained_variance | -24.7    |
| fps                | 843      |
| nupdates           | 7700     |
| policy_entropy     | 2.06     |
| total_timesteps    | 38500    |
| value_loss         | 0.00102  |
---------------------------------
---------------------------------
| explained_variance | -89.7    |
| fps                | 844      |
| nupdates           | 7800     |
| policy_entropy     | 2.05     |
| total_timesteps    | 39000    |
| value_loss         | 0.000984 |
---------------------------------
---------------------------------
| explained_variance | 0.493    |
| fps                | 845      |
| nupdates           | 7900     |
| policy_entropy     | 2.06     |
| total_timesteps    | 39500    |
| value_loss         | 0.000148 |
---------------------------------
---------------------------------
| explained_variance | -0.0151  |
| fps                | 846      |
| nupdates           | 8000     |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -1.52    |
| fps                | 814      |
| nupdates           | 10700    |
| policy_entropy     | 2.03     |
| total_timesteps    | 53500    |
| value_loss         | 0.000229 |
---------------------------------
---------------------------------
| explained_variance | -8.61    |
| fps                | 814      |
| nupdates           | 10800    |
| policy_entropy     | 2.05     |
| total_timesteps    | 54000    |
| value_loss         | 0.000181 |
---------------------------------
---------------------------------
| explained_variance | -0.0845  |
| fps                | 815      |
| nupdates           | 10900    |
| policy_entropy     | 2.07     |
| total_timesteps    | 54500    |
| value_loss         | 3.54e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.992    |
| fps                | 817      |
| nupdates           | 11000    |
| policy_entropy     | 2.02     |
| total_timest

---------------------------------
| explained_variance | -1.78    |
| fps                | 847      |
| nupdates           | 13800    |
| policy_entropy     | 2.06     |
| total_timesteps    | 69000    |
| value_loss         | 0.883    |
---------------------------------
---------------------------------
| explained_variance | 0.267    |
| fps                | 847      |
| nupdates           | 13900    |
| policy_entropy     | 2.07     |
| total_timesteps    | 69500    |
| value_loss         | 0.000424 |
---------------------------------
---------------------------------
| explained_variance | -12      |
| fps                | 848      |
| nupdates           | 14000    |
| policy_entropy     | 2.07     |
| total_timesteps    | 70000    |
| value_loss         | 0.000953 |
---------------------------------
---------------------------------
| explained_variance | -0.849   |
| fps                | 849      |
| nupdates           | 14100    |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -2.07    |
| fps                | 833      |
| nupdates           | 16800    |
| policy_entropy     | 2.03     |
| total_timesteps    | 84000    |
| value_loss         | 6.11e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.297   |
| fps                | 834      |
| nupdates           | 16900    |
| policy_entropy     | 2.03     |
| total_timesteps    | 84500    |
| value_loss         | 0.00134  |
---------------------------------
---------------------------------
| explained_variance | 0.436    |
| fps                | 834      |
| nupdates           | 17000    |
| policy_entropy     | 1.94     |
| total_timesteps    | 85000    |
| value_loss         | 0.00138  |
---------------------------------
---------------------------------
| explained_variance | -5.85    |
| fps                | 835      |
| nupdates           | 17100    |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -84.4    |
| fps                | 850      |
| nupdates           | 19900    |
| policy_entropy     | 2.05     |
| total_timesteps    | 99500    |
| value_loss         | 0.000699 |
---------------------------------
Eval num_timesteps=100000, episode_reward=-4.80 +/- 0.40
Episode length: 630.50 +/- 122.29
---------------------------------
| explained_variance | -0.757   |
| fps                | 825      |
| nupdates           | 20000    |
| policy_entropy     | 2.06     |
| total_timesteps    | 100000   |
| value_loss         | 0.000111 |
---------------------------------
---------------------------------
| explained_variance | -2.96    |
| fps                | 825      |
| nupdates           | 20100    |
| policy_entropy     | 2.04     |
| total_timesteps    | 100500   |
| value_loss         | 0.00105  |
---------------------------------
---------------------------------
| explained_variance | 0.366    |
| fps                | 82

---------------------------------
| explained_variance | -9.07    |
| fps                | 838      |
| nupdates           | 22900    |
| policy_entropy     | 2.07     |
| total_timesteps    | 114500   |
| value_loss         | 0.000327 |
---------------------------------
---------------------------------
| explained_variance | -29.3    |
| fps                | 839      |
| nupdates           | 23000    |
| policy_entropy     | 2.06     |
| total_timesteps    | 115000   |
| value_loss         | 0.000777 |
---------------------------------
---------------------------------
| explained_variance | -57.5    |
| fps                | 839      |
| nupdates           | 23100    |
| policy_entropy     | 2.07     |
| total_timesteps    | 115500   |
| value_loss         | 0.0014   |
---------------------------------
---------------------------------
| explained_variance | -26.3    |
| fps                | 840      |
| nupdates           | 23200    |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.628    |
| fps                | 828      |
| nupdates           | 25900    |
| policy_entropy     | 2.05     |
| total_timesteps    | 129500   |
| value_loss         | 0.00058  |
---------------------------------
---------------------------------
| explained_variance | 0.0645   |
| fps                | 828      |
| nupdates           | 26000    |
| policy_entropy     | 2.08     |
| total_timesteps    | 130000   |
| value_loss         | 0.000423 |
---------------------------------
---------------------------------
| explained_variance | -4.8     |
| fps                | 829      |
| nupdates           | 26100    |
| policy_entropy     | 2.06     |
| total_timesteps    | 130500   |
| value_loss         | 0.000797 |
---------------------------------
---------------------------------
| explained_variance | -1.16    |
| fps                | 829      |
| nupdates           | 26200    |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.506   |
| fps                | 844      |
| nupdates           | 29000    |
| policy_entropy     | 2.07     |
| total_timesteps    | 145000   |
| value_loss         | 0.000146 |
---------------------------------
---------------------------------
| explained_variance | 0.969    |
| fps                | 844      |
| nupdates           | 29100    |
| policy_entropy     | 2.07     |
| total_timesteps    | 145500   |
| value_loss         | 1.93e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.49     |
| fps                | 845      |
| nupdates           | 29200    |
| policy_entropy     | 2.06     |
| total_timesteps    | 146000   |
| value_loss         | 5.88e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.682   |
| fps                | 845      |
| nupdates           | 29300    |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.00735  |
| fps                | 841      |
| nupdates           | 32000    |
| policy_entropy     | 2.02     |
| total_timesteps    | 160000   |
| value_loss         | 0.000284 |
---------------------------------
---------------------------------
| explained_variance | 0.762    |
| fps                | 841      |
| nupdates           | 32100    |
| policy_entropy     | 2.01     |
| total_timesteps    | 160500   |
| value_loss         | 0.000246 |
---------------------------------
---------------------------------
| explained_variance | 0.406    |
| fps                | 841      |
| nupdates           | 32200    |
| policy_entropy     | 2.03     |
| total_timesteps    | 161000   |
| value_loss         | 4.6e-05  |
---------------------------------
---------------------------------
| explained_variance | -16.4    |
| fps                | 842      |
| nupdates           | 32300    |
| policy_entropy     | 2.01     |
| total_timest

---------------------------------
| explained_variance | -1.82    |
| fps                | 837      |
| nupdates           | 35100    |
| policy_entropy     | 2.07     |
| total_timesteps    | 175500   |
| value_loss         | 0.000323 |
---------------------------------
---------------------------------
| explained_variance | 0.982    |
| fps                | 837      |
| nupdates           | 35200    |
| policy_entropy     | 2.05     |
| total_timesteps    | 176000   |
| value_loss         | 6.46e-06 |
---------------------------------
---------------------------------
| explained_variance | -0.747   |
| fps                | 838      |
| nupdates           | 35300    |
| policy_entropy     | 2.07     |
| total_timesteps    | 176500   |
| value_loss         | 0.000141 |
---------------------------------
---------------------------------
| explained_variance | 0.948    |
| fps                | 838      |
| nupdates           | 35400    |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.889    |
| fps                | 846      |
| nupdates           | 38200    |
| policy_entropy     | 1.93     |
| total_timesteps    | 191000   |
| value_loss         | 6.17e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.486   |
| fps                | 846      |
| nupdates           | 38300    |
| policy_entropy     | 2.07     |
| total_timesteps    | 191500   |
| value_loss         | 0.000165 |
---------------------------------
---------------------------------
| explained_variance | 0.303    |
| fps                | 847      |
| nupdates           | 38400    |
| policy_entropy     | 2.07     |
| total_timesteps    | 192000   |
| value_loss         | 6.08e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.876   |
| fps                | 847      |
| nupdates           | 38500    |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.789    |
| fps                | 841      |
| nupdates           | 41200    |
| policy_entropy     | 2.05     |
| total_timesteps    | 206000   |
| value_loss         | 0.000773 |
---------------------------------
---------------------------------
| explained_variance | -112     |
| fps                | 841      |
| nupdates           | 41300    |
| policy_entropy     | 2.07     |
| total_timesteps    | 206500   |
| value_loss         | 0.00168  |
---------------------------------
---------------------------------
| explained_variance | 0.272    |
| fps                | 841      |
| nupdates           | 41400    |
| policy_entropy     | 1.97     |
| total_timesteps    | 207000   |
| value_loss         | 0.22     |
---------------------------------
---------------------------------
| explained_variance | -0.567   |
| fps                | 842      |
| nupdates           | 41500    |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -12      |
| fps                | 850      |
| nupdates           | 44300    |
| policy_entropy     | 2.08     |
| total_timesteps    | 221500   |
| value_loss         | 0.00119  |
---------------------------------
---------------------------------
| explained_variance | -3.8     |
| fps                | 850      |
| nupdates           | 44400    |
| policy_entropy     | 2.08     |
| total_timesteps    | 222000   |
| value_loss         | 0.00119  |
---------------------------------
---------------------------------
| explained_variance | 0.355    |
| fps                | 850      |
| nupdates           | 44500    |
| policy_entropy     | 1.97     |
| total_timesteps    | 222500   |
| value_loss         | 0.00011  |
---------------------------------
---------------------------------
| explained_variance | 0.97     |
| fps                | 851      |
| nupdates           | 44600    |
| policy_entropy     | 1.94     |
| total_timest

---------------------------------
| explained_variance | 0.892    |
| fps                | 846      |
| nupdates           | 47300    |
| policy_entropy     | 2.07     |
| total_timesteps    | 236500   |
| value_loss         | 1.06e-05 |
---------------------------------
---------------------------------
| explained_variance | -4.97    |
| fps                | 847      |
| nupdates           | 47400    |
| policy_entropy     | 2.07     |
| total_timesteps    | 237000   |
| value_loss         | 0.000208 |
---------------------------------
---------------------------------
| explained_variance | 0.445    |
| fps                | 847      |
| nupdates           | 47500    |
| policy_entropy     | 2.07     |
| total_timesteps    | 237500   |
| value_loss         | 0.000208 |
---------------------------------
---------------------------------
| explained_variance | -0.114   |
| fps                | 847      |
| nupdates           | 47600    |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.387   |
| fps                | 841      |
| nupdates           | 50300    |
| policy_entropy     | 2.06     |
| total_timesteps    | 251500   |
| value_loss         | 0.000393 |
---------------------------------
---------------------------------
| explained_variance | 0.549    |
| fps                | 842      |
| nupdates           | 50400    |
| policy_entropy     | 2.06     |
| total_timesteps    | 252000   |
| value_loss         | 0.00214  |
---------------------------------
---------------------------------
| explained_variance | 0.355    |
| fps                | 842      |
| nupdates           | 50500    |
| policy_entropy     | 2.06     |
| total_timesteps    | 252500   |
| value_loss         | 0.000257 |
---------------------------------
---------------------------------
| explained_variance | -30.6    |
| fps                | 842      |
| nupdates           | 50600    |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -3.63    |
| fps                | 848      |
| nupdates           | 53400    |
| policy_entropy     | 2.07     |
| total_timesteps    | 267000   |
| value_loss         | 0.000463 |
---------------------------------
---------------------------------
| explained_variance | -2.5     |
| fps                | 849      |
| nupdates           | 53500    |
| policy_entropy     | 2.07     |
| total_timesteps    | 267500   |
| value_loss         | 0.000493 |
---------------------------------
---------------------------------
| explained_variance | 0.432    |
| fps                | 849      |
| nupdates           | 53600    |
| policy_entropy     | 2.06     |
| total_timesteps    | 268000   |
| value_loss         | 0.000226 |
---------------------------------
---------------------------------
| explained_variance | 0.725    |
| fps                | 849      |
| nupdates           | 53700    |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.493   |
| fps                | 844      |
| nupdates           | 56400    |
| policy_entropy     | 2.08     |
| total_timesteps    | 282000   |
| value_loss         | 3.78e-05 |
---------------------------------
---------------------------------
| explained_variance | -3.9     |
| fps                | 844      |
| nupdates           | 56500    |
| policy_entropy     | 2.07     |
| total_timesteps    | 282500   |
| value_loss         | 0.000593 |
---------------------------------
---------------------------------
| explained_variance | 0.535    |
| fps                | 844      |
| nupdates           | 56600    |
| policy_entropy     | 2.08     |
| total_timesteps    | 283000   |
| value_loss         | 0.000189 |
---------------------------------
---------------------------------
| explained_variance | -2.07    |
| fps                | 844      |
| nupdates           | 56700    |
| policy_entropy     | 2.07     |
| total_timest

----------------------------------
| explained_variance | -1.47e+04 |
| fps                | 849       |
| nupdates           | 59500     |
| policy_entropy     | 2.07      |
| total_timesteps    | 297500    |
| value_loss         | 0.182     |
----------------------------------
---------------------------------
| explained_variance | -45.9    |
| fps                | 849      |
| nupdates           | 59600    |
| policy_entropy     | 2.06     |
| total_timesteps    | 298000   |
| value_loss         | 0.00656  |
---------------------------------
---------------------------------
| explained_variance | -6.1     |
| fps                | 850      |
| nupdates           | 59700    |
| policy_entropy     | 2.07     |
| total_timesteps    | 298500   |
| value_loss         | 0.000811 |
---------------------------------
---------------------------------
| explained_variance | -3       |
| fps                | 850      |
| nupdates           | 59800    |
| policy_entropy     | 2.08     |
| tota

---------------------------------
| explained_variance | 0.91     |
| fps                | 845      |
| nupdates           | 62500    |
| policy_entropy     | 2.04     |
| total_timesteps    | 312500   |
| value_loss         | 0.000104 |
---------------------------------
---------------------------------
| explained_variance | 0.719    |
| fps                | 845      |
| nupdates           | 62600    |
| policy_entropy     | 2.06     |
| total_timesteps    | 313000   |
| value_loss         | 8.6e-05  |
---------------------------------
---------------------------------
| explained_variance | -40.9    |
| fps                | 846      |
| nupdates           | 62700    |
| policy_entropy     | 2.07     |
| total_timesteps    | 313500   |
| value_loss         | 0.00619  |
---------------------------------
---------------------------------
| explained_variance | -11.9    |
| fps                | 846      |
| nupdates           | 62800    |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.275    |
| fps                | 841      |
| nupdates           | 65500    |
| policy_entropy     | 2.06     |
| total_timesteps    | 327500   |
| value_loss         | 9.26e-05 |
---------------------------------
---------------------------------
| explained_variance | -7.99    |
| fps                | 841      |
| nupdates           | 65600    |
| policy_entropy     | 2.06     |
| total_timesteps    | 328000   |
| value_loss         | 0.00138  |
---------------------------------
---------------------------------
| explained_variance | -15.9    |
| fps                | 841      |
| nupdates           | 65700    |
| policy_entropy     | 2.07     |
| total_timesteps    | 328500   |
| value_loss         | 0.000653 |
---------------------------------
---------------------------------
| explained_variance | -0.763   |
| fps                | 842      |
| nupdates           | 65800    |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.328    |
| fps                | 846      |
| nupdates           | 68600    |
| policy_entropy     | 2.06     |
| total_timesteps    | 343000   |
| value_loss         | 0.00038  |
---------------------------------
---------------------------------
| explained_variance | 0.951    |
| fps                | 846      |
| nupdates           | 68700    |
| policy_entropy     | 2.06     |
| total_timesteps    | 343500   |
| value_loss         | 1.87e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.809    |
| fps                | 847      |
| nupdates           | 68800    |
| policy_entropy     | 2.06     |
| total_timesteps    | 344000   |
| value_loss         | 5.2e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.466    |
| fps                | 847      |
| nupdates           | 68900    |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -8.04    |
| fps                | 843      |
| nupdates           | 71600    |
| policy_entropy     | 2.04     |
| total_timesteps    | 358000   |
| value_loss         | 0.00039  |
---------------------------------
---------------------------------
| explained_variance | -1.05    |
| fps                | 843      |
| nupdates           | 71700    |
| policy_entropy     | 2.05     |
| total_timesteps    | 358500   |
| value_loss         | 0.00111  |
---------------------------------
---------------------------------
| explained_variance | -2.12    |
| fps                | 844      |
| nupdates           | 71800    |
| policy_entropy     | 2.05     |
| total_timesteps    | 359000   |
| value_loss         | 0.000553 |
---------------------------------
---------------------------------
| explained_variance | -0.467   |
| fps                | 844      |
| nupdates           | 71900    |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.739    |
| fps                | 848      |
| nupdates           | 74700    |
| policy_entropy     | 2.07     |
| total_timesteps    | 373500   |
| value_loss         | 0.000309 |
---------------------------------
---------------------------------
| explained_variance | 0.836    |
| fps                | 848      |
| nupdates           | 74800    |
| policy_entropy     | 2.06     |
| total_timesteps    | 374000   |
| value_loss         | 1.26e-05 |
---------------------------------
---------------------------------
| explained_variance | -37.5    |
| fps                | 848      |
| nupdates           | 74900    |
| policy_entropy     | 2.07     |
| total_timesteps    | 374500   |
| value_loss         | 0.000424 |
---------------------------------
Eval num_timesteps=375000, episode_reward=-5.00 +/- 0.00
Episode length: 593.80 +/- 83.72
---------------------------------
| explained_variance | 0.857    |
| fps                | 841

---------------------------------
| explained_variance | 0.954    |
| fps                | 845      |
| nupdates           | 77700    |
| policy_entropy     | 2.07     |
| total_timesteps    | 388500   |
| value_loss         | 4.22e-05 |
---------------------------------
---------------------------------
| explained_variance | -5.24    |
| fps                | 845      |
| nupdates           | 77800    |
| policy_entropy     | 2.07     |
| total_timesteps    | 389000   |
| value_loss         | 0.00151  |
---------------------------------
---------------------------------
| explained_variance | 0.487    |
| fps                | 845      |
| nupdates           | 77900    |
| policy_entropy     | 2.06     |
| total_timesteps    | 389500   |
| value_loss         | 0.000314 |
---------------------------------
---------------------------------
| explained_variance | -2.42    |
| fps                | 846      |
| nupdates           | 78000    |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -57.4    |
| fps                | 843      |
| nupdates           | 80700    |
| policy_entropy     | 2.07     |
| total_timesteps    | 403500   |
| value_loss         | 0.000669 |
---------------------------------
---------------------------------
| explained_variance | -0.901   |
| fps                | 843      |
| nupdates           | 80800    |
| policy_entropy     | 2.08     |
| total_timesteps    | 404000   |
| value_loss         | 5.94e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.278    |
| fps                | 843      |
| nupdates           | 80900    |
| policy_entropy     | 2.06     |
| total_timesteps    | 404500   |
| value_loss         | 0.00111  |
---------------------------------
---------------------------------
| explained_variance | 0.647    |
| fps                | 843      |
| nupdates           | 81000    |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.988    |
| fps                | 847      |
| nupdates           | 83800    |
| policy_entropy     | 1.93     |
| total_timesteps    | 419000   |
| value_loss         | 0.00264  |
---------------------------------
---------------------------------
| explained_variance | -218     |
| fps                | 847      |
| nupdates           | 83900    |
| policy_entropy     | 2.06     |
| total_timesteps    | 419500   |
| value_loss         | 0.00292  |
---------------------------------
---------------------------------
| explained_variance | 0.567    |
| fps                | 847      |
| nupdates           | 84000    |
| policy_entropy     | 2.07     |
| total_timesteps    | 420000   |
| value_loss         | 6.21e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.626   |
| fps                | 848      |
| nupdates           | 84100    |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -61.3    |
| fps                | 845      |
| nupdates           | 86800    |
| policy_entropy     | 2.06     |
| total_timesteps    | 434000   |
| value_loss         | 0.00499  |
---------------------------------
---------------------------------
| explained_variance | -0.0292  |
| fps                | 846      |
| nupdates           | 86900    |
| policy_entropy     | 2.06     |
| total_timesteps    | 434500   |
| value_loss         | 0.0004   |
---------------------------------
---------------------------------
| explained_variance | 0.566    |
| fps                | 846      |
| nupdates           | 87000    |
| policy_entropy     | 2.06     |
| total_timesteps    | 435000   |
| value_loss         | 0.000163 |
---------------------------------
---------------------------------
| explained_variance | -0.984   |
| fps                | 846      |
| nupdates           | 87100    |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.482    |
| fps                | 849      |
| nupdates           | 89900    |
| policy_entropy     | 1.95     |
| total_timesteps    | 449500   |
| value_loss         | 9.77e-05 |
---------------------------------
Eval num_timesteps=450000, episode_reward=-4.90 +/- 0.30
Episode length: 554.00 +/- 97.46
---------------------------------
| explained_variance | 0.956    |
| fps                | 844      |
| nupdates           | 90000    |
| policy_entropy     | 1.62     |
| total_timesteps    | 450000   |
| value_loss         | 1.6e-05  |
---------------------------------
---------------------------------
| explained_variance | -1.61    |
| fps                | 844      |
| nupdates           | 90100    |
| policy_entropy     | 2.06     |
| total_timesteps    | 450500   |
| value_loss         | 6.85e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.454    |
| fps                | 844

---------------------------------
| explained_variance | -0.406   |
| fps                | 846      |
| nupdates           | 92900    |
| policy_entropy     | 2.07     |
| total_timesteps    | 464500   |
| value_loss         | 2.62e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.836    |
| fps                | 846      |
| nupdates           | 93000    |
| policy_entropy     | 2.06     |
| total_timesteps    | 465000   |
| value_loss         | 0.00013  |
---------------------------------
---------------------------------
| explained_variance | 0.936    |
| fps                | 846      |
| nupdates           | 93100    |
| policy_entropy     | 2.05     |
| total_timesteps    | 465500   |
| value_loss         | 0.000152 |
---------------------------------
---------------------------------
| explained_variance | -6.16    |
| fps                | 846      |
| nupdates           | 93200    |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | 0.893    |
| fps                | 844      |
| nupdates           | 95900    |
| policy_entropy     | 2.07     |
| total_timesteps    | 479500   |
| value_loss         | 5.83e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.922    |
| fps                | 844      |
| nupdates           | 96000    |
| policy_entropy     | 2.07     |
| total_timesteps    | 480000   |
| value_loss         | 0.000118 |
---------------------------------
---------------------------------
| explained_variance | 0.842    |
| fps                | 844      |
| nupdates           | 96100    |
| policy_entropy     | 2.03     |
| total_timesteps    | 480500   |
| value_loss         | 0.0285   |
---------------------------------
---------------------------------
| explained_variance | 0.467    |
| fps                | 845      |
| nupdates           | 96200    |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -0.616   |
| fps                | 848      |
| nupdates           | 99000    |
| policy_entropy     | 1.98     |
| total_timesteps    | 495000   |
| value_loss         | 5.59e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.502    |
| fps                | 848      |
| nupdates           | 99100    |
| policy_entropy     | 2.01     |
| total_timesteps    | 495500   |
| value_loss         | 0.000107 |
---------------------------------
---------------------------------
| explained_variance | -11.1    |
| fps                | 848      |
| nupdates           | 99200    |
| policy_entropy     | 2.03     |
| total_timesteps    | 496000   |
| value_loss         | 0.000734 |
---------------------------------
---------------------------------
| explained_variance | -2.12    |
| fps                | 848      |
| nupdates           | 99300    |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.595    |
| fps                | 845      |
| nupdates           | 102000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 510000   |
| value_loss         | 3.06e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.422   |
| fps                | 845      |
| nupdates           | 102100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 510500   |
| value_loss         | 0.000741 |
---------------------------------
---------------------------------
| explained_variance | -1.13    |
| fps                | 845      |
| nupdates           | 102200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 511000   |
| value_loss         | 0.000291 |
---------------------------------
---------------------------------
| explained_variance | 0.376    |
| fps                | 846      |
| nupdates           | 102300   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.0189  |
| fps                | 844      |
| nupdates           | 105100   |
| policy_entropy     | 2.02     |
| total_timesteps    | 525500   |
| value_loss         | 0.269    |
---------------------------------
---------------------------------
| explained_variance | 0.644    |
| fps                | 844      |
| nupdates           | 105200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 526000   |
| value_loss         | 8.66e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.703    |
| fps                | 845      |
| nupdates           | 105300   |
| policy_entropy     | 2.04     |
| total_timesteps    | 526500   |
| value_loss         | 0.000212 |
---------------------------------
---------------------------------
| explained_variance | -0.0542  |
| fps                | 845      |
| nupdates           | 105400   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.946    |
| fps                | 849      |
| nupdates           | 108200   |
| policy_entropy     | 2        |
| total_timesteps    | 541000   |
| value_loss         | 3.63e-05 |
---------------------------------
---------------------------------
| explained_variance | -10.3    |
| fps                | 849      |
| nupdates           | 108300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 541500   |
| value_loss         | 0.000246 |
---------------------------------
---------------------------------
| explained_variance | -1.31    |
| fps                | 849      |
| nupdates           | 108400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 542000   |
| value_loss         | 0.000123 |
---------------------------------
---------------------------------
| explained_variance | -63.3    |
| fps                | 849      |
| nupdates           | 108500   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.208    |
| fps                | 847      |
| nupdates           | 111200   |
| policy_entropy     | 2.05     |
| total_timesteps    | 556000   |
| value_loss         | 0.00028  |
---------------------------------
---------------------------------
| explained_variance | -2.01    |
| fps                | 848      |
| nupdates           | 111300   |
| policy_entropy     | 2.05     |
| total_timesteps    | 556500   |
| value_loss         | 0.00029  |
---------------------------------
---------------------------------
| explained_variance | -2.88    |
| fps                | 848      |
| nupdates           | 111400   |
| policy_entropy     | 2.08     |
| total_timesteps    | 557000   |
| value_loss         | 5.8e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.558    |
| fps                | 848      |
| nupdates           | 111500   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.438    |
| fps                | 852      |
| nupdates           | 114300   |
| policy_entropy     | 2.06     |
| total_timesteps    | 571500   |
| value_loss         | 7.64e-05 |
---------------------------------
---------------------------------
| explained_variance | -5.67    |
| fps                | 852      |
| nupdates           | 114400   |
| policy_entropy     | 2.05     |
| total_timesteps    | 572000   |
| value_loss         | 0.000485 |
---------------------------------
---------------------------------
| explained_variance | -2.43    |
| fps                | 852      |
| nupdates           | 114500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 572500   |
| value_loss         | 0.000272 |
---------------------------------
---------------------------------
| explained_variance | 0.394    |
| fps                | 852      |
| nupdates           | 114600   |
| policy_entropy     | 1.97     |
| total_timest

---------------------------------
| explained_variance | 0.776    |
| fps                | 851      |
| nupdates           | 117300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 586500   |
| value_loss         | 4.39e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.98     |
| fps                | 851      |
| nupdates           | 117400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 587000   |
| value_loss         | 1.76e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.875   |
| fps                | 851      |
| nupdates           | 117500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 587500   |
| value_loss         | 8.56e-05 |
---------------------------------
---------------------------------
| explained_variance | -20.1    |
| fps                | 851      |
| nupdates           | 117600   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -1.01    |
| fps                | 850      |
| nupdates           | 120300   |
| policy_entropy     | 2.04     |
| total_timesteps    | 601500   |
| value_loss         | 3.44e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.687    |
| fps                | 850      |
| nupdates           | 120400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 602000   |
| value_loss         | 0.000373 |
---------------------------------
---------------------------------
| explained_variance | 0.418    |
| fps                | 850      |
| nupdates           | 120500   |
| policy_entropy     | 2.05     |
| total_timesteps    | 602500   |
| value_loss         | 1.99e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.57    |
| fps                | 850      |
| nupdates           | 120600   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -34.3    |
| fps                | 853      |
| nupdates           | 123400   |
| policy_entropy     | 2.02     |
| total_timesteps    | 617000   |
| value_loss         | 0.0014   |
---------------------------------
---------------------------------
| explained_variance | -0.191   |
| fps                | 854      |
| nupdates           | 123500   |
| policy_entropy     | 2.05     |
| total_timesteps    | 617500   |
| value_loss         | 0.000101 |
---------------------------------
---------------------------------
| explained_variance | -15.9    |
| fps                | 854      |
| nupdates           | 123600   |
| policy_entropy     | 2.03     |
| total_timesteps    | 618000   |
| value_loss         | 0.00154  |
---------------------------------
---------------------------------
| explained_variance | -0.84    |
| fps                | 854      |
| nupdates           | 123700   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.0909   |
| fps                | 854      |
| nupdates           | 126400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 632000   |
| value_loss         | 0.000334 |
---------------------------------
---------------------------------
| explained_variance | 0.0461   |
| fps                | 854      |
| nupdates           | 126500   |
| policy_entropy     | 2.05     |
| total_timesteps    | 632500   |
| value_loss         | 2.71e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.42    |
| fps                | 854      |
| nupdates           | 126600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 633000   |
| value_loss         | 0.000271 |
---------------------------------
---------------------------------
| explained_variance | 0.769    |
| fps                | 854      |
| nupdates           | 126700   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.885    |
| fps                | 857      |
| nupdates           | 129500   |
| policy_entropy     | 2.04     |
| total_timesteps    | 647500   |
| value_loss         | 0.000512 |
---------------------------------
---------------------------------
| explained_variance | -0.739   |
| fps                | 857      |
| nupdates           | 129600   |
| policy_entropy     | 2.06     |
| total_timesteps    | 648000   |
| value_loss         | 0.00153  |
---------------------------------
---------------------------------
| explained_variance | -0.447   |
| fps                | 857      |
| nupdates           | 129700   |
| policy_entropy     | 2.02     |
| total_timesteps    | 648500   |
| value_loss         | 0.000769 |
---------------------------------
---------------------------------
| explained_variance | -0.0483  |
| fps                | 857      |
| nupdates           | 129800   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -14.1    |
| fps                | 856      |
| nupdates           | 132500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 662500   |
| value_loss         | 4.26e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.24    |
| fps                | 856      |
| nupdates           | 132600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 663000   |
| value_loss         | 0.00061  |
---------------------------------
---------------------------------
| explained_variance | 0.616    |
| fps                | 856      |
| nupdates           | 132700   |
| policy_entropy     | 2.08     |
| total_timesteps    | 663500   |
| value_loss         | 0.000274 |
---------------------------------
---------------------------------
| explained_variance | 0.807    |
| fps                | 856      |
| nupdates           | 132800   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -5.86    |
| fps                | 854      |
| nupdates           | 135500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 677500   |
| value_loss         | 0.00016  |
---------------------------------
---------------------------------
| explained_variance | -0.02    |
| fps                | 854      |
| nupdates           | 135600   |
| policy_entropy     | 2.06     |
| total_timesteps    | 678000   |
| value_loss         | 0.000167 |
---------------------------------
---------------------------------
| explained_variance | -1.17    |
| fps                | 854      |
| nupdates           | 135700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 678500   |
| value_loss         | 0.00035  |
---------------------------------
---------------------------------
| explained_variance | -0.807   |
| fps                | 854      |
| nupdates           | 135800   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.392   |
| fps                | 856      |
| nupdates           | 138600   |
| policy_entropy     | 2.08     |
| total_timesteps    | 693000   |
| value_loss         | 0.00027  |
---------------------------------
---------------------------------
| explained_variance | 0.104    |
| fps                | 857      |
| nupdates           | 138700   |
| policy_entropy     | 2.08     |
| total_timesteps    | 693500   |
| value_loss         | 0.00027  |
---------------------------------
---------------------------------
| explained_variance | 0.313    |
| fps                | 857      |
| nupdates           | 138800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 694000   |
| value_loss         | 0.000121 |
---------------------------------
---------------------------------
| explained_variance | -13.3    |
| fps                | 857      |
| nupdates           | 138900   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.507    |
| fps                | 854      |
| nupdates           | 141600   |
| policy_entropy     | 2.05     |
| total_timesteps    | 708000   |
| value_loss         | 2.88e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.77    |
| fps                | 854      |
| nupdates           | 141700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 708500   |
| value_loss         | 0.000298 |
---------------------------------
---------------------------------
| explained_variance | -0.326   |
| fps                | 854      |
| nupdates           | 141800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 709000   |
| value_loss         | 0.00014  |
---------------------------------
---------------------------------
| explained_variance | -0.712   |
| fps                | 854      |
| nupdates           | 141900   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -4.6     |
| fps                | 856      |
| nupdates           | 144700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 723500   |
| value_loss         | 0.00034  |
---------------------------------
---------------------------------
| explained_variance | -11.1    |
| fps                | 856      |
| nupdates           | 144800   |
| policy_entropy     | 2.08     |
| total_timesteps    | 724000   |
| value_loss         | 7.8e-05  |
---------------------------------
---------------------------------
| explained_variance | -0.231   |
| fps                | 856      |
| nupdates           | 144900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 724500   |
| value_loss         | 0.000364 |
---------------------------------
Eval num_timesteps=725000, episode_reward=-4.90 +/- 0.30
Episode length: 665.20 +/- 186.13
---------------------------------
| explained_variance | -0.354   |
| fps                | 85

---------------------------------
| explained_variance | 0.966    |
| fps                | 854      |
| nupdates           | 147700   |
| policy_entropy     | 2.05     |
| total_timesteps    | 738500   |
| value_loss         | 1.01e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.227   |
| fps                | 854      |
| nupdates           | 147800   |
| policy_entropy     | 2.05     |
| total_timesteps    | 739000   |
| value_loss         | 0.00043  |
---------------------------------
---------------------------------
| explained_variance | 0.301    |
| fps                | 854      |
| nupdates           | 147900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 739500   |
| value_loss         | 0.000285 |
---------------------------------
---------------------------------
| explained_variance | 0.289    |
| fps                | 854      |
| nupdates           | 148000   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.76     |
| fps                | 852      |
| nupdates           | 150700   |
| policy_entropy     | 2.04     |
| total_timesteps    | 753500   |
| value_loss         | 0.000152 |
---------------------------------
---------------------------------
| explained_variance | -0.043   |
| fps                | 852      |
| nupdates           | 150800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 754000   |
| value_loss         | 0.000177 |
---------------------------------
---------------------------------
| explained_variance | 0.527    |
| fps                | 852      |
| nupdates           | 150900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 754500   |
| value_loss         | 5.34e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.703    |
| fps                | 852      |
| nupdates           | 151000   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -1.64    |
| fps                | 854      |
| nupdates           | 153800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 769000   |
| value_loss         | 0.00029  |
---------------------------------
---------------------------------
| explained_variance | 0.832    |
| fps                | 854      |
| nupdates           | 153900   |
| policy_entropy     | 2.08     |
| total_timesteps    | 769500   |
| value_loss         | 3.11e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.455    |
| fps                | 854      |
| nupdates           | 154000   |
| policy_entropy     | 2.08     |
| total_timesteps    | 770000   |
| value_loss         | 0.000799 |
---------------------------------
---------------------------------
| explained_variance | 0.447    |
| fps                | 854      |
| nupdates           | 154100   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.625    |
| fps                | 853      |
| nupdates           | 156800   |
| policy_entropy     | 2.05     |
| total_timesteps    | 784000   |
| value_loss         | 5.95e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.132    |
| fps                | 853      |
| nupdates           | 156900   |
| policy_entropy     | 2.03     |
| total_timesteps    | 784500   |
| value_loss         | 0.000103 |
---------------------------------
---------------------------------
| explained_variance | 0.726    |
| fps                | 853      |
| nupdates           | 157000   |
| policy_entropy     | 2.05     |
| total_timesteps    | 785000   |
| value_loss         | 0.000154 |
---------------------------------
---------------------------------
| explained_variance | -0.382   |
| fps                | 853      |
| nupdates           | 157100   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -5.51    |
| fps                | 856      |
| nupdates           | 159900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 799500   |
| value_loss         | 0.000594 |
---------------------------------
Eval num_timesteps=800000, episode_reward=-5.00 +/- 0.00
Episode length: 553.90 +/- 121.85
---------------------------------
| explained_variance | 0.779    |
| fps                | 852      |
| nupdates           | 160000   |
| policy_entropy     | 2.05     |
| total_timesteps    | 800000   |
| value_loss         | 1.43e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.94    |
| fps                | 853      |
| nupdates           | 160100   |
| policy_entropy     | 2.05     |
| total_timesteps    | 800500   |
| value_loss         | 7.34e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.91    |
| fps                | 85

---------------------------------
| explained_variance | 0.414    |
| fps                | 854      |
| nupdates           | 162900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 814500   |
| value_loss         | 0.000238 |
---------------------------------
---------------------------------
| explained_variance | 0.532    |
| fps                | 854      |
| nupdates           | 163000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 815000   |
| value_loss         | 0.000485 |
---------------------------------
---------------------------------
| explained_variance | 0.491    |
| fps                | 854      |
| nupdates           | 163100   |
| policy_entropy     | 1.95     |
| total_timesteps    | 815500   |
| value_loss         | 0.923    |
---------------------------------
---------------------------------
| explained_variance | 0.892    |
| fps                | 854      |
| nupdates           | 163200   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.871    |
| fps                | 853      |
| nupdates           | 165900   |
| policy_entropy     | 1.91     |
| total_timesteps    | 829500   |
| value_loss         | 0.000266 |
---------------------------------
---------------------------------
| explained_variance | -4.99    |
| fps                | 853      |
| nupdates           | 166000   |
| policy_entropy     | 2.08     |
| total_timesteps    | 830000   |
| value_loss         | 0.000146 |
---------------------------------
---------------------------------
| explained_variance | -2.47    |
| fps                | 853      |
| nupdates           | 166100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 830500   |
| value_loss         | 0.00105  |
---------------------------------
---------------------------------
| explained_variance | 0.293    |
| fps                | 853      |
| nupdates           | 166200   |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | -5.12    |
| fps                | 855      |
| nupdates           | 169000   |
| policy_entropy     | 2.05     |
| total_timesteps    | 845000   |
| value_loss         | 0.000382 |
---------------------------------
---------------------------------
| explained_variance | -1.11    |
| fps                | 855      |
| nupdates           | 169100   |
| policy_entropy     | 2.03     |
| total_timesteps    | 845500   |
| value_loss         | 0.000248 |
---------------------------------
---------------------------------
| explained_variance | -0.351   |
| fps                | 855      |
| nupdates           | 169200   |
| policy_entropy     | 2.05     |
| total_timesteps    | 846000   |
| value_loss         | 0.000121 |
---------------------------------
---------------------------------
| explained_variance | -1.08    |
| fps                | 855      |
| nupdates           | 169300   |
| policy_entropy     | 2.02     |
| total_timest

---------------------------------
| explained_variance | 0.872    |
| fps                | 854      |
| nupdates           | 172000   |
| policy_entropy     | 2.02     |
| total_timesteps    | 860000   |
| value_loss         | 7.71e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.128    |
| fps                | 854      |
| nupdates           | 172100   |
| policy_entropy     | 2.04     |
| total_timesteps    | 860500   |
| value_loss         | 0.000286 |
---------------------------------
---------------------------------
| explained_variance | 0.995    |
| fps                | 854      |
| nupdates           | 172200   |
| policy_entropy     | 2.02     |
| total_timesteps    | 861000   |
| value_loss         | 2.79e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.907    |
| fps                | 854      |
| nupdates           | 172300   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.581    |
| fps                | 853      |
| nupdates           | 175100   |
| policy_entropy     | 1.83     |
| total_timesteps    | 875500   |
| value_loss         | 0.000326 |
---------------------------------
---------------------------------
| explained_variance | -1.75    |
| fps                | 853      |
| nupdates           | 175200   |
| policy_entropy     | 2.03     |
| total_timesteps    | 876000   |
| value_loss         | 0.000359 |
---------------------------------
---------------------------------
| explained_variance | 0.855    |
| fps                | 853      |
| nupdates           | 175300   |
| policy_entropy     | 2.06     |
| total_timesteps    | 876500   |
| value_loss         | 9e-05    |
---------------------------------
---------------------------------
| explained_variance | 0.56     |
| fps                | 853      |
| nupdates           | 175400   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.895    |
| fps                | 856      |
| nupdates           | 178200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 891000   |
| value_loss         | 0.000222 |
---------------------------------
---------------------------------
| explained_variance | 0.657    |
| fps                | 856      |
| nupdates           | 178300   |
| policy_entropy     | 2.06     |
| total_timesteps    | 891500   |
| value_loss         | 0.000111 |
---------------------------------
---------------------------------
| explained_variance | 0.354    |
| fps                | 856      |
| nupdates           | 178400   |
| policy_entropy     | 2.05     |
| total_timesteps    | 892000   |
| value_loss         | 0.000149 |
---------------------------------
---------------------------------
| explained_variance | -0.656   |
| fps                | 856      |
| nupdates           | 178500   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.957    |
| fps                | 855      |
| nupdates           | 181200   |
| policy_entropy     | 2.02     |
| total_timesteps    | 906000   |
| value_loss         | 3.51e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.875   |
| fps                | 855      |
| nupdates           | 181300   |
| policy_entropy     | 2.03     |
| total_timesteps    | 906500   |
| value_loss         | 0.000312 |
---------------------------------
---------------------------------
| explained_variance | -3.06    |
| fps                | 855      |
| nupdates           | 181400   |
| policy_entropy     | 2.05     |
| total_timesteps    | 907000   |
| value_loss         | 0.000137 |
---------------------------------
---------------------------------
| explained_variance | 0.692    |
| fps                | 855      |
| nupdates           | 181500   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.604    |
| fps                | 857      |
| nupdates           | 184300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 921500   |
| value_loss         | 6.56e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.957    |
| fps                | 857      |
| nupdates           | 184400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 922000   |
| value_loss         | 0.000129 |
---------------------------------
---------------------------------
| explained_variance | -2.34    |
| fps                | 857      |
| nupdates           | 184500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 922500   |
| value_loss         | 0.00288  |
---------------------------------
---------------------------------
| explained_variance | 0.771    |
| fps                | 857      |
| nupdates           | 184600   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.13    |
| fps                | 855      |
| nupdates           | 187300   |
| policy_entropy     | 2.08     |
| total_timesteps    | 936500   |
| value_loss         | 3.36e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.0226  |
| fps                | 855      |
| nupdates           | 187400   |
| policy_entropy     | 2.08     |
| total_timesteps    | 937000   |
| value_loss         | 0.000105 |
---------------------------------
---------------------------------
| explained_variance | 0.974    |
| fps                | 855      |
| nupdates           | 187500   |
| policy_entropy     | 1.98     |
| total_timesteps    | 937500   |
| value_loss         | 0.00584  |
---------------------------------
---------------------------------
| explained_variance | -3.59    |
| fps                | 855      |
| nupdates           | 187600   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.883    |
| fps                | 854      |
| nupdates           | 190300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 951500   |
| value_loss         | 0.000401 |
---------------------------------
---------------------------------
| explained_variance | 0.816    |
| fps                | 854      |
| nupdates           | 190400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 952000   |
| value_loss         | 1.86e-05 |
---------------------------------
---------------------------------
| explained_variance | -4.31    |
| fps                | 854      |
| nupdates           | 190500   |
| policy_entropy     | 2.04     |
| total_timesteps    | 952500   |
| value_loss         | 0.000486 |
---------------------------------
---------------------------------
| explained_variance | -0.033   |
| fps                | 854      |
| nupdates           | 190600   |
| policy_entropy     | 1.99     |
| total_timest

---------------------------------
| explained_variance | 0.744    |
| fps                | 855      |
| nupdates           | 193400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 967000   |
| value_loss         | 0.000175 |
---------------------------------
---------------------------------
| explained_variance | 0.356    |
| fps                | 855      |
| nupdates           | 193500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 967500   |
| value_loss         | 0.000344 |
---------------------------------
---------------------------------
| explained_variance | -4.96    |
| fps                | 855      |
| nupdates           | 193600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 968000   |
| value_loss         | 0.00295  |
---------------------------------
---------------------------------
| explained_variance | -0.0166  |
| fps                | 855      |
| nupdates           | 193700   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.286    |
| fps                | 854      |
| nupdates           | 196400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 982000   |
| value_loss         | 0.000114 |
---------------------------------
---------------------------------
| explained_variance | 0.507    |
| fps                | 854      |
| nupdates           | 196500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 982500   |
| value_loss         | 0.000224 |
---------------------------------
---------------------------------
| explained_variance | 0.281    |
| fps                | 854      |
| nupdates           | 196600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 983000   |
| value_loss         | 6.61e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.479    |
| fps                | 854      |
| nupdates           | 196700   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.423    |
| fps                | 856      |
| nupdates           | 199500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 997500   |
| value_loss         | 0.000783 |
---------------------------------
---------------------------------
| explained_variance | 0.298    |
| fps                | 856      |
| nupdates           | 199600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 998000   |
| value_loss         | 0.000133 |
---------------------------------
---------------------------------
| explained_variance | -1.76    |
| fps                | 856      |
| nupdates           | 199700   |
| policy_entropy     | 2.05     |
| total_timesteps    | 998500   |
| value_loss         | 4.96e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.373    |
| fps                | 857      |
| nupdates           | 199800   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.484    |
| fps                | 856      |
| nupdates           | 202500   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1012500  |
| value_loss         | 0.000103 |
---------------------------------
---------------------------------
| explained_variance | 0.377    |
| fps                | 856      |
| nupdates           | 202600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1013000  |
| value_loss         | 9.77e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.76    |
| fps                | 856      |
| nupdates           | 202700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1013500  |
| value_loss         | 0.000451 |
---------------------------------
---------------------------------
| explained_variance | -5.95    |
| fps                | 856      |
| nupdates           | 202800   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.296    |
| fps                | 854      |
| nupdates           | 205500   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1027500  |
| value_loss         | 0.12     |
---------------------------------
---------------------------------
| explained_variance | 0.8      |
| fps                | 854      |
| nupdates           | 205600   |
| policy_entropy     | 2.03     |
| total_timesteps    | 1028000  |
| value_loss         | 8.24e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.831    |
| fps                | 854      |
| nupdates           | 205700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1028500  |
| value_loss         | 2.19e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.02    |
| fps                | 855      |
| nupdates           | 205800   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -3.9     |
| fps                | 856      |
| nupdates           | 208600   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1043000  |
| value_loss         | 0.000657 |
---------------------------------
---------------------------------
| explained_variance | -0.536   |
| fps                | 856      |
| nupdates           | 208700   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1043500  |
| value_loss         | 0.000401 |
---------------------------------
---------------------------------
| explained_variance | -0.504   |
| fps                | 856      |
| nupdates           | 208800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1044000  |
| value_loss         | 6.5e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.923    |
| fps                | 856      |
| nupdates           | 208900   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -0.857   |
| fps                | 854      |
| nupdates           | 211600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1058000  |
| value_loss         | 0.000193 |
---------------------------------
---------------------------------
| explained_variance | -3.34    |
| fps                | 855      |
| nupdates           | 211700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1058500  |
| value_loss         | 9.24e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.0445   |
| fps                | 855      |
| nupdates           | 211800   |
| policy_entropy     | 2.03     |
| total_timesteps    | 1059000  |
| value_loss         | 0.000304 |
---------------------------------
---------------------------------
| explained_variance | 0.722    |
| fps                | 855      |
| nupdates           | 211900   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.746    |
| fps                | 856      |
| nupdates           | 214700   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1073500  |
| value_loss         | 4.71e-05 |
---------------------------------
---------------------------------
| explained_variance | -3.87    |
| fps                | 856      |
| nupdates           | 214800   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1074000  |
| value_loss         | 0.00113  |
---------------------------------
---------------------------------
| explained_variance | 0.528    |
| fps                | 856      |
| nupdates           | 214900   |
| policy_entropy     | 2.01     |
| total_timesteps    | 1074500  |
| value_loss         | 0.000162 |
---------------------------------
Eval num_timesteps=1075000, episode_reward=-5.00 +/- 0.00
Episode length: 740.90 +/- 170.40
---------------------------------
| explained_variance | -0.201   |
| fps                | 8

---------------------------------
| explained_variance | -6       |
| fps                | 854      |
| nupdates           | 217700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1088500  |
| value_loss         | 0.00021  |
---------------------------------
---------------------------------
| explained_variance | -1.09    |
| fps                | 854      |
| nupdates           | 217800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1089000  |
| value_loss         | 0.000341 |
---------------------------------
---------------------------------
| explained_variance | 0.823    |
| fps                | 854      |
| nupdates           | 217900   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1089500  |
| value_loss         | 0.000235 |
---------------------------------
---------------------------------
| explained_variance | -1.98    |
| fps                | 854      |
| nupdates           | 218000   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -1.5     |
| fps                | 853      |
| nupdates           | 220700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1103500  |
| value_loss         | 3.23e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.77     |
| fps                | 853      |
| nupdates           | 220800   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1104000  |
| value_loss         | 8.8e-05  |
---------------------------------
---------------------------------
| explained_variance | -38.5    |
| fps                | 853      |
| nupdates           | 220900   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1104500  |
| value_loss         | 0.00494  |
---------------------------------
---------------------------------
| explained_variance | -0.45    |
| fps                | 853      |
| nupdates           | 221000   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.362    |
| fps                | 855      |
| nupdates           | 223800   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1119000  |
| value_loss         | 0.151    |
---------------------------------
---------------------------------
| explained_variance | -3.53    |
| fps                | 855      |
| nupdates           | 223900   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1119500  |
| value_loss         | 0.000238 |
---------------------------------
----------------------------------
| explained_variance | -2.63e+03 |
| fps                | 855       |
| nupdates           | 224000    |
| policy_entropy     | 1.99      |
| total_timesteps    | 1120000   |
| value_loss         | 0.124     |
----------------------------------
---------------------------------
| explained_variance | -1.89    |
| fps                | 855      |
| nupdates           | 224100   |
| policy_entropy     | 2.03     |
| tota

---------------------------------
| explained_variance | 0.751    |
| fps                | 854      |
| nupdates           | 226800   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1134000  |
| value_loss         | 6.15e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.99     |
| fps                | 854      |
| nupdates           | 226900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1134500  |
| value_loss         | 2.96e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.501    |
| fps                | 854      |
| nupdates           | 227000   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1135000  |
| value_loss         | 0.000396 |
---------------------------------
---------------------------------
| explained_variance | 0.614    |
| fps                | 854      |
| nupdates           | 227100   |
| policy_entropy     | 2.02     |
| total_timest

---------------------------------
| explained_variance | 0.267    |
| fps                | 855      |
| nupdates           | 229900   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1149500  |
| value_loss         | 5.84e-05 |
---------------------------------
Eval num_timesteps=1150000, episode_reward=-4.90 +/- 0.30
Episode length: 613.40 +/- 146.08
---------------------------------
| explained_variance | -2.84    |
| fps                | 853      |
| nupdates           | 230000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1150000  |
| value_loss         | 0.000213 |
---------------------------------
---------------------------------
| explained_variance | -3.81    |
| fps                | 853      |
| nupdates           | 230100   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1150500  |
| value_loss         | 0.00391  |
---------------------------------
---------------------------------
| explained_variance | -1.75    |
| fps                | 8

---------------------------------
| explained_variance | 0.284    |
| fps                | 854      |
| nupdates           | 232900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1164500  |
| value_loss         | 7.84e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.04    |
| fps                | 854      |
| nupdates           | 233000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1165000  |
| value_loss         | 0.000271 |
---------------------------------
---------------------------------
| explained_variance | -108     |
| fps                | 854      |
| nupdates           | 233100   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1165500  |
| value_loss         | 0.014    |
---------------------------------
---------------------------------
| explained_variance | -0.89    |
| fps                | 854      |
| nupdates           | 233200   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.865    |
| fps                | 853      |
| nupdates           | 235900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1179500  |
| value_loss         | 3.52e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.11    |
| fps                | 853      |
| nupdates           | 236000   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1180000  |
| value_loss         | 0.000286 |
---------------------------------
---------------------------------
| explained_variance | -0.145   |
| fps                | 853      |
| nupdates           | 236100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1180500  |
| value_loss         | 0.000863 |
---------------------------------
---------------------------------
| explained_variance | -4.12    |
| fps                | 853      |
| nupdates           | 236200   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.456    |
| fps                | 855      |
| nupdates           | 239000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1195000  |
| value_loss         | 0.000357 |
---------------------------------
----------------------------------
| explained_variance | -6.95e+03 |
| fps                | 855       |
| nupdates           | 239100    |
| policy_entropy     | 2.05      |
| total_timesteps    | 1195500   |
| value_loss         | 0.154     |
----------------------------------
---------------------------------
| explained_variance | 0.759    |
| fps                | 855      |
| nupdates           | 239200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1196000  |
| value_loss         | 0.000164 |
---------------------------------
---------------------------------
| explained_variance | -7.92    |
| fps                | 855      |
| nupdates           | 239300   |
| policy_entropy     | 2.06     |
| tota

---------------------------------
| explained_variance | -0.67    |
| fps                | 853      |
| nupdates           | 242000   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1210000  |
| value_loss         | 0.00807  |
---------------------------------
---------------------------------
| explained_variance | -8.6     |
| fps                | 853      |
| nupdates           | 242100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1210500  |
| value_loss         | 0.00053  |
---------------------------------
---------------------------------
| explained_variance | -0.281   |
| fps                | 853      |
| nupdates           | 242200   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1211000  |
| value_loss         | 0.00108  |
---------------------------------
---------------------------------
| explained_variance | 0.733    |
| fps                | 853      |
| nupdates           | 242300   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -38.7    |
| fps                | 852      |
| nupdates           | 245100   |
| policy_entropy     | 2.03     |
| total_timesteps    | 1225500  |
| value_loss         | 0.00676  |
---------------------------------
---------------------------------
| explained_variance | 0.156    |
| fps                | 852      |
| nupdates           | 245200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1226000  |
| value_loss         | 4.7e-05  |
---------------------------------
---------------------------------
| explained_variance | -4.59    |
| fps                | 852      |
| nupdates           | 245300   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1226500  |
| value_loss         | 0.000178 |
---------------------------------
---------------------------------
| explained_variance | 0.809    |
| fps                | 852      |
| nupdates           | 245400   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -0.0569  |
| fps                | 853      |
| nupdates           | 248200   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1241000  |
| value_loss         | 0.000275 |
---------------------------------
---------------------------------
| explained_variance | -3.99    |
| fps                | 853      |
| nupdates           | 248300   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1241500  |
| value_loss         | 0.000798 |
---------------------------------
---------------------------------
| explained_variance | 0.418    |
| fps                | 853      |
| nupdates           | 248400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1242000  |
| value_loss         | 0.000143 |
---------------------------------
---------------------------------
| explained_variance | 0.562    |
| fps                | 854      |
| nupdates           | 248500   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.866    |
| fps                | 852      |
| nupdates           | 251200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1256000  |
| value_loss         | 0.000274 |
---------------------------------
---------------------------------
| explained_variance | -51      |
| fps                | 852      |
| nupdates           | 251300   |
| policy_entropy     | 2.01     |
| total_timesteps    | 1256500  |
| value_loss         | 0.00416  |
---------------------------------
---------------------------------
| explained_variance | 0.788    |
| fps                | 852      |
| nupdates           | 251400   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1257000  |
| value_loss         | 2.73e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.11    |
| fps                | 852      |
| nupdates           | 251500   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.577    |
| fps                | 854      |
| nupdates           | 254300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1271500  |
| value_loss         | 5.53e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.986    |
| fps                | 854      |
| nupdates           | 254400   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1272000  |
| value_loss         | 7.43e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.0617   |
| fps                | 854      |
| nupdates           | 254500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1272500  |
| value_loss         | 4.52e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.607    |
| fps                | 854      |
| nupdates           | 254600   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.978    |
| fps                | 853      |
| nupdates           | 257300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1286500  |
| value_loss         | 1.18e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.267    |
| fps                | 853      |
| nupdates           | 257400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1287000  |
| value_loss         | 0.000302 |
---------------------------------
---------------------------------
| explained_variance | -1.04    |
| fps                | 853      |
| nupdates           | 257500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1287500  |
| value_loss         | 0.000178 |
---------------------------------
---------------------------------
| explained_variance | -4.46    |
| fps                | 853      |
| nupdates           | 257600   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.51     |
| fps                | 852      |
| nupdates           | 260300   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1301500  |
| value_loss         | 9.08e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.856   |
| fps                | 852      |
| nupdates           | 260400   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1302000  |
| value_loss         | 9.09e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.628    |
| fps                | 852      |
| nupdates           | 260500   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1302500  |
| value_loss         | 1.81e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.838    |
| fps                | 852      |
| nupdates           | 260600   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -1.26    |
| fps                | 853      |
| nupdates           | 263400   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1317000  |
| value_loss         | 4.04e-05 |
---------------------------------
---------------------------------
| explained_variance | -165     |
| fps                | 853      |
| nupdates           | 263500   |
| policy_entropy     | 2        |
| total_timesteps    | 1317500  |
| value_loss         | 0.0644   |
---------------------------------
---------------------------------
| explained_variance | 0.312    |
| fps                | 853      |
| nupdates           | 263600   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1318000  |
| value_loss         | 0.202    |
---------------------------------
---------------------------------
| explained_variance | 0.627    |
| fps                | 853      |
| nupdates           | 263700   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.674   |
| fps                | 852      |
| nupdates           | 266400   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1332000  |
| value_loss         | 0.000291 |
---------------------------------
---------------------------------
| explained_variance | 0.849    |
| fps                | 852      |
| nupdates           | 266500   |
| policy_entropy     | 2.03     |
| total_timesteps    | 1332500  |
| value_loss         | 5.2e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.754    |
| fps                | 852      |
| nupdates           | 266600   |
| policy_entropy     | 2.01     |
| total_timesteps    | 1333000  |
| value_loss         | 5.04e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.66    |
| fps                | 852      |
| nupdates           | 266700   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -23.9    |
| fps                | 853      |
| nupdates           | 269500   |
| policy_entropy     | 2        |
| total_timesteps    | 1347500  |
| value_loss         | 0.00286  |
---------------------------------
---------------------------------
| explained_variance | -1.02    |
| fps                | 853      |
| nupdates           | 269600   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1348000  |
| value_loss         | 0.000284 |
---------------------------------
---------------------------------
| explained_variance | 0.586    |
| fps                | 853      |
| nupdates           | 269700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1348500  |
| value_loss         | 0.000286 |
---------------------------------
---------------------------------
| explained_variance | 0.734    |
| fps                | 853      |
| nupdates           | 269800   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -132     |
| fps                | 852      |
| nupdates           | 272500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1362500  |
| value_loss         | 0.0168   |
---------------------------------
---------------------------------
| explained_variance | 0.975    |
| fps                | 852      |
| nupdates           | 272600   |
| policy_entropy     | 2.03     |
| total_timesteps    | 1363000  |
| value_loss         | 4.02e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.22    |
| fps                | 852      |
| nupdates           | 272700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1363500  |
| value_loss         | 0.00107  |
---------------------------------
---------------------------------
| explained_variance | -4.53    |
| fps                | 852      |
| nupdates           | 272800   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -37.7    |
| fps                | 851      |
| nupdates           | 275500   |
| policy_entropy     | 2.03     |
| total_timesteps    | 1377500  |
| value_loss         | 0.009    |
---------------------------------
---------------------------------
| explained_variance | 0.123    |
| fps                | 851      |
| nupdates           | 275600   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1378000  |
| value_loss         | 0.000211 |
---------------------------------
---------------------------------
| explained_variance | 0.57     |
| fps                | 851      |
| nupdates           | 275700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1378500  |
| value_loss         | 2.02e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.251    |
| fps                | 851      |
| nupdates           | 275800   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.979    |
| fps                | 852      |
| nupdates           | 278600   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1393000  |
| value_loss         | 0.0101   |
---------------------------------
---------------------------------
| explained_variance | 0.915    |
| fps                | 852      |
| nupdates           | 278700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1393500  |
| value_loss         | 7.13e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.58     |
| fps                | 852      |
| nupdates           | 278800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1394000  |
| value_loss         | 0.000472 |
---------------------------------
---------------------------------
| explained_variance | 0.964    |
| fps                | 852      |
| nupdates           | 278900   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -1.82    |
| fps                | 851      |
| nupdates           | 281600   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1408000  |
| value_loss         | 3.52e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.153    |
| fps                | 851      |
| nupdates           | 281700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1408500  |
| value_loss         | 0.000277 |
---------------------------------
---------------------------------
| explained_variance | 0.806    |
| fps                | 852      |
| nupdates           | 281800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1409000  |
| value_loss         | 2e-05    |
---------------------------------
---------------------------------
| explained_variance | 0.302    |
| fps                | 852      |
| nupdates           | 281900   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.276    |
| fps                | 853      |
| nupdates           | 284700   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1423500  |
| value_loss         | 5.75e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.432    |
| fps                | 853      |
| nupdates           | 284800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1424000  |
| value_loss         | 0.000213 |
---------------------------------
---------------------------------
| explained_variance | 0.456    |
| fps                | 853      |
| nupdates           | 284900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1424500  |
| value_loss         | 0.000502 |
---------------------------------
Eval num_timesteps=1425000, episode_reward=-4.60 +/- 0.66
Episode length: 626.80 +/- 141.53
---------------------------------
| explained_variance | 0.99     |
| fps                | 8

---------------------------------
| explained_variance | -8.43    |
| fps                | 852      |
| nupdates           | 287700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1438500  |
| value_loss         | 0.000589 |
---------------------------------
---------------------------------
| explained_variance | -2.71    |
| fps                | 852      |
| nupdates           | 287800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1439000  |
| value_loss         | 0.00115  |
---------------------------------
----------------------------------
| explained_variance | -2.57e+03 |
| fps                | 852       |
| nupdates           | 287900    |
| policy_entropy     | 2.05      |
| total_timesteps    | 1439500   |
| value_loss         | 0.0941    |
----------------------------------
---------------------------------
| explained_variance | 0.76     |
| fps                | 852      |
| nupdates           | 288000   |
| policy_entropy     | 2.05     |
| tota

---------------------------------
| explained_variance | -70.3    |
| fps                | 850      |
| nupdates           | 290700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1453500  |
| value_loss         | 0.0101   |
---------------------------------
---------------------------------
| explained_variance | 0.541    |
| fps                | 850      |
| nupdates           | 290800   |
| policy_entropy     | 2.03     |
| total_timesteps    | 1454000  |
| value_loss         | 3.66e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.607    |
| fps                | 851      |
| nupdates           | 290900   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1454500  |
| value_loss         | 3.44e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.774    |
| fps                | 851      |
| nupdates           | 291000   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.349    |
| fps                | 852      |
| nupdates           | 293800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1469000  |
| value_loss         | 0.0003   |
---------------------------------
---------------------------------
| explained_variance | 0.887    |
| fps                | 852      |
| nupdates           | 293900   |
| policy_entropy     | 1.99     |
| total_timesteps    | 1469500  |
| value_loss         | 0.000228 |
---------------------------------
---------------------------------
| explained_variance | 0.474    |
| fps                | 852      |
| nupdates           | 294000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1470000  |
| value_loss         | 0.00024  |
---------------------------------
---------------------------------
| explained_variance | -0.995   |
| fps                | 852      |
| nupdates           | 294100   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.342    |
| fps                | 851      |
| nupdates           | 296800   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1484000  |
| value_loss         | 0.000366 |
---------------------------------
---------------------------------
| explained_variance | 0.575    |
| fps                | 851      |
| nupdates           | 296900   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1484500  |
| value_loss         | 0.00026  |
---------------------------------
---------------------------------
| explained_variance | -5.3     |
| fps                | 851      |
| nupdates           | 297000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1485000  |
| value_loss         | 0.0017   |
---------------------------------
---------------------------------
| explained_variance | 0.0897   |
| fps                | 851      |
| nupdates           | 297100   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.998    |
| fps                | 852      |
| nupdates           | 299900   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1499500  |
| value_loss         | 2.84e-06 |
---------------------------------
Eval num_timesteps=1500000, episode_reward=-4.80 +/- 0.40
Episode length: 611.90 +/- 138.94
---------------------------------
| explained_variance | -0.753   |
| fps                | 850      |
| nupdates           | 300000   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1500000  |
| value_loss         | 0.00016  |
---------------------------------
---------------------------------
| explained_variance | 0.449    |
| fps                | 850      |
| nupdates           | 300100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1500500  |
| value_loss         | 0.000113 |
---------------------------------
---------------------------------
| explained_variance | -9.1e+03 |
| fps                | 8

---------------------------------
| explained_variance | 0.815    |
| fps                | 851      |
| nupdates           | 302900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1514500  |
| value_loss         | 5.91e-06 |
---------------------------------
---------------------------------
| explained_variance | -14.1    |
| fps                | 851      |
| nupdates           | 303000   |
| policy_entropy     | 2.03     |
| total_timesteps    | 1515000  |
| value_loss         | 0.00073  |
---------------------------------
---------------------------------
| explained_variance | 0.876    |
| fps                | 851      |
| nupdates           | 303100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1515500  |
| value_loss         | 4.91e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.758   |
| fps                | 851      |
| nupdates           | 303200   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.715    |
| fps                | 851      |
| nupdates           | 305900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1529500  |
| value_loss         | 4.02e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.633    |
| fps                | 851      |
| nupdates           | 306000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1530000  |
| value_loss         | 7.36e-06 |
---------------------------------
---------------------------------
| explained_variance | -5.62    |
| fps                | 851      |
| nupdates           | 306100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1530500  |
| value_loss         | 7.47e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.84     |
| fps                | 851      |
| nupdates           | 306200   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -5.83    |
| fps                | 852      |
| nupdates           | 309000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1545000  |
| value_loss         | 0.000669 |
---------------------------------
---------------------------------
| explained_variance | -3.44    |
| fps                | 852      |
| nupdates           | 309100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1545500  |
| value_loss         | 5.78e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.27    |
| fps                | 852      |
| nupdates           | 309200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1546000  |
| value_loss         | 0.000137 |
---------------------------------
---------------------------------
| explained_variance | -0.198   |
| fps                | 852      |
| nupdates           | 309300   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.743    |
| fps                | 852      |
| nupdates           | 312000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1560000  |
| value_loss         | 0.000225 |
---------------------------------
---------------------------------
| explained_variance | 0.206    |
| fps                | 852      |
| nupdates           | 312100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1560500  |
| value_loss         | 0.00015  |
---------------------------------
---------------------------------
| explained_variance | 0.92     |
| fps                | 852      |
| nupdates           | 312200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1561000  |
| value_loss         | 0.000195 |
---------------------------------
---------------------------------
| explained_variance | 0.969    |
| fps                | 852      |
| nupdates           | 312300   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -1.09    |
| fps                | 852      |
| nupdates           | 315100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1575500  |
| value_loss         | 0.000284 |
---------------------------------
---------------------------------
| explained_variance | 0.971    |
| fps                | 852      |
| nupdates           | 315200   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1576000  |
| value_loss         | 6.27e-06 |
---------------------------------
---------------------------------
| explained_variance | -5.42    |
| fps                | 852      |
| nupdates           | 315300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1576500  |
| value_loss         | 0.000176 |
---------------------------------
---------------------------------
| explained_variance | -3.15    |
| fps                | 852      |
| nupdates           | 315400   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -19.5    |
| fps                | 853      |
| nupdates           | 318200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1591000  |
| value_loss         | 0.000991 |
---------------------------------
---------------------------------
| explained_variance | 0.0685   |
| fps                | 853      |
| nupdates           | 318300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1591500  |
| value_loss         | 0.000273 |
---------------------------------
---------------------------------
| explained_variance | 0.545    |
| fps                | 853      |
| nupdates           | 318400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1592000  |
| value_loss         | 9.57e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.485    |
| fps                | 853      |
| nupdates           | 318500   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -2.37    |
| fps                | 852      |
| nupdates           | 321200   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1606000  |
| value_loss         | 0.00268  |
---------------------------------
---------------------------------
| explained_variance | -1.82    |
| fps                | 852      |
| nupdates           | 321300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1606500  |
| value_loss         | 0.000866 |
---------------------------------
---------------------------------
| explained_variance | 0.331    |
| fps                | 852      |
| nupdates           | 321400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1607000  |
| value_loss         | 0.000413 |
---------------------------------
---------------------------------
| explained_variance | 0.851    |
| fps                | 852      |
| nupdates           | 321500   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.998    |
| fps                | 853      |
| nupdates           | 324300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1621500  |
| value_loss         | 0.000957 |
---------------------------------
---------------------------------
| explained_variance | -2.22    |
| fps                | 853      |
| nupdates           | 324400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1622000  |
| value_loss         | 0.000216 |
---------------------------------
---------------------------------
| explained_variance | 0.915    |
| fps                | 853      |
| nupdates           | 324500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1622500  |
| value_loss         | 0.000148 |
---------------------------------
---------------------------------
| explained_variance | 0.976    |
| fps                | 853      |
| nupdates           | 324600   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -1.72    |
| fps                | 852      |
| nupdates           | 327300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1636500  |
| value_loss         | 0.00128  |
---------------------------------
---------------------------------
| explained_variance | 0.991    |
| fps                | 852      |
| nupdates           | 327400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1637000  |
| value_loss         | 6.48e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.787    |
| fps                | 852      |
| nupdates           | 327500   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1637500  |
| value_loss         | 0.00105  |
---------------------------------
---------------------------------
| explained_variance | -2.88    |
| fps                | 852      |
| nupdates           | 327600   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.908    |
| fps                | 852      |
| nupdates           | 330300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1651500  |
| value_loss         | 5.02e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.44     |
| fps                | 852      |
| nupdates           | 330400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1652000  |
| value_loss         | 0.00217  |
---------------------------------
---------------------------------
| explained_variance | 0.423    |
| fps                | 852      |
| nupdates           | 330500   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1652500  |
| value_loss         | 0.138    |
---------------------------------
---------------------------------
| explained_variance | -28.6    |
| fps                | 852      |
| nupdates           | 330600   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.443    |
| fps                | 852      |
| nupdates           | 333400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1667000  |
| value_loss         | 7.13e-06 |
---------------------------------
---------------------------------
| explained_variance | -8.55    |
| fps                | 852      |
| nupdates           | 333500   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1667500  |
| value_loss         | 0.000128 |
---------------------------------
---------------------------------
| explained_variance | 0.637    |
| fps                | 853      |
| nupdates           | 333600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1668000  |
| value_loss         | 0.000873 |
---------------------------------
---------------------------------
| explained_variance | 0.136    |
| fps                | 853      |
| nupdates           | 333700   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -13.1    |
| fps                | 852      |
| nupdates           | 336400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1682000  |
| value_loss         | 0.00129  |
---------------------------------
---------------------------------
| explained_variance | 0.767    |
| fps                | 852      |
| nupdates           | 336500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1682500  |
| value_loss         | 9.28e-05 |
---------------------------------
---------------------------------
| explained_variance | -32.6    |
| fps                | 852      |
| nupdates           | 336600   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1683000  |
| value_loss         | 0.0203   |
---------------------------------
---------------------------------
| explained_variance | -6.57    |
| fps                | 852      |
| nupdates           | 336700   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.825    |
| fps                | 853      |
| nupdates           | 339500   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1697500  |
| value_loss         | 0.000204 |
---------------------------------
---------------------------------
| explained_variance | 0.76     |
| fps                | 853      |
| nupdates           | 339600   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1698000  |
| value_loss         | 2.35e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.574    |
| fps                | 853      |
| nupdates           | 339700   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1698500  |
| value_loss         | 0.000214 |
---------------------------------
---------------------------------
| explained_variance | 0.87     |
| fps                | 853      |
| nupdates           | 339800   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.0428   |
| fps                | 852      |
| nupdates           | 342500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1712500  |
| value_loss         | 0.000125 |
---------------------------------
---------------------------------
| explained_variance | -0.723   |
| fps                | 852      |
| nupdates           | 342600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1713000  |
| value_loss         | 0.000307 |
---------------------------------
---------------------------------
| explained_variance | -5.84    |
| fps                | 852      |
| nupdates           | 342700   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1713500  |
| value_loss         | 0.000711 |
---------------------------------
---------------------------------
| explained_variance | 0.0567   |
| fps                | 852      |
| nupdates           | 342800   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.0332   |
| fps                | 852      |
| nupdates           | 345500   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1727500  |
| value_loss         | 0.000117 |
---------------------------------
---------------------------------
| explained_variance | 0.731    |
| fps                | 852      |
| nupdates           | 345600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1728000  |
| value_loss         | 0.000219 |
---------------------------------
---------------------------------
| explained_variance | 0.817    |
| fps                | 852      |
| nupdates           | 345700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1728500  |
| value_loss         | 3.03e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.978    |
| fps                | 852      |
| nupdates           | 345800   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.179   |
| fps                | 853      |
| nupdates           | 348600   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1743000  |
| value_loss         | 0.000574 |
---------------------------------
---------------------------------
| explained_variance | -1.1     |
| fps                | 853      |
| nupdates           | 348700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1743500  |
| value_loss         | 0.000208 |
---------------------------------
---------------------------------
| explained_variance | -6.29    |
| fps                | 853      |
| nupdates           | 348800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1744000  |
| value_loss         | 0.000973 |
---------------------------------
---------------------------------
| explained_variance | -18.5    |
| fps                | 853      |
| nupdates           | 348900   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.998    |
| fps                | 852      |
| nupdates           | 351600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1758000  |
| value_loss         | 0.000122 |
---------------------------------
---------------------------------
| explained_variance | -0.809   |
| fps                | 852      |
| nupdates           | 351700   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1758500  |
| value_loss         | 0.000118 |
---------------------------------
---------------------------------
| explained_variance | -0.109   |
| fps                | 852      |
| nupdates           | 351800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1759000  |
| value_loss         | 0.000199 |
---------------------------------
---------------------------------
| explained_variance | -0.349   |
| fps                | 852      |
| nupdates           | 351900   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.999    |
| fps                | 853      |
| nupdates           | 354700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1773500  |
| value_loss         | 1.84e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.805    |
| fps                | 853      |
| nupdates           | 354800   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1774000  |
| value_loss         | 0.00018  |
---------------------------------
---------------------------------
| explained_variance | 0.799    |
| fps                | 853      |
| nupdates           | 354900   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1774500  |
| value_loss         | 4.91e-05 |
---------------------------------
Eval num_timesteps=1775000, episode_reward=-4.90 +/- 0.30
Episode length: 610.20 +/- 158.04
---------------------------------
| explained_variance | 0.996    |
| fps                | 8

---------------------------------
| explained_variance | -1.89    |
| fps                | 852      |
| nupdates           | 357700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1788500  |
| value_loss         | 5.87e-05 |
---------------------------------
---------------------------------
| explained_variance | -8.24    |
| fps                | 852      |
| nupdates           | 357800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1789000  |
| value_loss         | 0.000103 |
---------------------------------
---------------------------------
| explained_variance | -0.717   |
| fps                | 852      |
| nupdates           | 357900   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1789500  |
| value_loss         | 0.00116  |
---------------------------------
---------------------------------
| explained_variance | -0.693   |
| fps                | 852      |
| nupdates           | 358000   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.708    |
| fps                | 851      |
| nupdates           | 360700   |
| policy_entropy     | 2.02     |
| total_timesteps    | 1803500  |
| value_loss         | 2.57e-05 |
---------------------------------
---------------------------------
| explained_variance | -7.18    |
| fps                | 851      |
| nupdates           | 360800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1804000  |
| value_loss         | 0.000875 |
---------------------------------
---------------------------------
| explained_variance | 0.795    |
| fps                | 851      |
| nupdates           | 360900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1804500  |
| value_loss         | 0.000308 |
---------------------------------
---------------------------------
| explained_variance | -4.37    |
| fps                | 851      |
| nupdates           | 361000   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.88     |
| fps                | 852      |
| nupdates           | 363800   |
| policy_entropy     | 2.01     |
| total_timesteps    | 1819000  |
| value_loss         | 2.74e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.435    |
| fps                | 852      |
| nupdates           | 363900   |
| policy_entropy     | 2.01     |
| total_timesteps    | 1819500  |
| value_loss         | 0.132    |
---------------------------------
---------------------------------
| explained_variance | -0.341   |
| fps                | 852      |
| nupdates           | 364000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1820000  |
| value_loss         | 0.000368 |
---------------------------------
---------------------------------
| explained_variance | -0.0807  |
| fps                | 852      |
| nupdates           | 364100   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.158    |
| fps                | 852      |
| nupdates           | 366800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1834000  |
| value_loss         | 0.000837 |
---------------------------------
---------------------------------
| explained_variance | -0.0303  |
| fps                | 852      |
| nupdates           | 366900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1834500  |
| value_loss         | 4.03e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.354    |
| fps                | 852      |
| nupdates           | 367000   |
| policy_entropy     | 2.03     |
| total_timesteps    | 1835000  |
| value_loss         | 0.155    |
---------------------------------
---------------------------------
| explained_variance | 0.582    |
| fps                | 852      |
| nupdates           | 367100   |
| policy_entropy     | 2.01     |
| total_timest

---------------------------------
| explained_variance | -1.55    |
| fps                | 852      |
| nupdates           | 369900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1849500  |
| value_loss         | 0.000628 |
---------------------------------
Eval num_timesteps=1850000, episode_reward=-4.90 +/- 0.30
Episode length: 698.50 +/- 141.23
---------------------------------
| explained_variance | 0.29     |
| fps                | 851      |
| nupdates           | 370000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1850000  |
| value_loss         | 6.95e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.0722  |
| fps                | 851      |
| nupdates           | 370100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1850500  |
| value_loss         | 0.000247 |
---------------------------------
---------------------------------
| explained_variance | 0.835    |
| fps                | 8

---------------------------------
| explained_variance | 0.965    |
| fps                | 852      |
| nupdates           | 372900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1864500  |
| value_loss         | 5.1e-05  |
---------------------------------
---------------------------------
| explained_variance | -1.04    |
| fps                | 852      |
| nupdates           | 373000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1865000  |
| value_loss         | 0.000251 |
---------------------------------
---------------------------------
| explained_variance | 0.457    |
| fps                | 852      |
| nupdates           | 373100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1865500  |
| value_loss         | 0.000453 |
---------------------------------
---------------------------------
| explained_variance | 0.527    |
| fps                | 852      |
| nupdates           | 373200   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -1.12    |
| fps                | 851      |
| nupdates           | 375900   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1879500  |
| value_loss         | 0.000274 |
---------------------------------
---------------------------------
| explained_variance | 0.844    |
| fps                | 851      |
| nupdates           | 376000   |
| policy_entropy     | 1.99     |
| total_timesteps    | 1880000  |
| value_loss         | 2.35e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.94    |
| fps                | 851      |
| nupdates           | 376100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1880500  |
| value_loss         | 0.000377 |
---------------------------------
---------------------------------
| explained_variance | 0.673    |
| fps                | 851      |
| nupdates           | 376200   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.234    |
| fps                | 852      |
| nupdates           | 379000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1895000  |
| value_loss         | 0.000293 |
---------------------------------
---------------------------------
| explained_variance | 0.298    |
| fps                | 852      |
| nupdates           | 379100   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1895500  |
| value_loss         | 0.00036  |
---------------------------------
---------------------------------
| explained_variance | 0.968    |
| fps                | 852      |
| nupdates           | 379200   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1896000  |
| value_loss         | 1.57e-05 |
---------------------------------
---------------------------------
| explained_variance | -8.28    |
| fps                | 852      |
| nupdates           | 379300   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.339    |
| fps                | 851      |
| nupdates           | 382000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1910000  |
| value_loss         | 0.103    |
---------------------------------
---------------------------------
| explained_variance | -3.52    |
| fps                | 851      |
| nupdates           | 382100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1910500  |
| value_loss         | 0.000596 |
---------------------------------
---------------------------------
| explained_variance | -2.39    |
| fps                | 851      |
| nupdates           | 382200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1911000  |
| value_loss         | 4.42e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.992    |
| fps                | 851      |
| nupdates           | 382300   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -108     |
| fps                | 850      |
| nupdates           | 385100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1925500  |
| value_loss         | 0.024    |
---------------------------------
---------------------------------
| explained_variance | -3.34    |
| fps                | 850      |
| nupdates           | 385200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1926000  |
| value_loss         | 7.34e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.594   |
| fps                | 850      |
| nupdates           | 385300   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1926500  |
| value_loss         | 0.000496 |
---------------------------------
---------------------------------
| explained_variance | -6.55    |
| fps                | 851      |
| nupdates           | 385400   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -1.48    |
| fps                | 851      |
| nupdates           | 388200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1941000  |
| value_loss         | 7.83e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.688    |
| fps                | 851      |
| nupdates           | 388300   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1941500  |
| value_loss         | 7.06e-05 |
---------------------------------
---------------------------------
| explained_variance | -3.24    |
| fps                | 851      |
| nupdates           | 388400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1942000  |
| value_loss         | 0.000124 |
---------------------------------
---------------------------------
| explained_variance | 0.586    |
| fps                | 851      |
| nupdates           | 388500   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -2.28    |
| fps                | 851      |
| nupdates           | 391200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1956000  |
| value_loss         | 4.77e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.991    |
| fps                | 851      |
| nupdates           | 391300   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1956500  |
| value_loss         | 1.74e-05 |
---------------------------------
---------------------------------
| explained_variance | -5.38    |
| fps                | 851      |
| nupdates           | 391400   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1957000  |
| value_loss         | 0.000623 |
---------------------------------
---------------------------------
| explained_variance | -86.7    |
| fps                | 851      |
| nupdates           | 391500   |
| policy_entropy     | 2.02     |
| total_timest

---------------------------------
| explained_variance | 0.632    |
| fps                | 851      |
| nupdates           | 394300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1971500  |
| value_loss         | 0.000445 |
---------------------------------
---------------------------------
| explained_variance | 0.906    |
| fps                | 851      |
| nupdates           | 394400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1972000  |
| value_loss         | 1.94e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.552    |
| fps                | 851      |
| nupdates           | 394500   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1972500  |
| value_loss         | 5.66e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.998    |
| fps                | 851      |
| nupdates           | 394600   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.0666   |
| fps                | 851      |
| nupdates           | 397300   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1986500  |
| value_loss         | 0.000253 |
---------------------------------
---------------------------------
| explained_variance | -1.94    |
| fps                | 851      |
| nupdates           | 397400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1987000  |
| value_loss         | 0.000219 |
---------------------------------
---------------------------------
| explained_variance | -8.03    |
| fps                | 851      |
| nupdates           | 397500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1987500  |
| value_loss         | 0.00266  |
---------------------------------
---------------------------------
| explained_variance | 0.44     |
| fps                | 851      |
| nupdates           | 397600   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.983    |
| fps                | 850      |
| nupdates           | 400300   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2001500  |
| value_loss         | 6.29e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.16    |
| fps                | 850      |
| nupdates           | 400400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2002000  |
| value_loss         | 0.000512 |
---------------------------------
---------------------------------
| explained_variance | -6.83    |
| fps                | 850      |
| nupdates           | 400500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2002500  |
| value_loss         | 0.00143  |
---------------------------------
---------------------------------
| explained_variance | 0.952    |
| fps                | 850      |
| nupdates           | 400600   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.805    |
| fps                | 851      |
| nupdates           | 403400   |
| policy_entropy     | 2.04     |
| total_timesteps    | 2017000  |
| value_loss         | 7.62e-06 |
---------------------------------
---------------------------------
| explained_variance | -6.66    |
| fps                | 851      |
| nupdates           | 403500   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2017500  |
| value_loss         | 8.55e-05 |
---------------------------------
---------------------------------
| explained_variance | -8.33    |
| fps                | 851      |
| nupdates           | 403600   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2018000  |
| value_loss         | 0.000919 |
---------------------------------
---------------------------------
| explained_variance | 0.952    |
| fps                | 851      |
| nupdates           | 403700   |
| policy_entropy     | 2.02     |
| total_timest

---------------------------------
| explained_variance | 0.916    |
| fps                | 850      |
| nupdates           | 406400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2032000  |
| value_loss         | 5.02e-06 |
---------------------------------
---------------------------------
| explained_variance | -31.3    |
| fps                | 850      |
| nupdates           | 406500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2032500  |
| value_loss         | 0.000961 |
---------------------------------
---------------------------------
| explained_variance | -0.106   |
| fps                | 850      |
| nupdates           | 406600   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2033000  |
| value_loss         | 0.000471 |
---------------------------------
---------------------------------
| explained_variance | 0.123    |
| fps                | 850      |
| nupdates           | 406700   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.808    |
| fps                | 851      |
| nupdates           | 409500   |
| policy_entropy     | 2.04     |
| total_timesteps    | 2047500  |
| value_loss         | 5.4e-05  |
---------------------------------
---------------------------------
| explained_variance | -13.4    |
| fps                | 851      |
| nupdates           | 409600   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2048000  |
| value_loss         | 0.000934 |
---------------------------------
---------------------------------
| explained_variance | 0.435    |
| fps                | 851      |
| nupdates           | 409700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2048500  |
| value_loss         | 0.000176 |
---------------------------------
---------------------------------
| explained_variance | 0.918    |
| fps                | 851      |
| nupdates           | 409800   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.964    |
| fps                | 850      |
| nupdates           | 412500   |
| policy_entropy     | 2.04     |
| total_timesteps    | 2062500  |
| value_loss         | 0.000155 |
---------------------------------
---------------------------------
| explained_variance | -0.831   |
| fps                | 850      |
| nupdates           | 412600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2063000  |
| value_loss         | 0.000303 |
---------------------------------
---------------------------------
| explained_variance | 0.882    |
| fps                | 850      |
| nupdates           | 412700   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2063500  |
| value_loss         | 2.55e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.06    |
| fps                | 850      |
| nupdates           | 412800   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.842    |
| fps                | 850      |
| nupdates           | 415500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2077500  |
| value_loss         | 0.000204 |
---------------------------------
---------------------------------
| explained_variance | 0.125    |
| fps                | 850      |
| nupdates           | 415600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2078000  |
| value_loss         | 5.56e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.386    |
| fps                | 850      |
| nupdates           | 415700   |
| policy_entropy     | 2.04     |
| total_timesteps    | 2078500  |
| value_loss         | 0.926    |
---------------------------------
---------------------------------
| explained_variance | 0.137    |
| fps                | 850      |
| nupdates           | 415800   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.981    |
| fps                | 850      |
| nupdates           | 418600   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2093000  |
| value_loss         | 1.14e-06 |
---------------------------------
---------------------------------
| explained_variance | -0.231   |
| fps                | 851      |
| nupdates           | 418700   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2093500  |
| value_loss         | 0.000226 |
---------------------------------
---------------------------------
| explained_variance | 0.319    |
| fps                | 851      |
| nupdates           | 418800   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2094000  |
| value_loss         | 4.2e-05  |
---------------------------------
---------------------------------
| explained_variance | -0.192   |
| fps                | 851      |
| nupdates           | 418900   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -1.82    |
| fps                | 850      |
| nupdates           | 421600   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2108000  |
| value_loss         | 0.000135 |
---------------------------------
---------------------------------
| explained_variance | 0.966    |
| fps                | 850      |
| nupdates           | 421700   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2108500  |
| value_loss         | 6.73e-06 |
---------------------------------
---------------------------------
| explained_variance | -2.68    |
| fps                | 850      |
| nupdates           | 421800   |
| policy_entropy     | 2.02     |
| total_timesteps    | 2109000  |
| value_loss         | 0.000963 |
---------------------------------
---------------------------------
| explained_variance | -0.0747  |
| fps                | 850      |
| nupdates           | 421900   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.93     |
| fps                | 850      |
| nupdates           | 424700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2123500  |
| value_loss         | 3.74e-05 |
---------------------------------
---------------------------------
| explained_variance | -3.88    |
| fps                | 850      |
| nupdates           | 424800   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2124000  |
| value_loss         | 0.000288 |
---------------------------------
---------------------------------
| explained_variance | -8.28    |
| fps                | 850      |
| nupdates           | 424900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2124500  |
| value_loss         | 0.000685 |
---------------------------------
Eval num_timesteps=2125000, episode_reward=-5.00 +/- 0.00
Episode length: 549.30 +/- 161.34
---------------------------------
| explained_variance | -14.8    |
| fps                | 8

---------------------------------
| explained_variance | 0.0662   |
| fps                | 850      |
| nupdates           | 427700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2138500  |
| value_loss         | 0.000366 |
---------------------------------
---------------------------------
| explained_variance | 0.801    |
| fps                | 850      |
| nupdates           | 427800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2139000  |
| value_loss         | 7.3e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.51     |
| fps                | 850      |
| nupdates           | 427900   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2139500  |
| value_loss         | 2.76e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.124   |
| fps                | 850      |
| nupdates           | 428000   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -1.05    |
| fps                | 850      |
| nupdates           | 430700   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2153500  |
| value_loss         | 0.000363 |
---------------------------------
---------------------------------
| explained_variance | 0.788    |
| fps                | 850      |
| nupdates           | 430800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2154000  |
| value_loss         | 0.000124 |
---------------------------------
---------------------------------
| explained_variance | 0.742    |
| fps                | 850      |
| nupdates           | 430900   |
| policy_entropy     | 2.04     |
| total_timesteps    | 2154500  |
| value_loss         | 7.41e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.89    |
| fps                | 850      |
| nupdates           | 431000   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.567    |
| fps                | 850      |
| nupdates           | 433800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2169000  |
| value_loss         | 7.7e-05  |
---------------------------------
---------------------------------
| explained_variance | -1.29    |
| fps                | 850      |
| nupdates           | 433900   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2169500  |
| value_loss         | 0.000998 |
---------------------------------
---------------------------------
| explained_variance | -0.283   |
| fps                | 850      |
| nupdates           | 434000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2170000  |
| value_loss         | 5.7e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.707    |
| fps                | 850      |
| nupdates           | 434100   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.826    |
| fps                | 849      |
| nupdates           | 436800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2184000  |
| value_loss         | 0.000148 |
---------------------------------
---------------------------------
| explained_variance | 0.888    |
| fps                | 849      |
| nupdates           | 436900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2184500  |
| value_loss         | 5.27e-05 |
---------------------------------
---------------------------------
| explained_variance | -258     |
| fps                | 849      |
| nupdates           | 437000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2185000  |
| value_loss         | 0.0129   |
---------------------------------
---------------------------------
| explained_variance | -0.0829  |
| fps                | 849      |
| nupdates           | 437100   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -13.4    |
| fps                | 850      |
| nupdates           | 439900   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2199500  |
| value_loss         | 0.00148  |
---------------------------------
Eval num_timesteps=2200000, episode_reward=-4.80 +/- 0.40
Episode length: 720.30 +/- 115.14
---------------------------------
| explained_variance | 0.626    |
| fps                | 848      |
| nupdates           | 440000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2200000  |
| value_loss         | 0.000536 |
---------------------------------
---------------------------------
| explained_variance | -2.65    |
| fps                | 848      |
| nupdates           | 440100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2200500  |
| value_loss         | 0.000454 |
---------------------------------
---------------------------------
| explained_variance | -10      |
| fps                | 8

---------------------------------
| explained_variance | -0.321   |
| fps                | 849      |
| nupdates           | 442900   |
| policy_entropy     | 2.04     |
| total_timesteps    | 2214500  |
| value_loss         | 0.000214 |
---------------------------------
---------------------------------
| explained_variance | -0.559   |
| fps                | 849      |
| nupdates           | 443000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2215000  |
| value_loss         | 0.000528 |
---------------------------------
---------------------------------
| explained_variance | -585     |
| fps                | 849      |
| nupdates           | 443100   |
| policy_entropy     | 2.03     |
| total_timesteps    | 2215500  |
| value_loss         | 0.0898   |
---------------------------------
---------------------------------
| explained_variance | -0.743   |
| fps                | 849      |
| nupdates           | 443200   |
| policy_entropy     | 1.99     |
| total_timest

---------------------------------
| explained_variance | 0.889    |
| fps                | 848      |
| nupdates           | 445900   |
| policy_entropy     | 1.96     |
| total_timesteps    | 2229500  |
| value_loss         | 1.14e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.801    |
| fps                | 848      |
| nupdates           | 446000   |
| policy_entropy     | 1.98     |
| total_timesteps    | 2230000  |
| value_loss         | 0.000309 |
---------------------------------
---------------------------------
| explained_variance | 0.934    |
| fps                | 848      |
| nupdates           | 446100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2230500  |
| value_loss         | 5.59e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.824    |
| fps                | 848      |
| nupdates           | 446200   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.765    |
| fps                | 849      |
| nupdates           | 449000   |
| policy_entropy     | 2.01     |
| total_timesteps    | 2245000  |
| value_loss         | 8.26e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.985    |
| fps                | 849      |
| nupdates           | 449100   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2245500  |
| value_loss         | 1.76e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.265    |
| fps                | 849      |
| nupdates           | 449200   |
| policy_entropy     | 2.04     |
| total_timesteps    | 2246000  |
| value_loss         | 0.262    |
---------------------------------
---------------------------------
| explained_variance | 0.449    |
| fps                | 849      |
| nupdates           | 449300   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.989    |
| fps                | 849      |
| nupdates           | 452000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2260000  |
| value_loss         | 2.93e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.3     |
| fps                | 849      |
| nupdates           | 452100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2260500  |
| value_loss         | 0.000139 |
---------------------------------
---------------------------------
| explained_variance | -7.01    |
| fps                | 849      |
| nupdates           | 452200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2261000  |
| value_loss         | 0.00209  |
---------------------------------
---------------------------------
| explained_variance | -1.97    |
| fps                | 849      |
| nupdates           | 452300   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -1.25    |
| fps                | 848      |
| nupdates           | 455100   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2275500  |
| value_loss         | 0.000199 |
---------------------------------
---------------------------------
| explained_variance | -0.383   |
| fps                | 848      |
| nupdates           | 455200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2276000  |
| value_loss         | 0.000283 |
---------------------------------
---------------------------------
| explained_variance | 0.401    |
| fps                | 848      |
| nupdates           | 455300   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2276500  |
| value_loss         | 0.000901 |
---------------------------------
---------------------------------
| explained_variance | -0.257   |
| fps                | 848      |
| nupdates           | 455400   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -1.93    |
| fps                | 849      |
| nupdates           | 458200   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2291000  |
| value_loss         | 0.000657 |
---------------------------------
---------------------------------
| explained_variance | 0.677    |
| fps                | 849      |
| nupdates           | 458300   |
| policy_entropy     | 2.04     |
| total_timesteps    | 2291500  |
| value_loss         | 0.000158 |
---------------------------------
---------------------------------
| explained_variance | 0.91     |
| fps                | 849      |
| nupdates           | 458400   |
| policy_entropy     | 2.04     |
| total_timesteps    | 2292000  |
| value_loss         | 6.4e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.921    |
| fps                | 849      |
| nupdates           | 458500   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -6.83    |
| fps                | 849      |
| nupdates           | 461200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2306000  |
| value_loss         | 0.000383 |
---------------------------------
---------------------------------
| explained_variance | 0.945    |
| fps                | 849      |
| nupdates           | 461300   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2306500  |
| value_loss         | 1.23e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.925    |
| fps                | 849      |
| nupdates           | 461400   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2307000  |
| value_loss         | 0.000152 |
---------------------------------
---------------------------------
| explained_variance | 0.112    |
| fps                | 849      |
| nupdates           | 461500   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -3.5     |
| fps                | 849      |
| nupdates           | 464300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2321500  |
| value_loss         | 0.00057  |
---------------------------------
---------------------------------
| explained_variance | 0.363    |
| fps                | 849      |
| nupdates           | 464400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2322000  |
| value_loss         | 0.000198 |
---------------------------------
---------------------------------
| explained_variance | 0.207    |
| fps                | 849      |
| nupdates           | 464500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2322500  |
| value_loss         | 0.000286 |
---------------------------------
---------------------------------
| explained_variance | 0.82     |
| fps                | 850      |
| nupdates           | 464600   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -1.02    |
| fps                | 849      |
| nupdates           | 467300   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2336500  |
| value_loss         | 0.00104  |
---------------------------------
---------------------------------
| explained_variance | 0.715    |
| fps                | 849      |
| nupdates           | 467400   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2337000  |
| value_loss         | 0.00865  |
---------------------------------
---------------------------------
| explained_variance | -2.72    |
| fps                | 849      |
| nupdates           | 467500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2337500  |
| value_loss         | 0.000211 |
---------------------------------
---------------------------------
| explained_variance | 0.893    |
| fps                | 849      |
| nupdates           | 467600   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -6.29    |
| fps                | 849      |
| nupdates           | 470300   |
| policy_entropy     | 2.04     |
| total_timesteps    | 2351500  |
| value_loss         | 0.000724 |
---------------------------------
---------------------------------
| explained_variance | 0.41     |
| fps                | 849      |
| nupdates           | 470400   |
| policy_entropy     | 2.01     |
| total_timesteps    | 2352000  |
| value_loss         | 0.155    |
---------------------------------
---------------------------------
| explained_variance | -0.511   |
| fps                | 849      |
| nupdates           | 470500   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2352500  |
| value_loss         | 9.05e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.248    |
| fps                | 849      |
| nupdates           | 470600   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.394    |
| fps                | 849      |
| nupdates           | 473400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2367000  |
| value_loss         | 0.000688 |
---------------------------------
---------------------------------
| explained_variance | -0.12    |
| fps                | 849      |
| nupdates           | 473500   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2367500  |
| value_loss         | 0.000196 |
---------------------------------
---------------------------------
| explained_variance | 0.996    |
| fps                | 849      |
| nupdates           | 473600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2368000  |
| value_loss         | 9.82e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.52     |
| fps                | 849      |
| nupdates           | 473700   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -0.909   |
| fps                | 849      |
| nupdates           | 476400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2382000  |
| value_loss         | 0.000131 |
---------------------------------
---------------------------------
| explained_variance | -0.896   |
| fps                | 849      |
| nupdates           | 476500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2382500  |
| value_loss         | 0.00105  |
---------------------------------
---------------------------------
| explained_variance | 0.428    |
| fps                | 849      |
| nupdates           | 476600   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2383000  |
| value_loss         | 0.135    |
---------------------------------
---------------------------------
| explained_variance | 0.957    |
| fps                | 849      |
| nupdates           | 476700   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.936    |
| fps                | 850      |
| nupdates           | 479500   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2397500  |
| value_loss         | 5.77e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.106   |
| fps                | 850      |
| nupdates           | 479600   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2398000  |
| value_loss         | 0.00035  |
---------------------------------
---------------------------------
| explained_variance | 0.969    |
| fps                | 850      |
| nupdates           | 479700   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2398500  |
| value_loss         | 1.52e-05 |
---------------------------------
---------------------------------
| explained_variance | -4.02    |
| fps                | 850      |
| nupdates           | 479800   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -3.48    |
| fps                | 849      |
| nupdates           | 482500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2412500  |
| value_loss         | 0.00101  |
---------------------------------
---------------------------------
| explained_variance | 0.974    |
| fps                | 849      |
| nupdates           | 482600   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2413000  |
| value_loss         | 9.41e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.849    |
| fps                | 849      |
| nupdates           | 482700   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2413500  |
| value_loss         | 0.00015  |
---------------------------------
---------------------------------
| explained_variance | 0.989    |
| fps                | 849      |
| nupdates           | 482800   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.232    |
| fps                | 849      |
| nupdates           | 485500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2427500  |
| value_loss         | 5.4e-05  |
---------------------------------
----------------------------------
| explained_variance | -1.28e+04 |
| fps                | 849       |
| nupdates           | 485600    |
| policy_entropy     | 2.06      |
| total_timesteps    | 2428000   |
| value_loss         | 0.286     |
----------------------------------
---------------------------------
| explained_variance | 0.699    |
| fps                | 849      |
| nupdates           | 485700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2428500  |
| value_loss         | 0.000232 |
---------------------------------
---------------------------------
| explained_variance | -2.61    |
| fps                | 849      |
| nupdates           | 485800   |
| policy_entropy     | 2.06     |
| tota

---------------------------------
| explained_variance | -2.35    |
| fps                | 849      |
| nupdates           | 488600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2443000  |
| value_loss         | 8.54e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.76     |
| fps                | 849      |
| nupdates           | 488700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2443500  |
| value_loss         | 9.38e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.794    |
| fps                | 849      |
| nupdates           | 488800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2444000  |
| value_loss         | 4.38e-06 |
---------------------------------
---------------------------------
| explained_variance | -0.297   |
| fps                | 849      |
| nupdates           | 488900   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -0.151   |
| fps                | 849      |
| nupdates           | 491600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2458000  |
| value_loss         | 0.000121 |
---------------------------------
---------------------------------
| explained_variance | 0.904    |
| fps                | 849      |
| nupdates           | 491700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2458500  |
| value_loss         | 3.82e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.157    |
| fps                | 849      |
| nupdates           | 491800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2459000  |
| value_loss         | 0.000255 |
---------------------------------
---------------------------------
| explained_variance | -0.0158  |
| fps                | 849      |
| nupdates           | 491900   |
| policy_entropy     | 2.02     |
| total_timest

---------------------------------
| explained_variance | -0.0475  |
| fps                | 850      |
| nupdates           | 494700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2473500  |
| value_loss         | 8.1e-05  |
---------------------------------
---------------------------------
| explained_variance | -0.307   |
| fps                | 850      |
| nupdates           | 494800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2474000  |
| value_loss         | 0.000304 |
---------------------------------
---------------------------------
| explained_variance | 0.00168  |
| fps                | 850      |
| nupdates           | 494900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2474500  |
| value_loss         | 5.52e-05 |
---------------------------------
Eval num_timesteps=2475000, episode_reward=-5.00 +/- 0.00
Episode length: 588.30 +/- 71.93
---------------------------------
| explained_variance | -7.3     |
| fps                | 84

---------------------------------
| explained_variance | -5.29    |
| fps                | 849      |
| nupdates           | 497700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2488500  |
| value_loss         | 0.00212  |
---------------------------------
---------------------------------
| explained_variance | 0.934    |
| fps                | 849      |
| nupdates           | 497800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2489000  |
| value_loss         | 5.22e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.419   |
| fps                | 849      |
| nupdates           | 497900   |
| policy_entropy     | 1.96     |
| total_timesteps    | 2489500  |
| value_loss         | 0.00024  |
---------------------------------
---------------------------------
| explained_variance | 0.695    |
| fps                | 849      |
| nupdates           | 498000   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.971    |
| fps                | 849      |
| nupdates           | 500700   |
| policy_entropy     | 2.04     |
| total_timesteps    | 2503500  |
| value_loss         | 6.01e-05 |
---------------------------------
---------------------------------
| explained_variance | -8.02    |
| fps                | 849      |
| nupdates           | 500800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2504000  |
| value_loss         | 0.0033   |
---------------------------------
---------------------------------
| explained_variance | 0.993    |
| fps                | 849      |
| nupdates           | 500900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2504500  |
| value_loss         | 1.54e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.368   |
| fps                | 849      |
| nupdates           | 501000   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.926    |
| fps                | 850      |
| nupdates           | 503800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2519000  |
| value_loss         | 3.82e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.17    |
| fps                | 850      |
| nupdates           | 503900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2519500  |
| value_loss         | 0.00122  |
---------------------------------
---------------------------------
| explained_variance | 0.842    |
| fps                | 850      |
| nupdates           | 504000   |
| policy_entropy     | 2        |
| total_timesteps    | 2520000  |
| value_loss         | 0.000107 |
---------------------------------
---------------------------------
| explained_variance | -1.27    |
| fps                | 850      |
| nupdates           | 504100   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.27    |
| fps                | 849      |
| nupdates           | 506800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2534000  |
| value_loss         | 8.93e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.866    |
| fps                | 849      |
| nupdates           | 506900   |
| policy_entropy     | 2.01     |
| total_timesteps    | 2534500  |
| value_loss         | 0.000129 |
---------------------------------
---------------------------------
| explained_variance | -1.18    |
| fps                | 849      |
| nupdates           | 507000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2535000  |
| value_loss         | 2.68e-05 |
---------------------------------
---------------------------------
| explained_variance | -8.28    |
| fps                | 849      |
| nupdates           | 507100   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -10.6    |
| fps                | 850      |
| nupdates           | 509900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2549500  |
| value_loss         | 0.00018  |
---------------------------------
Eval num_timesteps=2550000, episode_reward=-4.90 +/- 0.30
Episode length: 601.30 +/- 106.92
---------------------------------
| explained_variance | -7.06    |
| fps                | 849      |
| nupdates           | 510000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2550000  |
| value_loss         | 0.00189  |
---------------------------------
---------------------------------
| explained_variance | 0.725    |
| fps                | 849      |
| nupdates           | 510100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2550500  |
| value_loss         | 0.000128 |
---------------------------------
---------------------------------
| explained_variance | -139     |
| fps                | 8

---------------------------------
| explained_variance | -0.613   |
| fps                | 849      |
| nupdates           | 512900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2564500  |
| value_loss         | 0.000129 |
---------------------------------
---------------------------------
| explained_variance | 0.989    |
| fps                | 849      |
| nupdates           | 513000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2565000  |
| value_loss         | 1.41e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.461   |
| fps                | 849      |
| nupdates           | 513100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2565500  |
| value_loss         | 0.00049  |
---------------------------------
---------------------------------
| explained_variance | 0.663    |
| fps                | 849      |
| nupdates           | 513200   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.0249   |
| fps                | 848      |
| nupdates           | 515900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2579500  |
| value_loss         | 8.3e-05  |
---------------------------------
---------------------------------
| explained_variance | -3.25    |
| fps                | 848      |
| nupdates           | 516000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2580000  |
| value_loss         | 8.71e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.871    |
| fps                | 848      |
| nupdates           | 516100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2580500  |
| value_loss         | 3.59e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.0127  |
| fps                | 848      |
| nupdates           | 516200   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -2.08    |
| fps                | 849      |
| nupdates           | 519000   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2595000  |
| value_loss         | 6.16e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.246   |
| fps                | 849      |
| nupdates           | 519100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2595500  |
| value_loss         | 0.00035  |
---------------------------------
---------------------------------
| explained_variance | 0.978    |
| fps                | 849      |
| nupdates           | 519200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2596000  |
| value_loss         | 9.53e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.813    |
| fps                | 849      |
| nupdates           | 519300   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -6.7     |
| fps                | 848      |
| nupdates           | 522000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2610000  |
| value_loss         | 0.000235 |
---------------------------------
---------------------------------
| explained_variance | -0.442   |
| fps                | 848      |
| nupdates           | 522100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2610500  |
| value_loss         | 0.000592 |
---------------------------------
---------------------------------
| explained_variance | -0.245   |
| fps                | 848      |
| nupdates           | 522200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2611000  |
| value_loss         | 0.000114 |
---------------------------------
---------------------------------
| explained_variance | 0.304    |
| fps                | 848      |
| nupdates           | 522300   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.0307  |
| fps                | 848      |
| nupdates           | 525100   |
| policy_entropy     | 2.03     |
| total_timesteps    | 2625500  |
| value_loss         | 0.241    |
---------------------------------
---------------------------------
| explained_variance | 0.914    |
| fps                | 848      |
| nupdates           | 525200   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2626000  |
| value_loss         | 1.27e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.779   |
| fps                | 848      |
| nupdates           | 525300   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2626500  |
| value_loss         | 7.19e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.363    |
| fps                | 848      |
| nupdates           | 525400   |
| policy_entropy     | 1.95     |
| total_timest

---------------------------------
| explained_variance | -3.88    |
| fps                | 849      |
| nupdates           | 528200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2641000  |
| value_loss         | 0.0028   |
---------------------------------
---------------------------------
| explained_variance | -7.46    |
| fps                | 849      |
| nupdates           | 528300   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2641500  |
| value_loss         | 0.000187 |
---------------------------------
---------------------------------
| explained_variance | -1.08    |
| fps                | 849      |
| nupdates           | 528400   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2642000  |
| value_loss         | 0.000117 |
---------------------------------
---------------------------------
| explained_variance | 0.634    |
| fps                | 849      |
| nupdates           | 528500   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -0.348   |
| fps                | 848      |
| nupdates           | 531200   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2656000  |
| value_loss         | 0.00167  |
---------------------------------
---------------------------------
| explained_variance | 0.893    |
| fps                | 848      |
| nupdates           | 531300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2656500  |
| value_loss         | 7.94e-05 |
---------------------------------
---------------------------------
| explained_variance | -4.74    |
| fps                | 848      |
| nupdates           | 531400   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2657000  |
| value_loss         | 7.54e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.64    |
| fps                | 848      |
| nupdates           | 531500   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -1.4e+03 |
| fps                | 849      |
| nupdates           | 534300   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2671500  |
| value_loss         | 0.0912   |
---------------------------------
---------------------------------
| explained_variance | -0.0109  |
| fps                | 849      |
| nupdates           | 534400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2672000  |
| value_loss         | 0.156    |
---------------------------------
---------------------------------
| explained_variance | 0.96     |
| fps                | 849      |
| nupdates           | 534500   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2672500  |
| value_loss         | 0.000106 |
---------------------------------
---------------------------------
| explained_variance | -0.0392  |
| fps                | 849      |
| nupdates           | 534600   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.413    |
| fps                | 848      |
| nupdates           | 537300   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2686500  |
| value_loss         | 0.146    |
---------------------------------
---------------------------------
| explained_variance | 0.948    |
| fps                | 848      |
| nupdates           | 537400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2687000  |
| value_loss         | 0.00015  |
---------------------------------
---------------------------------
| explained_variance | 0.79     |
| fps                | 848      |
| nupdates           | 537500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2687500  |
| value_loss         | 5.2e-06  |
---------------------------------
---------------------------------
| explained_variance | -2.41    |
| fps                | 848      |
| nupdates           | 537600   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.824    |
| fps                | 848      |
| nupdates           | 540300   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2701500  |
| value_loss         | 5.46e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.933    |
| fps                | 848      |
| nupdates           | 540400   |
| policy_entropy     | 2.04     |
| total_timesteps    | 2702000  |
| value_loss         | 1.43e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.808    |
| fps                | 848      |
| nupdates           | 540500   |
| policy_entropy     | 2.01     |
| total_timesteps    | 2702500  |
| value_loss         | 9.12e-06 |
---------------------------------
---------------------------------
| explained_variance | -0.0811  |
| fps                | 848      |
| nupdates           | 540600   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -2.26    |
| fps                | 849      |
| nupdates           | 543400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2717000  |
| value_loss         | 0.000198 |
---------------------------------
---------------------------------
| explained_variance | -12.4    |
| fps                | 849      |
| nupdates           | 543500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2717500  |
| value_loss         | 0.000394 |
---------------------------------
---------------------------------
| explained_variance | 0.26     |
| fps                | 849      |
| nupdates           | 543600   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2718000  |
| value_loss         | 0.00011  |
---------------------------------
---------------------------------
| explained_variance | 0.211    |
| fps                | 849      |
| nupdates           | 543700   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -9.9     |
| fps                | 849      |
| nupdates           | 546400   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2732000  |
| value_loss         | 0.000487 |
---------------------------------
---------------------------------
| explained_variance | 0.591    |
| fps                | 849      |
| nupdates           | 546500   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2732500  |
| value_loss         | 0.000169 |
---------------------------------
---------------------------------
| explained_variance | 0.654    |
| fps                | 849      |
| nupdates           | 546600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2733000  |
| value_loss         | 3.4e-05  |
---------------------------------
---------------------------------
| explained_variance | -8.12    |
| fps                | 849      |
| nupdates           | 546700   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.00888  |
| fps                | 849      |
| nupdates           | 549500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2747500  |
| value_loss         | 3.42e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.612    |
| fps                | 849      |
| nupdates           | 549600   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2748000  |
| value_loss         | 0.000269 |
---------------------------------
---------------------------------
| explained_variance | 0.647    |
| fps                | 849      |
| nupdates           | 549700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2748500  |
| value_loss         | 1.84e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.861    |
| fps                | 849      |
| nupdates           | 549800   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.942    |
| fps                | 849      |
| nupdates           | 552500   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2762500  |
| value_loss         | 5.76e-06 |
---------------------------------
---------------------------------
| explained_variance | -2.78    |
| fps                | 849      |
| nupdates           | 552600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2763000  |
| value_loss         | 0.00042  |
---------------------------------
---------------------------------
| explained_variance | -3.81    |
| fps                | 849      |
| nupdates           | 552700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2763500  |
| value_loss         | 0.000101 |
---------------------------------
---------------------------------
| explained_variance | 0.671    |
| fps                | 849      |
| nupdates           | 552800   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.742    |
| fps                | 849      |
| nupdates           | 555500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2777500  |
| value_loss         | 8.99e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.835    |
| fps                | 849      |
| nupdates           | 555600   |
| policy_entropy     | 2.01     |
| total_timesteps    | 2778000  |
| value_loss         | 0.000212 |
---------------------------------
---------------------------------
| explained_variance | 0.294    |
| fps                | 849      |
| nupdates           | 555700   |
| policy_entropy     | 2.04     |
| total_timesteps    | 2778500  |
| value_loss         | 0.000329 |
---------------------------------
---------------------------------
| explained_variance | 0.284    |
| fps                | 849      |
| nupdates           | 555800   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.081   |
| fps                | 849      |
| nupdates           | 558600   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2793000  |
| value_loss         | 0.000268 |
---------------------------------
---------------------------------
| explained_variance | -0.663   |
| fps                | 849      |
| nupdates           | 558700   |
| policy_entropy     | 2.01     |
| total_timesteps    | 2793500  |
| value_loss         | 0.000466 |
---------------------------------
---------------------------------
| explained_variance | 0.852    |
| fps                | 850      |
| nupdates           | 558800   |
| policy_entropy     | 2.04     |
| total_timesteps    | 2794000  |
| value_loss         | 3.72e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.942    |
| fps                | 850      |
| nupdates           | 558900   |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | 0.994    |
| fps                | 849      |
| nupdates           | 561600   |
| policy_entropy     | 2.03     |
| total_timesteps    | 2808000  |
| value_loss         | 6.8e-06  |
---------------------------------
---------------------------------
| explained_variance | -2.98    |
| fps                | 849      |
| nupdates           | 561700   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2808500  |
| value_loss         | 0.000118 |
---------------------------------
---------------------------------
| explained_variance | -81.3    |
| fps                | 849      |
| nupdates           | 561800   |
| policy_entropy     | 2.04     |
| total_timesteps    | 2809000  |
| value_loss         | 0.024    |
---------------------------------
---------------------------------
| explained_variance | -1.57    |
| fps                | 849      |
| nupdates           | 561900   |
| policy_entropy     | 2.05     |
| total_timest

----------------------------------
| explained_variance | -1.07e+04 |
| fps                | 850       |
| nupdates           | 564700    |
| policy_entropy     | 2.05      |
| total_timesteps    | 2823500   |
| value_loss         | 0.0982    |
----------------------------------
---------------------------------
| explained_variance | -0.758   |
| fps                | 850      |
| nupdates           | 564800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2824000  |
| value_loss         | 0.000398 |
---------------------------------
---------------------------------
| explained_variance | 0.939    |
| fps                | 850      |
| nupdates           | 564900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2824500  |
| value_loss         | 9.8e-05  |
---------------------------------
Eval num_timesteps=2825000, episode_reward=-4.90 +/- 0.30
Episode length: 681.20 +/- 177.49
---------------------------------
| explained_variance | 0.721    |
| fps           

---------------------------------
| explained_variance | 0.719    |
| fps                | 849      |
| nupdates           | 567700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2838500  |
| value_loss         | 4.65e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.196    |
| fps                | 849      |
| nupdates           | 567800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2839000  |
| value_loss         | 0.145    |
---------------------------------
---------------------------------
| explained_variance | 0.704    |
| fps                | 849      |
| nupdates           | 567900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2839500  |
| value_loss         | 1.89e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.53    |
| fps                | 849      |
| nupdates           | 568000   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.603    |
| fps                | 848      |
| nupdates           | 570700   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2853500  |
| value_loss         | 0.000157 |
---------------------------------
---------------------------------
| explained_variance | -0.434   |
| fps                | 848      |
| nupdates           | 570800   |
| policy_entropy     | 2        |
| total_timesteps    | 2854000  |
| value_loss         | 0.00135  |
---------------------------------
---------------------------------
| explained_variance | -23.6    |
| fps                | 848      |
| nupdates           | 570900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2854500  |
| value_loss         | 0.000575 |
---------------------------------
---------------------------------
| explained_variance | -5.78    |
| fps                | 848      |
| nupdates           | 571000   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.995    |
| fps                | 849      |
| nupdates           | 573800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2869000  |
| value_loss         | 3.27e-06 |
---------------------------------
---------------------------------
| explained_variance | -0.265   |
| fps                | 849      |
| nupdates           | 573900   |
| policy_entropy     | 2.04     |
| total_timesteps    | 2869500  |
| value_loss         | 0.000831 |
---------------------------------
---------------------------------
| explained_variance | 0.465    |
| fps                | 849      |
| nupdates           | 574000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2870000  |
| value_loss         | 5.7e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.123    |
| fps                | 849      |
| nupdates           | 574100   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.365    |
| fps                | 848      |
| nupdates           | 576800   |
| policy_entropy     | 2.01     |
| total_timesteps    | 2884000  |
| value_loss         | 0.099    |
---------------------------------
---------------------------------
| explained_variance | 0.998    |
| fps                | 848      |
| nupdates           | 576900   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2884500  |
| value_loss         | 3.19e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.535    |
| fps                | 848      |
| nupdates           | 577000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2885000  |
| value_loss         | 0.000116 |
---------------------------------
---------------------------------
| explained_variance | -0.0119  |
| fps                | 848      |
| nupdates           | 577100   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.797    |
| fps                | 848      |
| nupdates           | 579900   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2899500  |
| value_loss         | 2.38e-05 |
---------------------------------
Eval num_timesteps=2900000, episode_reward=-4.80 +/- 0.40
Episode length: 634.00 +/- 148.33
---------------------------------
| explained_variance | -0.0445  |
| fps                | 847      |
| nupdates           | 580000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2900000  |
| value_loss         | 7.47e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.352    |
| fps                | 847      |
| nupdates           | 580100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2900500  |
| value_loss         | 8.16e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.578   |
| fps                | 8

---------------------------------
| explained_variance | -6.48    |
| fps                | 847      |
| nupdates           | 582900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2914500  |
| value_loss         | 0.00113  |
---------------------------------
---------------------------------
| explained_variance | 0.423    |
| fps                | 847      |
| nupdates           | 583000   |
| policy_entropy     | 2.02     |
| total_timesteps    | 2915000  |
| value_loss         | 0.000323 |
---------------------------------
---------------------------------
| explained_variance | 0.85     |
| fps                | 847      |
| nupdates           | 583100   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2915500  |
| value_loss         | 0.000153 |
---------------------------------
---------------------------------
| explained_variance | -0.00798 |
| fps                | 847      |
| nupdates           | 583200   |
| policy_entropy     | 1.97     |
| total_timest

---------------------------------
| explained_variance | 0.704    |
| fps                | 847      |
| nupdates           | 585900   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2929500  |
| value_loss         | 0.000111 |
---------------------------------
---------------------------------
| explained_variance | -1.32    |
| fps                | 847      |
| nupdates           | 586000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2930000  |
| value_loss         | 8.47e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.968    |
| fps                | 847      |
| nupdates           | 586100   |
| policy_entropy     | 2.04     |
| total_timesteps    | 2930500  |
| value_loss         | 5.17e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.733    |
| fps                | 847      |
| nupdates           | 586200   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.924    |
| fps                | 847      |
| nupdates           | 589000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2945000  |
| value_loss         | 3.4e-06  |
---------------------------------
---------------------------------
| explained_variance | 0.397    |
| fps                | 847      |
| nupdates           | 589100   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2945500  |
| value_loss         | 0.000225 |
---------------------------------
---------------------------------
| explained_variance | 0.41     |
| fps                | 847      |
| nupdates           | 589200   |
| policy_entropy     | 2.01     |
| total_timesteps    | 2946000  |
| value_loss         | 0.144    |
---------------------------------
---------------------------------
| explained_variance | 0.877    |
| fps                | 847      |
| nupdates           | 589300   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.88     |
| fps                | 846      |
| nupdates           | 592000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2960000  |
| value_loss         | 7.74e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.736    |
| fps                | 846      |
| nupdates           | 592100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2960500  |
| value_loss         | 5.41e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.199   |
| fps                | 846      |
| nupdates           | 592200   |
| policy_entropy     | 2.03     |
| total_timesteps    | 2961000  |
| value_loss         | 0.000354 |
---------------------------------
---------------------------------
| explained_variance | 0.962    |
| fps                | 846      |
| nupdates           | 592300   |
| policy_entropy     | 1.91     |
| total_timest

----------------------------------
| explained_variance | -3.34e+03 |
| fps                | 846       |
| nupdates           | 595100    |
| policy_entropy     | 2.05      |
| total_timesteps    | 2975500   |
| value_loss         | 0.131     |
----------------------------------
---------------------------------
| explained_variance | 0.827    |
| fps                | 846      |
| nupdates           | 595200   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2976000  |
| value_loss         | 0.000108 |
---------------------------------
---------------------------------
| explained_variance | 0.674    |
| fps                | 846      |
| nupdates           | 595300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2976500  |
| value_loss         | 1.97e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.796    |
| fps                | 846      |
| nupdates           | 595400   |
| policy_entropy     | 2.06     |
| tota

---------------------------------
| explained_variance | 0.999    |
| fps                | 846      |
| nupdates           | 598200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2991000  |
| value_loss         | 1.71e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.491   |
| fps                | 846      |
| nupdates           | 598300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2991500  |
| value_loss         | 0.000167 |
---------------------------------
---------------------------------
| explained_variance | -1.35    |
| fps                | 846      |
| nupdates           | 598400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2992000  |
| value_loss         | 2.67e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.858    |
| fps                | 846      |
| nupdates           | 598500   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.911    |
| fps                | 845      |
| nupdates           | 601200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3006000  |
| value_loss         | 9.8e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.545    |
| fps                | 845      |
| nupdates           | 601300   |
| policy_entropy     | 2.02     |
| total_timesteps    | 3006500  |
| value_loss         | 9.69e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.733   |
| fps                | 845      |
| nupdates           | 601400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3007000  |
| value_loss         | 7.56e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.662    |
| fps                | 845      |
| nupdates           | 601500   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -23      |
| fps                | 845      |
| nupdates           | 604300   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3021500  |
| value_loss         | 0.00112  |
---------------------------------
---------------------------------
| explained_variance | 0.234    |
| fps                | 845      |
| nupdates           | 604400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3022000  |
| value_loss         | 0.000168 |
---------------------------------
---------------------------------
| explained_variance | 0.0167   |
| fps                | 845      |
| nupdates           | 604500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3022500  |
| value_loss         | 3.44e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.987    |
| fps                | 845      |
| nupdates           | 604600   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.986    |
| fps                | 845      |
| nupdates           | 607300   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3036500  |
| value_loss         | 1.07e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.51     |
| fps                | 845      |
| nupdates           | 607400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3037000  |
| value_loss         | 3.17e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.0023  |
| fps                | 845      |
| nupdates           | 607500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3037500  |
| value_loss         | 0.000722 |
---------------------------------
---------------------------------
| explained_variance | 0.799    |
| fps                | 845      |
| nupdates           | 607600   |
| policy_entropy     | 2.02     |
| total_timest

---------------------------------
| explained_variance | 0.874    |
| fps                | 844      |
| nupdates           | 610300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3051500  |
| value_loss         | 1.08e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.545    |
| fps                | 844      |
| nupdates           | 610400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3052000  |
| value_loss         | 0.000174 |
---------------------------------
---------------------------------
| explained_variance | 0.769    |
| fps                | 844      |
| nupdates           | 610500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3052500  |
| value_loss         | 9.72e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.25    |
| fps                | 844      |
| nupdates           | 610600   |
| policy_entropy     | 1.92     |
| total_timest

---------------------------------
| explained_variance | 0.0102   |
| fps                | 845      |
| nupdates           | 613400   |
| policy_entropy     | 2.01     |
| total_timesteps    | 3067000  |
| value_loss         | 0.000729 |
---------------------------------
---------------------------------
| explained_variance | 0.827    |
| fps                | 845      |
| nupdates           | 613500   |
| policy_entropy     | 2.04     |
| total_timesteps    | 3067500  |
| value_loss         | 0.000325 |
---------------------------------
---------------------------------
| explained_variance | -0.498   |
| fps                | 845      |
| nupdates           | 613600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3068000  |
| value_loss         | 9.13e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.963    |
| fps                | 845      |
| nupdates           | 613700   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.589    |
| fps                | 844      |
| nupdates           | 616400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3082000  |
| value_loss         | 0.000118 |
---------------------------------
----------------------------------
| explained_variance | -1.69e+03 |
| fps                | 844       |
| nupdates           | 616500    |
| policy_entropy     | 1.93      |
| total_timesteps    | 3082500   |
| value_loss         | 0.0361    |
----------------------------------
---------------------------------
| explained_variance | -40.9    |
| fps                | 844      |
| nupdates           | 616600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3083000  |
| value_loss         | 0.0029   |
---------------------------------
---------------------------------
| explained_variance | 0.682    |
| fps                | 844      |
| nupdates           | 616700   |
| policy_entropy     | 2.05     |
| tota

---------------------------------
| explained_variance | 0.915    |
| fps                | 845      |
| nupdates           | 619500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3097500  |
| value_loss         | 9.65e-07 |
---------------------------------
---------------------------------
| explained_variance | 0.0316   |
| fps                | 845      |
| nupdates           | 619600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3098000  |
| value_loss         | 0.000267 |
---------------------------------
---------------------------------
| explained_variance | -0.0151  |
| fps                | 845      |
| nupdates           | 619700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3098500  |
| value_loss         | 0.00116  |
---------------------------------
---------------------------------
| explained_variance | -1.56    |
| fps                | 845      |
| nupdates           | 619800   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.955    |
| fps                | 845      |
| nupdates           | 622500   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3112500  |
| value_loss         | 2.51e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.542    |
| fps                | 845      |
| nupdates           | 622600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3113000  |
| value_loss         | 8.18e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.986    |
| fps                | 845      |
| nupdates           | 622700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3113500  |
| value_loss         | 4.22e-06 |
---------------------------------
---------------------------------
| explained_variance | -14      |
| fps                | 845      |
| nupdates           | 622800   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.772    |
| fps                | 844      |
| nupdates           | 625500   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3127500  |
| value_loss         | 2.13e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.469    |
| fps                | 844      |
| nupdates           | 625600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3128000  |
| value_loss         | 4.9e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.998    |
| fps                | 844      |
| nupdates           | 625700   |
| policy_entropy     | 2.04     |
| total_timesteps    | 3128500  |
| value_loss         | 1.03e-06 |
---------------------------------
---------------------------------
| explained_variance | -3.12    |
| fps                | 844      |
| nupdates           | 625800   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -8.37    |
| fps                | 845      |
| nupdates           | 628600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3143000  |
| value_loss         | 0.000106 |
---------------------------------
---------------------------------
| explained_variance | 0.902    |
| fps                | 845      |
| nupdates           | 628700   |
| policy_entropy     | 2.03     |
| total_timesteps    | 3143500  |
| value_loss         | 4.5e-05  |
---------------------------------
---------------------------------
| explained_variance | -0.0612  |
| fps                | 845      |
| nupdates           | 628800   |
| policy_entropy     | 1.97     |
| total_timesteps    | 3144000  |
| value_loss         | 0.000534 |
---------------------------------
---------------------------------
| explained_variance | 0.961    |
| fps                | 845      |
| nupdates           | 628900   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.83     |
| fps                | 845      |
| nupdates           | 631600   |
| policy_entropy     | 2.08     |
| total_timesteps    | 3158000  |
| value_loss         | 5.2e-06  |
---------------------------------
---------------------------------
| explained_variance | 0.982    |
| fps                | 845      |
| nupdates           | 631700   |
| policy_entropy     | 2.01     |
| total_timesteps    | 3158500  |
| value_loss         | 7.99e-07 |
---------------------------------
---------------------------------
| explained_variance | 0.00534  |
| fps                | 845      |
| nupdates           | 631800   |
| policy_entropy     | 1.92     |
| total_timesteps    | 3159000  |
| value_loss         | 0.929    |
---------------------------------
---------------------------------
| explained_variance | -0.239   |
| fps                | 845      |
| nupdates           | 631900   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.325   |
| fps                | 845      |
| nupdates           | 634700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3173500  |
| value_loss         | 5.1e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.376    |
| fps                | 845      |
| nupdates           | 634800   |
| policy_entropy     | 1.83     |
| total_timesteps    | 3174000  |
| value_loss         | 0.147    |
---------------------------------
---------------------------------
| explained_variance | 0.968    |
| fps                | 845      |
| nupdates           | 634900   |
| policy_entropy     | 2.08     |
| total_timesteps    | 3174500  |
| value_loss         | 1.05e-05 |
---------------------------------
Eval num_timesteps=3175000, episode_reward=-4.80 +/- 0.60
Episode length: 573.70 +/- 101.37
---------------------------------
| explained_variance | 0.219    |
| fps                | 8

---------------------------------
| explained_variance | -49      |
| fps                | 844      |
| nupdates           | 637700   |
| policy_entropy     | 2.04     |
| total_timesteps    | 3188500  |
| value_loss         | 0.0033   |
---------------------------------
---------------------------------
| explained_variance | 0.306    |
| fps                | 844      |
| nupdates           | 637800   |
| policy_entropy     | 1.78     |
| total_timesteps    | 3189000  |
| value_loss         | 0.209    |
---------------------------------
---------------------------------
| explained_variance | 0.987    |
| fps                | 844      |
| nupdates           | 637900   |
| policy_entropy     | 1.93     |
| total_timesteps    | 3189500  |
| value_loss         | 0.0198   |
---------------------------------
---------------------------------
| explained_variance | 0.206    |
| fps                | 844      |
| nupdates           | 638000   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.116   |
| fps                | 844      |
| nupdates           | 640700   |
| policy_entropy     | 2.08     |
| total_timesteps    | 3203500  |
| value_loss         | 0.000162 |
---------------------------------
---------------------------------
| explained_variance | 0.755    |
| fps                | 844      |
| nupdates           | 640800   |
| policy_entropy     | 2.08     |
| total_timesteps    | 3204000  |
| value_loss         | 0.000131 |
---------------------------------
---------------------------------
| explained_variance | 0.813    |
| fps                | 844      |
| nupdates           | 640900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3204500  |
| value_loss         | 5.33e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.606   |
| fps                | 844      |
| nupdates           | 641000   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.984    |
| fps                | 845      |
| nupdates           | 643800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3219000  |
| value_loss         | 1.1e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.0539   |
| fps                | 845      |
| nupdates           | 643900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3219500  |
| value_loss         | 0.00035  |
---------------------------------
---------------------------------
| explained_variance | -9.68    |
| fps                | 845      |
| nupdates           | 644000   |
| policy_entropy     | 1.96     |
| total_timesteps    | 3220000  |
| value_loss         | 0.15     |
---------------------------------
---------------------------------
| explained_variance | -2.85    |
| fps                | 845      |
| nupdates           | 644100   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -5.72    |
| fps                | 844      |
| nupdates           | 646800   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3234000  |
| value_loss         | 0.00287  |
---------------------------------
---------------------------------
| explained_variance | 0.976    |
| fps                | 844      |
| nupdates           | 646900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3234500  |
| value_loss         | 7.14e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.985    |
| fps                | 844      |
| nupdates           | 647000   |
| policy_entropy     | 1.74     |
| total_timesteps    | 3235000  |
| value_loss         | 0.00136  |
---------------------------------
---------------------------------
| explained_variance | 0.655    |
| fps                | 844      |
| nupdates           | 647100   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.188    |
| fps                | 845      |
| nupdates           | 649900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3249500  |
| value_loss         | 6.94e-05 |
---------------------------------
Eval num_timesteps=3250000, episode_reward=-4.80 +/- 0.60
Episode length: 558.50 +/- 143.04
---------------------------------
| explained_variance | -858     |
| fps                | 844      |
| nupdates           | 650000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3250000  |
| value_loss         | 0.0174   |
---------------------------------
---------------------------------
| explained_variance | 0.143    |
| fps                | 844      |
| nupdates           | 650100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3250500  |
| value_loss         | 0.000286 |
---------------------------------
---------------------------------
| explained_variance | -11.2    |
| fps                | 8

---------------------------------
| explained_variance | -1.1     |
| fps                | 844      |
| nupdates           | 652900   |
| policy_entropy     | 2.04     |
| total_timesteps    | 3264500  |
| value_loss         | 0.00117  |
---------------------------------
---------------------------------
| explained_variance | 0.695    |
| fps                | 844      |
| nupdates           | 653000   |
| policy_entropy     | 2.02     |
| total_timesteps    | 3265000  |
| value_loss         | 0.000222 |
---------------------------------
---------------------------------
| explained_variance | -0.561   |
| fps                | 844      |
| nupdates           | 653100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3265500  |
| value_loss         | 0.000447 |
---------------------------------
---------------------------------
| explained_variance | -1       |
| fps                | 844      |
| nupdates           | 653200   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -4.67    |
| fps                | 844      |
| nupdates           | 655900   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3279500  |
| value_loss         | 0.000135 |
---------------------------------
---------------------------------
| explained_variance | -0.131   |
| fps                | 844      |
| nupdates           | 656000   |
| policy_entropy     | 2.04     |
| total_timesteps    | 3280000  |
| value_loss         | 0.000875 |
---------------------------------
---------------------------------
| explained_variance | -0.988   |
| fps                | 844      |
| nupdates           | 656100   |
| policy_entropy     | 2.03     |
| total_timesteps    | 3280500  |
| value_loss         | 0.000585 |
---------------------------------
---------------------------------
| explained_variance | -0.0997  |
| fps                | 844      |
| nupdates           | 656200   |
| policy_entropy     | 2        |
| total_timest

---------------------------------
| explained_variance | 0.107    |
| fps                | 845      |
| nupdates           | 659000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3295000  |
| value_loss         | 0.000115 |
---------------------------------
---------------------------------
| explained_variance | 0.978    |
| fps                | 845      |
| nupdates           | 659100   |
| policy_entropy     | 2.03     |
| total_timesteps    | 3295500  |
| value_loss         | 4.14e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.966    |
| fps                | 845      |
| nupdates           | 659200   |
| policy_entropy     | 2.08     |
| total_timesteps    | 3296000  |
| value_loss         | 2.53e-05 |
---------------------------------
---------------------------------
| explained_variance | -7.44    |
| fps                | 845      |
| nupdates           | 659300   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.486    |
| fps                | 844      |
| nupdates           | 662000   |
| policy_entropy     | 2.08     |
| total_timesteps    | 3310000  |
| value_loss         | 0.000209 |
---------------------------------
---------------------------------
| explained_variance | 0.777    |
| fps                | 844      |
| nupdates           | 662100   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3310500  |
| value_loss         | 0.000386 |
---------------------------------
---------------------------------
| explained_variance | 0.285    |
| fps                | 844      |
| nupdates           | 662200   |
| policy_entropy     | 2.04     |
| total_timesteps    | 3311000  |
| value_loss         | 0.118    |
---------------------------------
---------------------------------
| explained_variance | -0.873   |
| fps                | 844      |
| nupdates           | 662300   |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | -0.773   |
| fps                | 844      |
| nupdates           | 665100   |
| policy_entropy     | 2.08     |
| total_timesteps    | 3325500  |
| value_loss         | 0.000761 |
---------------------------------
---------------------------------
| explained_variance | 0.256    |
| fps                | 844      |
| nupdates           | 665200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3326000  |
| value_loss         | 5.15e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.929    |
| fps                | 844      |
| nupdates           | 665300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3326500  |
| value_loss         | 1.57e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.947    |
| fps                | 844      |
| nupdates           | 665400   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.513    |
| fps                | 844      |
| nupdates           | 668200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3341000  |
| value_loss         | 2.12e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.405    |
| fps                | 844      |
| nupdates           | 668300   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3341500  |
| value_loss         | 0.000222 |
---------------------------------
---------------------------------
| explained_variance | -2.14    |
| fps                | 844      |
| nupdates           | 668400   |
| policy_entropy     | 2.08     |
| total_timesteps    | 3342000  |
| value_loss         | 0.000877 |
---------------------------------
---------------------------------
| explained_variance | -0.452   |
| fps                | 844      |
| nupdates           | 668500   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.576    |
| fps                | 844      |
| nupdates           | 671200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3356000  |
| value_loss         | 9.39e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.996    |
| fps                | 844      |
| nupdates           | 671300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3356500  |
| value_loss         | 1.87e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.947    |
| fps                | 844      |
| nupdates           | 671400   |
| policy_entropy     | 2.08     |
| total_timesteps    | 3357000  |
| value_loss         | 5.51e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.0535  |
| fps                | 844      |
| nupdates           | 671500   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.701    |
| fps                | 845      |
| nupdates           | 674300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3371500  |
| value_loss         | 0.000159 |
---------------------------------
---------------------------------
| explained_variance | -28      |
| fps                | 845      |
| nupdates           | 674400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3372000  |
| value_loss         | 0.0114   |
---------------------------------
---------------------------------
| explained_variance | 0.453    |
| fps                | 845      |
| nupdates           | 674500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3372500  |
| value_loss         | 2.49e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.193   |
| fps                | 845      |
| nupdates           | 674600   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.867    |
| fps                | 844      |
| nupdates           | 677300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3386500  |
| value_loss         | 7.82e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.665    |
| fps                | 844      |
| nupdates           | 677400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3387000  |
| value_loss         | 4.35e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.606    |
| fps                | 844      |
| nupdates           | 677500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3387500  |
| value_loss         | 0.000468 |
---------------------------------
---------------------------------
| explained_variance | 0.935    |
| fps                | 844      |
| nupdates           | 677600   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.972    |
| fps                | 844      |
| nupdates           | 680300   |
| policy_entropy     | 2.04     |
| total_timesteps    | 3401500  |
| value_loss         | 3.09e-05 |
---------------------------------
---------------------------------
| explained_variance | -3.97    |
| fps                | 844      |
| nupdates           | 680400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3402000  |
| value_loss         | 0.000907 |
---------------------------------
---------------------------------
| explained_variance | 0.0271   |
| fps                | 844      |
| nupdates           | 680500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3402500  |
| value_loss         | 0.000571 |
---------------------------------
---------------------------------
| explained_variance | -5.19    |
| fps                | 844      |
| nupdates           | 680600   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.453    |
| fps                | 845      |
| nupdates           | 683400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3417000  |
| value_loss         | 4.09e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.629    |
| fps                | 845      |
| nupdates           | 683500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3417500  |
| value_loss         | 4.52e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.597    |
| fps                | 845      |
| nupdates           | 683600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3418000  |
| value_loss         | 0.000164 |
---------------------------------
---------------------------------
| explained_variance | 0.94     |
| fps                | 845      |
| nupdates           | 683700   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.691    |
| fps                | 844      |
| nupdates           | 686400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3432000  |
| value_loss         | 7.51e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.419   |
| fps                | 844      |
| nupdates           | 686500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3432500  |
| value_loss         | 8.65e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.601    |
| fps                | 844      |
| nupdates           | 686600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3433000  |
| value_loss         | 0.000104 |
---------------------------------
---------------------------------
| explained_variance | -6.93    |
| fps                | 844      |
| nupdates           | 686700   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -7.52    |
| fps                | 845      |
| nupdates           | 689500   |
| policy_entropy     | 2.08     |
| total_timesteps    | 3447500  |
| value_loss         | 0.000264 |
---------------------------------
---------------------------------
| explained_variance | 0.886    |
| fps                | 845      |
| nupdates           | 689600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3448000  |
| value_loss         | 6.27e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.742    |
| fps                | 845      |
| nupdates           | 689700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3448500  |
| value_loss         | 0.000397 |
---------------------------------
---------------------------------
| explained_variance | 0.796    |
| fps                | 845      |
| nupdates           | 689800   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.603    |
| fps                | 844      |
| nupdates           | 692500   |
| policy_entropy     | 2.08     |
| total_timesteps    | 3462500  |
| value_loss         | 6.88e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.688    |
| fps                | 844      |
| nupdates           | 692600   |
| policy_entropy     | 2.04     |
| total_timesteps    | 3463000  |
| value_loss         | 0.000392 |
---------------------------------
---------------------------------
| explained_variance | -7.48    |
| fps                | 844      |
| nupdates           | 692700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3463500  |
| value_loss         | 0.00402  |
---------------------------------
---------------------------------
| explained_variance | -1.17    |
| fps                | 844      |
| nupdates           | 692800   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.781    |
| fps                | 844      |
| nupdates           | 695500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3477500  |
| value_loss         | 2.94e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.961    |
| fps                | 844      |
| nupdates           | 695600   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3478000  |
| value_loss         | 1.15e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.67     |
| fps                | 844      |
| nupdates           | 695700   |
| policy_entropy     | 2.01     |
| total_timesteps    | 3478500  |
| value_loss         | 0.000357 |
---------------------------------
---------------------------------
| explained_variance | -0.377   |
| fps                | 844      |
| nupdates           | 695800   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -21.9    |
| fps                | 844      |
| nupdates           | 698600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3493000  |
| value_loss         | 0.000632 |
---------------------------------
---------------------------------
| explained_variance | -45.6    |
| fps                | 844      |
| nupdates           | 698700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3493500  |
| value_loss         | 0.00854  |
---------------------------------
---------------------------------
| explained_variance | -1.99    |
| fps                | 844      |
| nupdates           | 698800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3494000  |
| value_loss         | 0.000271 |
---------------------------------
---------------------------------
| explained_variance | 0.975    |
| fps                | 844      |
| nupdates           | 698900   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.982    |
| fps                | 844      |
| nupdates           | 701600   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3508000  |
| value_loss         | 1.65e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.433    |
| fps                | 844      |
| nupdates           | 701700   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3508500  |
| value_loss         | 4.62e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.2      |
| fps                | 844      |
| nupdates           | 701800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3509000  |
| value_loss         | 0.00125  |
---------------------------------
---------------------------------
| explained_variance | 0.619    |
| fps                | 844      |
| nupdates           | 701900   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.757    |
| fps                | 845      |
| nupdates           | 704700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3523500  |
| value_loss         | 0.000128 |
---------------------------------
---------------------------------
| explained_variance | -0.635   |
| fps                | 845      |
| nupdates           | 704800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3524000  |
| value_loss         | 3.57e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.56    |
| fps                | 845      |
| nupdates           | 704900   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3524500  |
| value_loss         | 0.000325 |
---------------------------------
Eval num_timesteps=3525000, episode_reward=-4.70 +/- 0.46
Episode length: 625.70 +/- 122.65
---------------------------------
| explained_variance | 0.842    |
| fps                | 8

---------------------------------
| explained_variance | 0.693    |
| fps                | 844      |
| nupdates           | 707700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3538500  |
| value_loss         | 5.82e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.787    |
| fps                | 844      |
| nupdates           | 707800   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3539000  |
| value_loss         | 6.59e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.842    |
| fps                | 844      |
| nupdates           | 707900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3539500  |
| value_loss         | 5.4e-05  |
---------------------------------
---------------------------------
| explained_variance | -0.0331  |
| fps                | 844      |
| nupdates           | 708000   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.863    |
| fps                | 844      |
| nupdates           | 710700   |
| policy_entropy     | 2.04     |
| total_timesteps    | 3553500  |
| value_loss         | 4.31e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.948   |
| fps                | 844      |
| nupdates           | 710800   |
| policy_entropy     | 2.03     |
| total_timesteps    | 3554000  |
| value_loss         | 0.00227  |
---------------------------------
---------------------------------
| explained_variance | 0.903    |
| fps                | 844      |
| nupdates           | 710900   |
| policy_entropy     | 2.03     |
| total_timesteps    | 3554500  |
| value_loss         | 3.59e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.654    |
| fps                | 844      |
| nupdates           | 711000   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.0377   |
| fps                | 845      |
| nupdates           | 713800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3569000  |
| value_loss         | 0.000121 |
---------------------------------
---------------------------------
| explained_variance | 0.97     |
| fps                | 845      |
| nupdates           | 713900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3569500  |
| value_loss         | 3.45e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.559    |
| fps                | 845      |
| nupdates           | 714000   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3570000  |
| value_loss         | 0.000104 |
---------------------------------
---------------------------------
| explained_variance | 0.96     |
| fps                | 845      |
| nupdates           | 714100   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.672    |
| fps                | 845      |
| nupdates           | 716800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3584000  |
| value_loss         | 4.9e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.942    |
| fps                | 845      |
| nupdates           | 716900   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3584500  |
| value_loss         | 2.89e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.95     |
| fps                | 845      |
| nupdates           | 717000   |
| policy_entropy     | 2.08     |
| total_timesteps    | 3585000  |
| value_loss         | 3.6e-06  |
---------------------------------
---------------------------------
| explained_variance | 0.782    |
| fps                | 845      |
| nupdates           | 717100   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -6.06    |
| fps                | 845      |
| nupdates           | 719900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3599500  |
| value_loss         | 0.000361 |
---------------------------------
Eval num_timesteps=3600000, episode_reward=-4.90 +/- 0.30
Episode length: 569.10 +/- 86.68
---------------------------------
| explained_variance | 0.91     |
| fps                | 845      |
| nupdates           | 720000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3600000  |
| value_loss         | 3.03e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.117   |
| fps                | 845      |
| nupdates           | 720100   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3600500  |
| value_loss         | 0.000442 |
---------------------------------
---------------------------------
| explained_variance | -17      |
| fps                | 84

---------------------------------
| explained_variance | -49.5    |
| fps                | 845      |
| nupdates           | 722900   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3614500  |
| value_loss         | 0.0061   |
---------------------------------
---------------------------------
| explained_variance | 0.965    |
| fps                | 845      |
| nupdates           | 723000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3615000  |
| value_loss         | 3.77e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.978    |
| fps                | 845      |
| nupdates           | 723100   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3615500  |
| value_loss         | 1.27e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.972    |
| fps                | 846      |
| nupdates           | 723200   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.077   |
| fps                | 845      |
| nupdates           | 725900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3629500  |
| value_loss         | 0.000321 |
---------------------------------
---------------------------------
| explained_variance | 0.983    |
| fps                | 845      |
| nupdates           | 726000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3630000  |
| value_loss         | 1.03e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.224    |
| fps                | 845      |
| nupdates           | 726100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3630500  |
| value_loss         | 0.000222 |
---------------------------------
---------------------------------
| explained_variance | 0.977    |
| fps                | 845      |
| nupdates           | 726200   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.669   |
| fps                | 846      |
| nupdates           | 729000   |
| policy_entropy     | 2.08     |
| total_timesteps    | 3645000  |
| value_loss         | 0.000284 |
---------------------------------
---------------------------------
| explained_variance | 0.953    |
| fps                | 846      |
| nupdates           | 729100   |
| policy_entropy     | 2.02     |
| total_timesteps    | 3645500  |
| value_loss         | 9.35e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.988    |
| fps                | 846      |
| nupdates           | 729200   |
| policy_entropy     | 2.04     |
| total_timesteps    | 3646000  |
| value_loss         | 2.29e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.411    |
| fps                | 846      |
| nupdates           | 729300   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.646    |
| fps                | 846      |
| nupdates           | 732000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3660000  |
| value_loss         | 9.58e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.817    |
| fps                | 846      |
| nupdates           | 732100   |
| policy_entropy     | 2.03     |
| total_timesteps    | 3660500  |
| value_loss         | 0.000183 |
---------------------------------
---------------------------------
| explained_variance | 0.708    |
| fps                | 846      |
| nupdates           | 732200   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3661000  |
| value_loss         | 0.000324 |
---------------------------------
---------------------------------
| explained_variance | 0.0103   |
| fps                | 846      |
| nupdates           | 732300   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.728    |
| fps                | 846      |
| nupdates           | 735100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3675500  |
| value_loss         | 3.25e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.659    |
| fps                | 846      |
| nupdates           | 735200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3676000  |
| value_loss         | 0.000423 |
---------------------------------
---------------------------------
| explained_variance | 0.826    |
| fps                | 846      |
| nupdates           | 735300   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3676500  |
| value_loss         | 0.00012  |
---------------------------------
---------------------------------
| explained_variance | 0.0284   |
| fps                | 846      |
| nupdates           | 735400   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.96     |
| fps                | 846      |
| nupdates           | 738200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3691000  |
| value_loss         | 1.07e-05 |
---------------------------------
---------------------------------
| explained_variance | -3.74    |
| fps                | 846      |
| nupdates           | 738300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3691500  |
| value_loss         | 0.000523 |
---------------------------------
---------------------------------
| explained_variance | 0.0416   |
| fps                | 846      |
| nupdates           | 738400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3692000  |
| value_loss         | 0.000252 |
---------------------------------
---------------------------------
| explained_variance | 0.971    |
| fps                | 846      |
| nupdates           | 738500   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.444    |
| fps                | 846      |
| nupdates           | 741200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3706000  |
| value_loss         | 1.29e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.512    |
| fps                | 846      |
| nupdates           | 741300   |
| policy_entropy     | 2.08     |
| total_timesteps    | 3706500  |
| value_loss         | 0.00017  |
---------------------------------
---------------------------------
| explained_variance | -13.2    |
| fps                | 846      |
| nupdates           | 741400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3707000  |
| value_loss         | 0.000596 |
---------------------------------
---------------------------------
| explained_variance | -1.32    |
| fps                | 846      |
| nupdates           | 741500   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.892    |
| fps                | 846      |
| nupdates           | 744300   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3721500  |
| value_loss         | 5.53e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.057   |
| fps                | 847      |
| nupdates           | 744400   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3722000  |
| value_loss         | 0.000406 |
---------------------------------
---------------------------------
| explained_variance | 0.859    |
| fps                | 847      |
| nupdates           | 744500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3722500  |
| value_loss         | 0.000125 |
---------------------------------
---------------------------------
| explained_variance | 0.999    |
| fps                | 847      |
| nupdates           | 744600   |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | 0.783    |
| fps                | 846      |
| nupdates           | 747300   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3736500  |
| value_loss         | 0.00022  |
---------------------------------
---------------------------------
| explained_variance | 0.956    |
| fps                | 846      |
| nupdates           | 747400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3737000  |
| value_loss         | 1.76e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.865    |
| fps                | 846      |
| nupdates           | 747500   |
| policy_entropy     | 2.08     |
| total_timesteps    | 3737500  |
| value_loss         | 1.31e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.818    |
| fps                | 846      |
| nupdates           | 747600   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.89     |
| fps                | 846      |
| nupdates           | 750300   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3751500  |
| value_loss         | 5.36e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.0783   |
| fps                | 846      |
| nupdates           | 750400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3752000  |
| value_loss         | 3.27e-05 |
---------------------------------
---------------------------------
| explained_variance | -6.13    |
| fps                | 847      |
| nupdates           | 750500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3752500  |
| value_loss         | 0.000436 |
---------------------------------
---------------------------------
| explained_variance | 0.769    |
| fps                | 847      |
| nupdates           | 750600   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.958    |
| fps                | 847      |
| nupdates           | 753400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3767000  |
| value_loss         | 3.82e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.174    |
| fps                | 847      |
| nupdates           | 753500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3767500  |
| value_loss         | 0.000122 |
---------------------------------
---------------------------------
| explained_variance | 0.688    |
| fps                | 847      |
| nupdates           | 753600   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3768000  |
| value_loss         | 6.15e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.914    |
| fps                | 847      |
| nupdates           | 753700   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.0752   |
| fps                | 847      |
| nupdates           | 756400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3782000  |
| value_loss         | 0.000184 |
---------------------------------
---------------------------------
| explained_variance | 0.576    |
| fps                | 847      |
| nupdates           | 756500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3782500  |
| value_loss         | 0.000159 |
---------------------------------
---------------------------------
| explained_variance | 0.195    |
| fps                | 847      |
| nupdates           | 756600   |
| policy_entropy     | 2.08     |
| total_timesteps    | 3783000  |
| value_loss         | 0.000239 |
---------------------------------
---------------------------------
| explained_variance | 0.781    |
| fps                | 847      |
| nupdates           | 756700   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.508    |
| fps                | 847      |
| nupdates           | 759500   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3797500  |
| value_loss         | 5.49e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.938    |
| fps                | 848      |
| nupdates           | 759600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3798000  |
| value_loss         | 0.000103 |
---------------------------------
---------------------------------
| explained_variance | 0.862    |
| fps                | 848      |
| nupdates           | 759700   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3798500  |
| value_loss         | 0.000111 |
---------------------------------
---------------------------------
| explained_variance | -0.446   |
| fps                | 848      |
| nupdates           | 759800   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.367    |
| fps                | 847      |
| nupdates           | 762500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3812500  |
| value_loss         | 3.29e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.557    |
| fps                | 847      |
| nupdates           | 762600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3813000  |
| value_loss         | 5.49e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.577    |
| fps                | 847      |
| nupdates           | 762700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3813500  |
| value_loss         | 2.78e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.131   |
| fps                | 847      |
| nupdates           | 762800   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.954    |
| fps                | 847      |
| nupdates           | 765500   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3827500  |
| value_loss         | 9.51e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.747    |
| fps                | 847      |
| nupdates           | 765600   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3828000  |
| value_loss         | 3.68e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.868    |
| fps                | 847      |
| nupdates           | 765700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3828500  |
| value_loss         | 1.03e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.5      |
| fps                | 847      |
| nupdates           | 765800   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.983    |
| fps                | 848      |
| nupdates           | 768600   |
| policy_entropy     | 2.02     |
| total_timesteps    | 3843000  |
| value_loss         | 3.48e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.85     |
| fps                | 848      |
| nupdates           | 768700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3843500  |
| value_loss         | 2.87e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.3      |
| fps                | 848      |
| nupdates           | 768800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3844000  |
| value_loss         | 0.000325 |
---------------------------------
---------------------------------
| explained_variance | -0.566   |
| fps                | 848      |
| nupdates           | 768900   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.191   |
| fps                | 847      |
| nupdates           | 771600   |
| policy_entropy     | 2.03     |
| total_timesteps    | 3858000  |
| value_loss         | 8.26e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.862    |
| fps                | 847      |
| nupdates           | 771700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3858500  |
| value_loss         | 8.47e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.622    |
| fps                | 847      |
| nupdates           | 771800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3859000  |
| value_loss         | 0.000152 |
---------------------------------
---------------------------------
| explained_variance | -4.05    |
| fps                | 847      |
| nupdates           | 771900   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.379    |
| fps                | 848      |
| nupdates           | 774700   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3873500  |
| value_loss         | 0.144    |
---------------------------------
---------------------------------
| explained_variance | 0.278    |
| fps                | 848      |
| nupdates           | 774800   |
| policy_entropy     | 2.04     |
| total_timesteps    | 3874000  |
| value_loss         | 8.13e-05 |
---------------------------------
---------------------------------
| explained_variance | -379     |
| fps                | 848      |
| nupdates           | 774900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3874500  |
| value_loss         | 0.00475  |
---------------------------------
Eval num_timesteps=3875000, episode_reward=-5.00 +/- 0.00
Episode length: 586.80 +/- 106.24
---------------------------------
| explained_variance | -5.52    |
| fps                | 8

---------------------------------
| explained_variance | 0.45     |
| fps                | 848      |
| nupdates           | 777700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3888500  |
| value_loss         | 0.000105 |
---------------------------------
---------------------------------
| explained_variance | -198     |
| fps                | 848      |
| nupdates           | 777800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3889000  |
| value_loss         | 0.00912  |
---------------------------------
---------------------------------
| explained_variance | -0.234   |
| fps                | 848      |
| nupdates           | 777900   |
| policy_entropy     | 2.04     |
| total_timesteps    | 3889500  |
| value_loss         | 0.00031  |
---------------------------------
---------------------------------
| explained_variance | 0.981    |
| fps                | 848      |
| nupdates           | 778000   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -170     |
| fps                | 848      |
| nupdates           | 780700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3903500  |
| value_loss         | 0.0138   |
---------------------------------
---------------------------------
| explained_variance | 0.998    |
| fps                | 848      |
| nupdates           | 780800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3904000  |
| value_loss         | 4.29e-07 |
---------------------------------
---------------------------------
| explained_variance | 0.965    |
| fps                | 848      |
| nupdates           | 780900   |
| policy_entropy     | 2        |
| total_timesteps    | 3904500  |
| value_loss         | 2.75e-05 |
---------------------------------
---------------------------------
| explained_variance | -4.17    |
| fps                | 848      |
| nupdates           | 781000   |
| policy_entropy     | 2.01     |
| total_timest

---------------------------------
| explained_variance | 0.949    |
| fps                | 848      |
| nupdates           | 783800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3919000  |
| value_loss         | 4.7e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.291    |
| fps                | 848      |
| nupdates           | 783900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3919500  |
| value_loss         | 0.000149 |
---------------------------------
----------------------------------
| explained_variance | -2.09e+04 |
| fps                | 848       |
| nupdates           | 784000    |
| policy_entropy     | 2.06      |
| total_timesteps    | 3920000   |
| value_loss         | 0.183     |
----------------------------------
---------------------------------
| explained_variance | 0.0177   |
| fps                | 848      |
| nupdates           | 784100   |
| policy_entropy     | 2.05     |
| tota

---------------------------------
| explained_variance | 0.0217   |
| fps                | 848      |
| nupdates           | 786800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3934000  |
| value_loss         | 6.37e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.558   |
| fps                | 848      |
| nupdates           | 786900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3934500  |
| value_loss         | 0.000538 |
---------------------------------
---------------------------------
| explained_variance | 0.544    |
| fps                | 848      |
| nupdates           | 787000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3935000  |
| value_loss         | 0.000106 |
---------------------------------
---------------------------------
| explained_variance | 0.779    |
| fps                | 848      |
| nupdates           | 787100   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.376    |
| fps                | 848      |
| nupdates           | 789900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3949500  |
| value_loss         | 0.000194 |
---------------------------------
Eval num_timesteps=3950000, episode_reward=-4.80 +/- 0.40
Episode length: 543.00 +/- 81.62
---------------------------------
| explained_variance | 0.605    |
| fps                | 848      |
| nupdates           | 790000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3950000  |
| value_loss         | 0.000189 |
---------------------------------
---------------------------------
| explained_variance | 0.602    |
| fps                | 848      |
| nupdates           | 790100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3950500  |
| value_loss         | 0.000294 |
---------------------------------
---------------------------------
| explained_variance | 0.835    |
| fps                | 84

---------------------------------
| explained_variance | 0.956    |
| fps                | 848      |
| nupdates           | 792900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3964500  |
| value_loss         | 1.53e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.566    |
| fps                | 848      |
| nupdates           | 793000   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3965000  |
| value_loss         | 5.73e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.142    |
| fps                | 848      |
| nupdates           | 793100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3965500  |
| value_loss         | 0.000239 |
---------------------------------
---------------------------------
| explained_variance | 0.825    |
| fps                | 848      |
| nupdates           | 793200   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.456    |
| fps                | 848      |
| nupdates           | 795900   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3979500  |
| value_loss         | 7.08e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.581    |
| fps                | 848      |
| nupdates           | 796000   |
| policy_entropy     | 2        |
| total_timesteps    | 3980000  |
| value_loss         | 3.05e-05 |
---------------------------------
---------------------------------
| explained_variance | -50.1    |
| fps                | 848      |
| nupdates           | 796100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3980500  |
| value_loss         | 0.0122   |
---------------------------------
---------------------------------
| explained_variance | -760     |
| fps                | 848      |
| nupdates           | 796200   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.872    |
| fps                | 849      |
| nupdates           | 799000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3995000  |
| value_loss         | 2.27e-05 |
---------------------------------
---------------------------------
| explained_variance | -4.12    |
| fps                | 849      |
| nupdates           | 799100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3995500  |
| value_loss         | 0.000279 |
---------------------------------
---------------------------------
| explained_variance | -3.58    |
| fps                | 849      |
| nupdates           | 799200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3996000  |
| value_loss         | 0.000528 |
---------------------------------
---------------------------------
| explained_variance | 0.824    |
| fps                | 849      |
| nupdates           | 799300   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.872    |
| fps                | 849      |
| nupdates           | 802000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4010000  |
| value_loss         | 5.06e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.477    |
| fps                | 849      |
| nupdates           | 802100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4010500  |
| value_loss         | 0.00128  |
---------------------------------
---------------------------------
| explained_variance | 0.985    |
| fps                | 849      |
| nupdates           | 802200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4011000  |
| value_loss         | 2.92e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.688    |
| fps                | 849      |
| nupdates           | 802300   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -35.2    |
| fps                | 849      |
| nupdates           | 805100   |
| policy_entropy     | 2.03     |
| total_timesteps    | 4025500  |
| value_loss         | 0.0149   |
---------------------------------
---------------------------------
| explained_variance | 0.949    |
| fps                | 849      |
| nupdates           | 805200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4026000  |
| value_loss         | 3.96e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.0308   |
| fps                | 849      |
| nupdates           | 805300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4026500  |
| value_loss         | 0.000117 |
---------------------------------
---------------------------------
| explained_variance | 0.212    |
| fps                | 849      |
| nupdates           | 805400   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.919    |
| fps                | 849      |
| nupdates           | 808200   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4041000  |
| value_loss         | 3.97e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.516    |
| fps                | 849      |
| nupdates           | 808300   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4041500  |
| value_loss         | 0.000171 |
---------------------------------
---------------------------------
| explained_variance | 0.682    |
| fps                | 849      |
| nupdates           | 808400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4042000  |
| value_loss         | 7.49e-05 |
---------------------------------
---------------------------------
| explained_variance | -11.6    |
| fps                | 849      |
| nupdates           | 808500   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.47    |
| fps                | 849      |
| nupdates           | 811200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4056000  |
| value_loss         | 0.000375 |
---------------------------------
---------------------------------
| explained_variance | 0.807    |
| fps                | 849      |
| nupdates           | 811300   |
| policy_entropy     | 2.08     |
| total_timesteps    | 4056500  |
| value_loss         | 6.46e-06 |
---------------------------------
---------------------------------
| explained_variance | -46      |
| fps                | 849      |
| nupdates           | 811400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4057000  |
| value_loss         | 0.000666 |
---------------------------------
---------------------------------
| explained_variance | -2.31    |
| fps                | 849      |
| nupdates           | 811500   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.783    |
| fps                | 850      |
| nupdates           | 814300   |
| policy_entropy     | 2.03     |
| total_timesteps    | 4071500  |
| value_loss         | 1.87e-05 |
---------------------------------
---------------------------------
| explained_variance | -19.6    |
| fps                | 850      |
| nupdates           | 814400   |
| policy_entropy     | 2.03     |
| total_timesteps    | 4072000  |
| value_loss         | 0.000644 |
---------------------------------
---------------------------------
| explained_variance | 0.791    |
| fps                | 850      |
| nupdates           | 814500   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4072500  |
| value_loss         | 7.28e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.635    |
| fps                | 850      |
| nupdates           | 814600   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -0.95    |
| fps                | 850      |
| nupdates           | 817300   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4086500  |
| value_loss         | 0.00021  |
---------------------------------
---------------------------------
| explained_variance | -2.98    |
| fps                | 850      |
| nupdates           | 817400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4087000  |
| value_loss         | 0.000656 |
---------------------------------
---------------------------------
| explained_variance | 0.996    |
| fps                | 850      |
| nupdates           | 817500   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4087500  |
| value_loss         | 2.4e-06  |
---------------------------------
---------------------------------
| explained_variance | -1.88    |
| fps                | 850      |
| nupdates           | 817600   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.572    |
| fps                | 849      |
| nupdates           | 820300   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4101500  |
| value_loss         | 0.000224 |
---------------------------------
---------------------------------
| explained_variance | -300     |
| fps                | 849      |
| nupdates           | 820400   |
| policy_entropy     | 2.04     |
| total_timesteps    | 4102000  |
| value_loss         | 0.111    |
---------------------------------
---------------------------------
| explained_variance | 0.083    |
| fps                | 849      |
| nupdates           | 820500   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4102500  |
| value_loss         | 7.76e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.362   |
| fps                | 849      |
| nupdates           | 820600   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.687    |
| fps                | 850      |
| nupdates           | 823400   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4117000  |
| value_loss         | 9.21e-06 |
---------------------------------
---------------------------------
| explained_variance | -0.0254  |
| fps                | 850      |
| nupdates           | 823500   |
| policy_entropy     | 2.04     |
| total_timesteps    | 4117500  |
| value_loss         | 0.000513 |
---------------------------------
---------------------------------
| explained_variance | 0.619    |
| fps                | 850      |
| nupdates           | 823600   |
| policy_entropy     | 2.08     |
| total_timesteps    | 4118000  |
| value_loss         | 0.000202 |
---------------------------------
---------------------------------
| explained_variance | 0.487    |
| fps                | 850      |
| nupdates           | 823700   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.344    |
| fps                | 850      |
| nupdates           | 826400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4132000  |
| value_loss         | 8.02e-05 |
---------------------------------
---------------------------------
| explained_variance | -3.58    |
| fps                | 850      |
| nupdates           | 826500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4132500  |
| value_loss         | 0.00152  |
---------------------------------
---------------------------------
| explained_variance | -0.201   |
| fps                | 850      |
| nupdates           | 826600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4133000  |
| value_loss         | 0.000501 |
---------------------------------
---------------------------------
| explained_variance | -0.107   |
| fps                | 850      |
| nupdates           | 826700   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -1.95    |
| fps                | 850      |
| nupdates           | 829500   |
| policy_entropy     | 1.99     |
| total_timesteps    | 4147500  |
| value_loss         | 0.000269 |
---------------------------------
---------------------------------
| explained_variance | 0.929    |
| fps                | 850      |
| nupdates           | 829600   |
| policy_entropy     | 2.02     |
| total_timesteps    | 4148000  |
| value_loss         | 1.79e-05 |
---------------------------------
---------------------------------
| explained_variance | -101     |
| fps                | 850      |
| nupdates           | 829700   |
| policy_entropy     | 2.03     |
| total_timesteps    | 4148500  |
| value_loss         | 0.01     |
---------------------------------
---------------------------------
| explained_variance | 0.995    |
| fps                | 850      |
| nupdates           | 829800   |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | 0.927    |
| fps                | 850      |
| nupdates           | 832500   |
| policy_entropy     | 2.04     |
| total_timesteps    | 4162500  |
| value_loss         | 6.93e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.885    |
| fps                | 850      |
| nupdates           | 832600   |
| policy_entropy     | 2.03     |
| total_timesteps    | 4163000  |
| value_loss         | 1.61e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.623    |
| fps                | 850      |
| nupdates           | 832700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4163500  |
| value_loss         | 8.02e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.577    |
| fps                | 850      |
| nupdates           | 832800   |
| policy_entropy     | 2.01     |
| total_timest

---------------------------------
| explained_variance | 0.927    |
| fps                | 850      |
| nupdates           | 835500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4177500  |
| value_loss         | 1.28e-05 |
---------------------------------
---------------------------------
| explained_variance | -14.3    |
| fps                | 850      |
| nupdates           | 835600   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4178000  |
| value_loss         | 0.00153  |
---------------------------------
---------------------------------
| explained_variance | 0.437    |
| fps                | 850      |
| nupdates           | 835700   |
| policy_entropy     | 2.08     |
| total_timesteps    | 4178500  |
| value_loss         | 0.000142 |
---------------------------------
---------------------------------
| explained_variance | -0.675   |
| fps                | 850      |
| nupdates           | 835800   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.226    |
| fps                | 851      |
| nupdates           | 838600   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4193000  |
| value_loss         | 0.0289   |
---------------------------------
---------------------------------
| explained_variance | 0.953    |
| fps                | 851      |
| nupdates           | 838700   |
| policy_entropy     | 2.04     |
| total_timesteps    | 4193500  |
| value_loss         | 0.000144 |
---------------------------------
---------------------------------
| explained_variance | -0.0434  |
| fps                | 851      |
| nupdates           | 838800   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4194000  |
| value_loss         | 0.000405 |
---------------------------------
---------------------------------
| explained_variance | 0.975    |
| fps                | 851      |
| nupdates           | 838900   |
| policy_entropy     | 2.02     |
| total_timest

---------------------------------
| explained_variance | 0.688    |
| fps                | 850      |
| nupdates           | 841600   |
| policy_entropy     | 2        |
| total_timesteps    | 4208000  |
| value_loss         | 0.000325 |
---------------------------------
---------------------------------
| explained_variance | -1.31    |
| fps                | 851      |
| nupdates           | 841700   |
| policy_entropy     | 2.02     |
| total_timesteps    | 4208500  |
| value_loss         | 0.00151  |
---------------------------------
---------------------------------
| explained_variance | -0.0124  |
| fps                | 851      |
| nupdates           | 841800   |
| policy_entropy     | 2.04     |
| total_timesteps    | 4209000  |
| value_loss         | 0.188    |
---------------------------------
---------------------------------
| explained_variance | 0.69     |
| fps                | 851      |
| nupdates           | 841900   |
| policy_entropy     | 2.02     |
| total_timest

---------------------------------
| explained_variance | -8.43    |
| fps                | 851      |
| nupdates           | 844700   |
| policy_entropy     | 2.04     |
| total_timesteps    | 4223500  |
| value_loss         | 0.00628  |
---------------------------------
---------------------------------
| explained_variance | -2.1     |
| fps                | 851      |
| nupdates           | 844800   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4224000  |
| value_loss         | 0.000226 |
---------------------------------
---------------------------------
| explained_variance | 0.777    |
| fps                | 851      |
| nupdates           | 844900   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4224500  |
| value_loss         | 7.45e-05 |
---------------------------------
Eval num_timesteps=4225000, episode_reward=-4.90 +/- 0.30
Episode length: 776.20 +/- 186.83
---------------------------------
| explained_variance | 0.646    |
| fps                | 8

---------------------------------
| explained_variance | 0.987    |
| fps                | 851      |
| nupdates           | 847700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4238500  |
| value_loss         | 0.000127 |
---------------------------------
---------------------------------
| explained_variance | -735     |
| fps                | 851      |
| nupdates           | 847800   |
| policy_entropy     | 2.04     |
| total_timesteps    | 4239000  |
| value_loss         | 0.15     |
---------------------------------
---------------------------------
| explained_variance | 0.832    |
| fps                | 851      |
| nupdates           | 847900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4239500  |
| value_loss         | 7.09e-05 |
---------------------------------
---------------------------------
| explained_variance | -3.14    |
| fps                | 851      |
| nupdates           | 848000   |
| policy_entropy     | 2.02     |
| total_timest

---------------------------------
| explained_variance | -1.43    |
| fps                | 850      |
| nupdates           | 850700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4253500  |
| value_loss         | 2.7e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.557    |
| fps                | 850      |
| nupdates           | 850800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4254000  |
| value_loss         | 2.6e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.374    |
| fps                | 850      |
| nupdates           | 850900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4254500  |
| value_loss         | 6.2e-05  |
---------------------------------
---------------------------------
| explained_variance | -1.44    |
| fps                | 850      |
| nupdates           | 851000   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.951    |
| fps                | 851      |
| nupdates           | 853800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4269000  |
| value_loss         | 5.93e-07 |
---------------------------------
---------------------------------
| explained_variance | 0.963    |
| fps                | 851      |
| nupdates           | 853900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4269500  |
| value_loss         | 2.95e-06 |
---------------------------------
---------------------------------
| explained_variance | -7.91    |
| fps                | 851      |
| nupdates           | 854000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4270000  |
| value_loss         | 0.000352 |
---------------------------------
---------------------------------
| explained_variance | 0.735    |
| fps                | 851      |
| nupdates           | 854100   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.801    |
| fps                | 851      |
| nupdates           | 856800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4284000  |
| value_loss         | 6.53e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.728    |
| fps                | 851      |
| nupdates           | 856900   |
| policy_entropy     | 2.01     |
| total_timesteps    | 4284500  |
| value_loss         | 0.000153 |
---------------------------------
---------------------------------
| explained_variance | 0.643    |
| fps                | 851      |
| nupdates           | 857000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4285000  |
| value_loss         | 2.03e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.686   |
| fps                | 851      |
| nupdates           | 857100   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -1.69    |
| fps                | 851      |
| nupdates           | 859900   |
| policy_entropy     | 2.04     |
| total_timesteps    | 4299500  |
| value_loss         | 0.000268 |
---------------------------------
Eval num_timesteps=4300000, episode_reward=-4.70 +/- 0.46
Episode length: 680.40 +/- 188.59
---------------------------------
| explained_variance | 0.562    |
| fps                | 850      |
| nupdates           | 860000   |
| policy_entropy     | 2.03     |
| total_timesteps    | 4300000  |
| value_loss         | 0.000111 |
---------------------------------
---------------------------------
| explained_variance | 0.788    |
| fps                | 850      |
| nupdates           | 860100   |
| policy_entropy     | 2.03     |
| total_timesteps    | 4300500  |
| value_loss         | 0.000107 |
---------------------------------
---------------------------------
| explained_variance | 0.939    |
| fps                | 8

---------------------------------
| explained_variance | -2.01    |
| fps                | 851      |
| nupdates           | 862900   |
| policy_entropy     | 2.08     |
| total_timesteps    | 4314500  |
| value_loss         | 0.000568 |
---------------------------------
---------------------------------
| explained_variance | -0.163   |
| fps                | 851      |
| nupdates           | 863000   |
| policy_entropy     | 2.02     |
| total_timesteps    | 4315000  |
| value_loss         | 0.00026  |
---------------------------------
---------------------------------
| explained_variance | 0.877    |
| fps                | 851      |
| nupdates           | 863100   |
| policy_entropy     | 1.96     |
| total_timesteps    | 4315500  |
| value_loss         | 2.18e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.919    |
| fps                | 851      |
| nupdates           | 863200   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.709   |
| fps                | 850      |
| nupdates           | 865900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4329500  |
| value_loss         | 0.000451 |
---------------------------------
---------------------------------
| explained_variance | 0.981    |
| fps                | 850      |
| nupdates           | 866000   |
| policy_entropy     | 2.03     |
| total_timesteps    | 4330000  |
| value_loss         | 3.24e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.288    |
| fps                | 850      |
| nupdates           | 866100   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4330500  |
| value_loss         | 4.57e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.757    |
| fps                | 850      |
| nupdates           | 866200   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.12    |
| fps                | 850      |
| nupdates           | 869000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4345000  |
| value_loss         | 3.84e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.202   |
| fps                | 850      |
| nupdates           | 869100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4345500  |
| value_loss         | 0.000163 |
---------------------------------
---------------------------------
| explained_variance | 0.287    |
| fps                | 851      |
| nupdates           | 869200   |
| policy_entropy     | 2.08     |
| total_timesteps    | 4346000  |
| value_loss         | 0.000214 |
---------------------------------
---------------------------------
| explained_variance | 0.576    |
| fps                | 851      |
| nupdates           | 869300   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -1.31    |
| fps                | 850      |
| nupdates           | 872000   |
| policy_entropy     | 2.03     |
| total_timesteps    | 4360000  |
| value_loss         | 0.000549 |
---------------------------------
---------------------------------
| explained_variance | 0.584    |
| fps                | 850      |
| nupdates           | 872100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4360500  |
| value_loss         | 0.000222 |
---------------------------------
---------------------------------
| explained_variance | 0.492    |
| fps                | 850      |
| nupdates           | 872200   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4361000  |
| value_loss         | 0.000346 |
---------------------------------
---------------------------------
| explained_variance | -28.6    |
| fps                | 849      |
| nupdates           | 872300   |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | 0.941    |
| fps                | 849      |
| nupdates           | 875100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4375500  |
| value_loss         | 1.37e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.41    |
| fps                | 849      |
| nupdates           | 875200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4376000  |
| value_loss         | 0.000526 |
---------------------------------
---------------------------------
| explained_variance | -1.54    |
| fps                | 849      |
| nupdates           | 875300   |
| policy_entropy     | 2.08     |
| total_timesteps    | 4376500  |
| value_loss         | 3.13e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.657    |
| fps                | 849      |
| nupdates           | 875400   |
| policy_entropy     | 1.96     |
| total_timest

---------------------------------
| explained_variance | -0.569   |
| fps                | 849      |
| nupdates           | 878200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4391000  |
| value_loss         | 0.000515 |
---------------------------------
---------------------------------
| explained_variance | 0.836    |
| fps                | 849      |
| nupdates           | 878300   |
| policy_entropy     | 2.03     |
| total_timesteps    | 4391500  |
| value_loss         | 4.6e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.827    |
| fps                | 849      |
| nupdates           | 878400   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4392000  |
| value_loss         | 0.00024  |
---------------------------------
---------------------------------
| explained_variance | -7.37    |
| fps                | 849      |
| nupdates           | 878500   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.0212  |
| fps                | 848      |
| nupdates           | 881200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4406000  |
| value_loss         | 0.259    |
---------------------------------
---------------------------------
| explained_variance | 0.435    |
| fps                | 848      |
| nupdates           | 881300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4406500  |
| value_loss         | 0.133    |
---------------------------------
---------------------------------
| explained_variance | 0.29     |
| fps                | 848      |
| nupdates           | 881400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4407000  |
| value_loss         | 0.000157 |
---------------------------------
---------------------------------
| explained_variance | -1.26    |
| fps                | 848      |
| nupdates           | 881500   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -3.97    |
| fps                | 849      |
| nupdates           | 884300   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4421500  |
| value_loss         | 7.07e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.973    |
| fps                | 849      |
| nupdates           | 884400   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4422000  |
| value_loss         | 1.13e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.864    |
| fps                | 849      |
| nupdates           | 884500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4422500  |
| value_loss         | 9.46e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.294    |
| fps                | 849      |
| nupdates           | 884600   |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | 0.959    |
| fps                | 848      |
| nupdates           | 887300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4436500  |
| value_loss         | 3.33e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.518    |
| fps                | 848      |
| nupdates           | 887400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4437000  |
| value_loss         | 0.000173 |
---------------------------------
---------------------------------
| explained_variance | -16.7    |
| fps                | 848      |
| nupdates           | 887500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4437500  |
| value_loss         | 0.000175 |
---------------------------------
---------------------------------
| explained_variance | -384     |
| fps                | 848      |
| nupdates           | 887600   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.141    |
| fps                | 848      |
| nupdates           | 890300   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4451500  |
| value_loss         | 7.18e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.0866   |
| fps                | 848      |
| nupdates           | 890400   |
| policy_entropy     | 2.08     |
| total_timesteps    | 4452000  |
| value_loss         | 0.00202  |
---------------------------------
---------------------------------
| explained_variance | -0.562   |
| fps                | 848      |
| nupdates           | 890500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4452500  |
| value_loss         | 0.000316 |
---------------------------------
---------------------------------
| explained_variance | -0.927   |
| fps                | 848      |
| nupdates           | 890600   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -2.09    |
| fps                | 848      |
| nupdates           | 893400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4467000  |
| value_loss         | 5.12e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.441    |
| fps                | 848      |
| nupdates           | 893500   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4467500  |
| value_loss         | 0.000193 |
---------------------------------
---------------------------------
| explained_variance | 0.673    |
| fps                | 848      |
| nupdates           | 893600   |
| policy_entropy     | 2.03     |
| total_timesteps    | 4468000  |
| value_loss         | 0.00023  |
---------------------------------
---------------------------------
| explained_variance | -0.0173  |
| fps                | 848      |
| nupdates           | 893700   |
| policy_entropy     | 2.02     |
| total_timest

---------------------------------
| explained_variance | 0.827    |
| fps                | 847      |
| nupdates           | 896400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4482000  |
| value_loss         | 7.86e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.869    |
| fps                | 847      |
| nupdates           | 896500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4482500  |
| value_loss         | 0.000133 |
---------------------------------
---------------------------------
| explained_variance | -0.65    |
| fps                | 847      |
| nupdates           | 896600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4483000  |
| value_loss         | 0.000813 |
---------------------------------
---------------------------------
| explained_variance | 0.729    |
| fps                | 847      |
| nupdates           | 896700   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.221    |
| fps                | 848      |
| nupdates           | 899500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4497500  |
| value_loss         | 0.000215 |
---------------------------------
---------------------------------
| explained_variance | -1.57    |
| fps                | 848      |
| nupdates           | 899600   |
| policy_entropy     | 2.08     |
| total_timesteps    | 4498000  |
| value_loss         | 0.000853 |
---------------------------------
---------------------------------
| explained_variance | 0.307    |
| fps                | 848      |
| nupdates           | 899700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4498500  |
| value_loss         | 9.5e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.627    |
| fps                | 848      |
| nupdates           | 899800   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.964    |
| fps                | 847      |
| nupdates           | 902500   |
| policy_entropy     | 1.99     |
| total_timesteps    | 4512500  |
| value_loss         | 2.37e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.707    |
| fps                | 847      |
| nupdates           | 902600   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4513000  |
| value_loss         | 0.000167 |
---------------------------------
---------------------------------
| explained_variance | 0.956    |
| fps                | 847      |
| nupdates           | 902700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4513500  |
| value_loss         | 3.43e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.663    |
| fps                | 847      |
| nupdates           | 902800   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -19.4    |
| fps                | 847      |
| nupdates           | 905500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4527500  |
| value_loss         | 0.000756 |
---------------------------------
---------------------------------
| explained_variance | -0.505   |
| fps                | 847      |
| nupdates           | 905600   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4528000  |
| value_loss         | 5.22e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.989    |
| fps                | 847      |
| nupdates           | 905700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4528500  |
| value_loss         | 1.54e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.918    |
| fps                | 847      |
| nupdates           | 905800   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.634    |
| fps                | 847      |
| nupdates           | 908600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4543000  |
| value_loss         | 4.93e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.282   |
| fps                | 847      |
| nupdates           | 908700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4543500  |
| value_loss         | 0.000356 |
---------------------------------
---------------------------------
| explained_variance | 0.842    |
| fps                | 847      |
| nupdates           | 908800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4544000  |
| value_loss         | 1.9e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.901    |
| fps                | 847      |
| nupdates           | 908900   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.963    |
| fps                | 847      |
| nupdates           | 911600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4558000  |
| value_loss         | 4.99e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.594    |
| fps                | 847      |
| nupdates           | 911700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4558500  |
| value_loss         | 6.75e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.0115  |
| fps                | 847      |
| nupdates           | 911800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4559000  |
| value_loss         | 0.000322 |
---------------------------------
---------------------------------
| explained_variance | 0.888    |
| fps                | 847      |
| nupdates           | 911900   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.771    |
| fps                | 847      |
| nupdates           | 914700   |
| policy_entropy     | 2        |
| total_timesteps    | 4573500  |
| value_loss         | 7.63e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.94     |
| fps                | 847      |
| nupdates           | 914800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4574000  |
| value_loss         | 3.01e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.904    |
| fps                | 847      |
| nupdates           | 914900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4574500  |
| value_loss         | 1.09e-05 |
---------------------------------
Eval num_timesteps=4575000, episode_reward=-5.00 +/- 0.00
Episode length: 549.70 +/- 35.70
---------------------------------
| explained_variance | 0.512    |
| fps                | 84

---------------------------------
| explained_variance | 0.628    |
| fps                | 846      |
| nupdates           | 917700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4588500  |
| value_loss         | 3.36e-05 |
---------------------------------
---------------------------------
| explained_variance | -6.53    |
| fps                | 847      |
| nupdates           | 917800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4589000  |
| value_loss         | 0.0015   |
---------------------------------
---------------------------------
| explained_variance | 0.872    |
| fps                | 847      |
| nupdates           | 917900   |
| policy_entropy     | 1.92     |
| total_timesteps    | 4589500  |
| value_loss         | 0.000994 |
---------------------------------
---------------------------------
| explained_variance | -0.00635 |
| fps                | 847      |
| nupdates           | 918000   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.679    |
| fps                | 846      |
| nupdates           | 920700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4603500  |
| value_loss         | 1.81e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.997    |
| fps                | 846      |
| nupdates           | 920800   |
| policy_entropy     | 2.08     |
| total_timesteps    | 4604000  |
| value_loss         | 4.88e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.989    |
| fps                | 846      |
| nupdates           | 920900   |
| policy_entropy     | 2.04     |
| total_timesteps    | 4604500  |
| value_loss         | 0.000958 |
---------------------------------
---------------------------------
| explained_variance | 0.887    |
| fps                | 846      |
| nupdates           | 921000   |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | 0.919    |
| fps                | 847      |
| nupdates           | 923800   |
| policy_entropy     | 2.03     |
| total_timesteps    | 4619000  |
| value_loss         | 6.89e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.961    |
| fps                | 847      |
| nupdates           | 923900   |
| policy_entropy     | 2.03     |
| total_timesteps    | 4619500  |
| value_loss         | 2.82e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.954    |
| fps                | 847      |
| nupdates           | 924000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4620000  |
| value_loss         | 0.000109 |
---------------------------------
---------------------------------
| explained_variance | 0.823    |
| fps                | 847      |
| nupdates           | 924100   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.638    |
| fps                | 846      |
| nupdates           | 926800   |
| policy_entropy     | 2.03     |
| total_timesteps    | 4634000  |
| value_loss         | 0.000301 |
---------------------------------
---------------------------------
| explained_variance | 0.876    |
| fps                | 846      |
| nupdates           | 926900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4634500  |
| value_loss         | 9.04e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.991    |
| fps                | 846      |
| nupdates           | 927000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4635000  |
| value_loss         | 2.23e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.669    |
| fps                | 846      |
| nupdates           | 927100   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.961    |
| fps                | 847      |
| nupdates           | 929900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4649500  |
| value_loss         | 2.34e-05 |
---------------------------------
Eval num_timesteps=4650000, episode_reward=-4.70 +/- 0.46
Episode length: 821.30 +/- 190.11
---------------------------------
| explained_variance | 0.955    |
| fps                | 846      |
| nupdates           | 930000   |
| policy_entropy     | 2.08     |
| total_timesteps    | 4650000  |
| value_loss         | 1.98e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.919    |
| fps                | 846      |
| nupdates           | 930100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4650500  |
| value_loss         | 2.65e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.18    |
| fps                | 8

---------------------------------
| explained_variance | 0.701    |
| fps                | 846      |
| nupdates           | 932900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4664500  |
| value_loss         | 2.18e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.974    |
| fps                | 846      |
| nupdates           | 933000   |
| policy_entropy     | 2.03     |
| total_timesteps    | 4665000  |
| value_loss         | 4.54e-06 |
---------------------------------
---------------------------------
| explained_variance | -2.19    |
| fps                | 846      |
| nupdates           | 933100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4665500  |
| value_loss         | 0.00193  |
---------------------------------
---------------------------------
| explained_variance | 0.932    |
| fps                | 846      |
| nupdates           | 933200   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.916    |
| fps                | 846      |
| nupdates           | 935900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4679500  |
| value_loss         | 0.000379 |
---------------------------------
---------------------------------
| explained_variance | 0.989    |
| fps                | 846      |
| nupdates           | 936000   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4680000  |
| value_loss         | 0.00127  |
---------------------------------
---------------------------------
| explained_variance | 0.00615  |
| fps                | 846      |
| nupdates           | 936100   |
| policy_entropy     | 2.08     |
| total_timesteps    | 4680500  |
| value_loss         | 7.05e-05 |
---------------------------------
---------------------------------
| explained_variance | -18.3    |
| fps                | 846      |
| nupdates           | 936200   |
| policy_entropy     | 2.01     |
| total_timest

---------------------------------
| explained_variance | 0.757    |
| fps                | 846      |
| nupdates           | 939000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4695000  |
| value_loss         | 4.63e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.991    |
| fps                | 846      |
| nupdates           | 939100   |
| policy_entropy     | 2        |
| total_timesteps    | 4695500  |
| value_loss         | 5.86e-06 |
---------------------------------
---------------------------------
| explained_variance | -13.8    |
| fps                | 846      |
| nupdates           | 939200   |
| policy_entropy     | 2.04     |
| total_timesteps    | 4696000  |
| value_loss         | 0.00122  |
---------------------------------
----------------------------------
| explained_variance | -3.67e+04 |
| fps                | 846       |
| nupdates           | 939300    |
| policy_entropy     | 2.06      |
| total_t

---------------------------------
| explained_variance | -0.614   |
| fps                | 846      |
| nupdates           | 942000   |
| policy_entropy     | 2.08     |
| total_timesteps    | 4710000  |
| value_loss         | 6.42e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.986    |
| fps                | 846      |
| nupdates           | 942100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4710500  |
| value_loss         | 2.23e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.18    |
| fps                | 846      |
| nupdates           | 942200   |
| policy_entropy     | 2.08     |
| total_timesteps    | 4711000  |
| value_loss         | 0.000362 |
---------------------------------
---------------------------------
| explained_variance | -0.267   |
| fps                | 846      |
| nupdates           | 942300   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -30.8    |
| fps                | 846      |
| nupdates           | 945100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4725500  |
| value_loss         | 0.000424 |
---------------------------------
---------------------------------
| explained_variance | 0.935    |
| fps                | 846      |
| nupdates           | 945200   |
| policy_entropy     | 2.04     |
| total_timesteps    | 4726000  |
| value_loss         | 3.13e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.666    |
| fps                | 846      |
| nupdates           | 945300   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4726500  |
| value_loss         | 1.17e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.679    |
| fps                | 846      |
| nupdates           | 945400   |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | 0.903    |
| fps                | 847      |
| nupdates           | 948200   |
| policy_entropy     | 2.08     |
| total_timesteps    | 4741000  |
| value_loss         | 3.49e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.998    |
| fps                | 847      |
| nupdates           | 948300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4741500  |
| value_loss         | 1.46e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.11    |
| fps                | 847      |
| nupdates           | 948400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4742000  |
| value_loss         | 0.000406 |
---------------------------------
---------------------------------
| explained_variance | -6.85    |
| fps                | 847      |
| nupdates           | 948500   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.914    |
| fps                | 847      |
| nupdates           | 951200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4756000  |
| value_loss         | 0.000112 |
---------------------------------
---------------------------------
| explained_variance | -0.319   |
| fps                | 847      |
| nupdates           | 951300   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4756500  |
| value_loss         | 0.00102  |
---------------------------------
---------------------------------
| explained_variance | 0.847    |
| fps                | 847      |
| nupdates           | 951400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4757000  |
| value_loss         | 0.000111 |
---------------------------------
---------------------------------
| explained_variance | 0.675    |
| fps                | 847      |
| nupdates           | 951500   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.211    |
| fps                | 847      |
| nupdates           | 954300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4771500  |
| value_loss         | 0.00039  |
---------------------------------
---------------------------------
| explained_variance | -3.76    |
| fps                | 847      |
| nupdates           | 954400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4772000  |
| value_loss         | 0.00207  |
---------------------------------
---------------------------------
| explained_variance | -6.83    |
| fps                | 847      |
| nupdates           | 954500   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4772500  |
| value_loss         | 0.0012   |
---------------------------------
---------------------------------
| explained_variance | 0.753    |
| fps                | 847      |
| nupdates           | 954600   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -8.01    |
| fps                | 847      |
| nupdates           | 957300   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4786500  |
| value_loss         | 0.000299 |
---------------------------------
---------------------------------
| explained_variance | -2.44    |
| fps                | 847      |
| nupdates           | 957400   |
| policy_entropy     | 2.04     |
| total_timesteps    | 4787000  |
| value_loss         | 0.000914 |
---------------------------------
---------------------------------
| explained_variance | 0.952    |
| fps                | 847      |
| nupdates           | 957500   |
| policy_entropy     | 2.04     |
| total_timesteps    | 4787500  |
| value_loss         | 0.000129 |
---------------------------------
---------------------------------
| explained_variance | 0.964    |
| fps                | 847      |
| nupdates           | 957600   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -73.2    |
| fps                | 847      |
| nupdates           | 960300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4801500  |
| value_loss         | 0.00825  |
---------------------------------
---------------------------------
| explained_variance | 0.666    |
| fps                | 847      |
| nupdates           | 960400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4802000  |
| value_loss         | 0.000298 |
---------------------------------
---------------------------------
| explained_variance | 0.947    |
| fps                | 847      |
| nupdates           | 960500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4802500  |
| value_loss         | 3.65e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.235    |
| fps                | 847      |
| nupdates           | 960600   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.529   |
| fps                | 847      |
| nupdates           | 963400   |
| policy_entropy     | 2.04     |
| total_timesteps    | 4817000  |
| value_loss         | 5.04e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.625    |
| fps                | 847      |
| nupdates           | 963500   |
| policy_entropy     | 2        |
| total_timesteps    | 4817500  |
| value_loss         | 3.22e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.997    |
| fps                | 847      |
| nupdates           | 963600   |
| policy_entropy     | 2.04     |
| total_timesteps    | 4818000  |
| value_loss         | 2.37e-07 |
---------------------------------
---------------------------------
| explained_variance | -23.4    |
| fps                | 847      |
| nupdates           | 963700   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.988    |
| fps                | 847      |
| nupdates           | 966400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4832000  |
| value_loss         | 3.28e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.714    |
| fps                | 847      |
| nupdates           | 966500   |
| policy_entropy     | 2.04     |
| total_timesteps    | 4832500  |
| value_loss         | 2.54e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.71    |
| fps                | 847      |
| nupdates           | 966600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4833000  |
| value_loss         | 0.00285  |
---------------------------------
---------------------------------
| explained_variance | -2.54    |
| fps                | 847      |
| nupdates           | 966700   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.998    |
| fps                | 847      |
| nupdates           | 969500   |
| policy_entropy     | 1.97     |
| total_timesteps    | 4847500  |
| value_loss         | 0.00499  |
---------------------------------
---------------------------------
| explained_variance | -8.5     |
| fps                | 847      |
| nupdates           | 969600   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4848000  |
| value_loss         | 0.000686 |
---------------------------------
---------------------------------
| explained_variance | 0.884    |
| fps                | 847      |
| nupdates           | 969700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4848500  |
| value_loss         | 1.31e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.983    |
| fps                | 847      |
| nupdates           | 969800   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.655    |
| fps                | 847      |
| nupdates           | 972500   |
| policy_entropy     | 2.08     |
| total_timesteps    | 4862500  |
| value_loss         | 3.48e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.21    |
| fps                | 847      |
| nupdates           | 972600   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4863000  |
| value_loss         | 0.000394 |
---------------------------------
---------------------------------
| explained_variance | 0.35     |
| fps                | 847      |
| nupdates           | 972700   |
| policy_entropy     | 2.03     |
| total_timesteps    | 4863500  |
| value_loss         | 0.000121 |
---------------------------------
---------------------------------
| explained_variance | 0.967    |
| fps                | 847      |
| nupdates           | 972800   |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | 0.974    |
| fps                | 847      |
| nupdates           | 975500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4877500  |
| value_loss         | 5.95e-06 |
---------------------------------
---------------------------------
| explained_variance | -0.626   |
| fps                | 847      |
| nupdates           | 975600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4878000  |
| value_loss         | 0.000518 |
---------------------------------
---------------------------------
| explained_variance | 0.908    |
| fps                | 847      |
| nupdates           | 975700   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4878500  |
| value_loss         | 3.2e-05  |
---------------------------------
---------------------------------
| explained_variance | -1.76    |
| fps                | 847      |
| nupdates           | 975800   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.725    |
| fps                | 847      |
| nupdates           | 978600   |
| policy_entropy     | 2.04     |
| total_timesteps    | 4893000  |
| value_loss         | 8.28e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.966    |
| fps                | 847      |
| nupdates           | 978700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4893500  |
| value_loss         | 4.61e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.686    |
| fps                | 847      |
| nupdates           | 978800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4894000  |
| value_loss         | 0.000582 |
---------------------------------
---------------------------------
| explained_variance | 0.797    |
| fps                | 847      |
| nupdates           | 978900   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.987    |
| fps                | 847      |
| nupdates           | 981600   |
| policy_entropy     | 2.03     |
| total_timesteps    | 4908000  |
| value_loss         | 1.95e-05 |
---------------------------------
---------------------------------
| explained_variance | -7.67    |
| fps                | 847      |
| nupdates           | 981700   |
| policy_entropy     | 2.04     |
| total_timesteps    | 4908500  |
| value_loss         | 0.000872 |
---------------------------------
---------------------------------
| explained_variance | 0.348    |
| fps                | 847      |
| nupdates           | 981800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4909000  |
| value_loss         | 0.103    |
---------------------------------
---------------------------------
| explained_variance | 0.979    |
| fps                | 847      |
| nupdates           | 981900   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.0733   |
| fps                | 847      |
| nupdates           | 984700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4923500  |
| value_loss         | 0.000491 |
---------------------------------
---------------------------------
| explained_variance | -0.304   |
| fps                | 847      |
| nupdates           | 984800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4924000  |
| value_loss         | 4.91e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.53    |
| fps                | 847      |
| nupdates           | 984900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4924500  |
| value_loss         | 0.000246 |
---------------------------------
Eval num_timesteps=4925000, episode_reward=-4.90 +/- 0.30
Episode length: 601.60 +/- 71.74
---------------------------------
| explained_variance | -32.2    |
| fps                | 84

---------------------------------
| explained_variance | -0.036   |
| fps                | 847      |
| nupdates           | 987700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4938500  |
| value_loss         | 0.000563 |
---------------------------------
---------------------------------
| explained_variance | 0.835    |
| fps                | 847      |
| nupdates           | 987800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4939000  |
| value_loss         | 1.76e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.876    |
| fps                | 847      |
| nupdates           | 987900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4939500  |
| value_loss         | 1.8e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.0124   |
| fps                | 847      |
| nupdates           | 988000   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.216   |
| fps                | 847      |
| nupdates           | 990700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4953500  |
| value_loss         | 1.24e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.894    |
| fps                | 847      |
| nupdates           | 990800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4954000  |
| value_loss         | 7.44e-06 |
---------------------------------
---------------------------------
| explained_variance | -14.3    |
| fps                | 847      |
| nupdates           | 990900   |
| policy_entropy     | 2.08     |
| total_timesteps    | 4954500  |
| value_loss         | 0.00158  |
---------------------------------
---------------------------------
| explained_variance | 0.729    |
| fps                | 847      |
| nupdates           | 991000   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.982    |
| fps                | 847      |
| nupdates           | 993800   |
| policy_entropy     | 2.08     |
| total_timesteps    | 4969000  |
| value_loss         | 3.85e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.123   |
| fps                | 847      |
| nupdates           | 993900   |
| policy_entropy     | 2.08     |
| total_timesteps    | 4969500  |
| value_loss         | 0.000437 |
---------------------------------
----------------------------------
| explained_variance | -3.71e+03 |
| fps                | 847       |
| nupdates           | 994000    |
| policy_entropy     | 2.05      |
| total_timesteps    | 4970000   |
| value_loss         | 0.0662    |
----------------------------------
---------------------------------
| explained_variance | -7.42    |
| fps                | 847      |
| nupdates           | 994100   |
| policy_entropy     | 2        |
| tota

---------------------------------
| explained_variance | 0.727    |
| fps                | 846      |
| nupdates           | 996800   |
| policy_entropy     | 2.08     |
| total_timesteps    | 4984000  |
| value_loss         | 1.55e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.807    |
| fps                | 846      |
| nupdates           | 996900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4984500  |
| value_loss         | 3.28e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.851    |
| fps                | 846      |
| nupdates           | 997000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4985000  |
| value_loss         | 2.25e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.451   |
| fps                | 846      |
| nupdates           | 997100   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.933    |
| fps                | 846      |
| nupdates           | 999900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4999500  |
| value_loss         | 1.39e-05 |
---------------------------------
Eval num_timesteps=5000000, episode_reward=-4.90 +/- 0.30
Episode length: 575.40 +/- 68.76
---------------------------------
| explained_variance | 0.975    |
| fps                | 846      |
| nupdates           | 1000000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5000000  |
| value_loss         | 3.03e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.92    |
| fps                | 846      |
| nupdates           | 1000100  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5000500  |
| value_loss         | 9.54e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.962    |
| fps                | 84

---------------------------------
| explained_variance | 0.903    |
| fps                | 846      |
| nupdates           | 1002900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5014500  |
| value_loss         | 0.000116 |
---------------------------------
---------------------------------
| explained_variance | 0.72     |
| fps                | 846      |
| nupdates           | 1003000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5015000  |
| value_loss         | 5.35e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.691    |
| fps                | 846      |
| nupdates           | 1003100  |
| policy_entropy     | 2.04     |
| total_timesteps    | 5015500  |
| value_loss         | 4.09e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.999    |
| fps                | 846      |
| nupdates           | 1003200  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -2.47    |
| fps                | 846      |
| nupdates           | 1005900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5029500  |
| value_loss         | 0.00223  |
---------------------------------
---------------------------------
| explained_variance | 0.837    |
| fps                | 846      |
| nupdates           | 1006000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5030000  |
| value_loss         | 0.000133 |
---------------------------------
----------------------------------
| explained_variance | -7.53e+03 |
| fps                | 846       |
| nupdates           | 1006100   |
| policy_entropy     | 2.06      |
| total_timesteps    | 5030500   |
| value_loss         | 0.16      |
----------------------------------
---------------------------------
| explained_variance | -2.99    |
| fps                | 846      |
| nupdates           | 1006200  |
| policy_entropy     | 2.06     |
| tota

---------------------------------
| explained_variance | 0.888    |
| fps                | 847      |
| nupdates           | 1009000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5045000  |
| value_loss         | 0.000249 |
---------------------------------
---------------------------------
| explained_variance | 0.92     |
| fps                | 847      |
| nupdates           | 1009100  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5045500  |
| value_loss         | 5.47e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.367    |
| fps                | 847      |
| nupdates           | 1009200  |
| policy_entropy     | 2.01     |
| total_timesteps    | 5046000  |
| value_loss         | 0.149    |
---------------------------------
---------------------------------
| explained_variance | 0.752    |
| fps                | 847      |
| nupdates           | 1009300  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.579    |
| fps                | 846      |
| nupdates           | 1012000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5060000  |
| value_loss         | 9.63e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.981    |
| fps                | 846      |
| nupdates           | 1012100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5060500  |
| value_loss         | 8.02e-06 |
---------------------------------
---------------------------------
| explained_variance | -3.15    |
| fps                | 846      |
| nupdates           | 1012200  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5061000  |
| value_loss         | 0.000362 |
---------------------------------
---------------------------------
| explained_variance | -1.29    |
| fps                | 846      |
| nupdates           | 1012300  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.676    |
| fps                | 846      |
| nupdates           | 1015100  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5075500  |
| value_loss         | 0.000185 |
---------------------------------
---------------------------------
| explained_variance | 0.809    |
| fps                | 846      |
| nupdates           | 1015200  |
| policy_entropy     | 2.02     |
| total_timesteps    | 5076000  |
| value_loss         | 6.49e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.941    |
| fps                | 846      |
| nupdates           | 1015300  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5076500  |
| value_loss         | 8.06e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.793    |
| fps                | 846      |
| nupdates           | 1015400  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.0458   |
| fps                | 847      |
| nupdates           | 1018200  |
| policy_entropy     | 1.96     |
| total_timesteps    | 5091000  |
| value_loss         | 1.6      |
---------------------------------
---------------------------------
| explained_variance | 0.505    |
| fps                | 847      |
| nupdates           | 1018300  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5091500  |
| value_loss         | 8.95e-05 |
---------------------------------
---------------------------------
| explained_variance | -3.57    |
| fps                | 847      |
| nupdates           | 1018400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5092000  |
| value_loss         | 0.000438 |
---------------------------------
---------------------------------
| explained_variance | 0.571    |
| fps                | 847      |
| nupdates           | 1018500  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.18    |
| fps                | 846      |
| nupdates           | 1021200  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5106000  |
| value_loss         | 9.1e-05  |
---------------------------------
---------------------------------
| explained_variance | -0.723   |
| fps                | 846      |
| nupdates           | 1021300  |
| policy_entropy     | 2.02     |
| total_timesteps    | 5106500  |
| value_loss         | 0.000565 |
---------------------------------
---------------------------------
| explained_variance | 0.566    |
| fps                | 846      |
| nupdates           | 1021400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5107000  |
| value_loss         | 2.97e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.332    |
| fps                | 846      |
| nupdates           | 1021500  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.863    |
| fps                | 847      |
| nupdates           | 1024300  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5121500  |
| value_loss         | 0.000103 |
---------------------------------
---------------------------------
| explained_variance | 0.943    |
| fps                | 847      |
| nupdates           | 1024400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5122000  |
| value_loss         | 8.93e-06 |
---------------------------------
---------------------------------
| explained_variance | -0.023   |
| fps                | 847      |
| nupdates           | 1024500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5122500  |
| value_loss         | 0.000175 |
---------------------------------
---------------------------------
| explained_variance | -1.83    |
| fps                | 847      |
| nupdates           | 1024600  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -3.2     |
| fps                | 846      |
| nupdates           | 1027300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5136500  |
| value_loss         | 0.00134  |
---------------------------------
---------------------------------
| explained_variance | 0.954    |
| fps                | 846      |
| nupdates           | 1027400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5137000  |
| value_loss         | 1.93e-05 |
---------------------------------
---------------------------------
| explained_variance | -41.3    |
| fps                | 846      |
| nupdates           | 1027500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5137500  |
| value_loss         | 0.00419  |
---------------------------------
---------------------------------
| explained_variance | 0.94     |
| fps                | 846      |
| nupdates           | 1027600  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.625    |
| fps                | 846      |
| nupdates           | 1030300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5151500  |
| value_loss         | 1.73e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.931    |
| fps                | 846      |
| nupdates           | 1030400  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5152000  |
| value_loss         | 0.00416  |
---------------------------------
---------------------------------
| explained_variance | -0.737   |
| fps                | 846      |
| nupdates           | 1030500  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5152500  |
| value_loss         | 6.61e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.894    |
| fps                | 846      |
| nupdates           | 1030600  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.873    |
| fps                | 846      |
| nupdates           | 1033400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5167000  |
| value_loss         | 7.23e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.22     |
| fps                | 846      |
| nupdates           | 1033500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5167500  |
| value_loss         | 0.000251 |
---------------------------------
---------------------------------
| explained_variance | -0.337   |
| fps                | 846      |
| nupdates           | 1033600  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5168000  |
| value_loss         | 0.000916 |
---------------------------------
---------------------------------
| explained_variance | 0.592    |
| fps                | 846      |
| nupdates           | 1033700  |
| policy_entropy     | 2        |
| total_timest

---------------------------------
| explained_variance | -0.47    |
| fps                | 846      |
| nupdates           | 1036400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5182000  |
| value_loss         | 4.72e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.323    |
| fps                | 846      |
| nupdates           | 1036500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5182500  |
| value_loss         | 0.198    |
---------------------------------
---------------------------------
| explained_variance | 0.185    |
| fps                | 846      |
| nupdates           | 1036600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5183000  |
| value_loss         | 0.000281 |
---------------------------------
---------------------------------
| explained_variance | 0.902    |
| fps                | 846      |
| nupdates           | 1036700  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -2.4     |
| fps                | 845      |
| nupdates           | 1039500  |
| policy_entropy     | 2.04     |
| total_timesteps    | 5197500  |
| value_loss         | 0.000915 |
---------------------------------
---------------------------------
| explained_variance | -8.83    |
| fps                | 845      |
| nupdates           | 1039600  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5198000  |
| value_loss         | 0.000784 |
---------------------------------
---------------------------------
| explained_variance | -0.462   |
| fps                | 845      |
| nupdates           | 1039700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5198500  |
| value_loss         | 6.71e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.986    |
| fps                | 845      |
| nupdates           | 1039800  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.358    |
| fps                | 845      |
| nupdates           | 1042500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5212500  |
| value_loss         | 0.000893 |
---------------------------------
---------------------------------
| explained_variance | 0.941    |
| fps                | 845      |
| nupdates           | 1042600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5213000  |
| value_loss         | 5.62e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.954    |
| fps                | 845      |
| nupdates           | 1042700  |
| policy_entropy     | 2.03     |
| total_timesteps    | 5213500  |
| value_loss         | 4.09e-06 |
---------------------------------
---------------------------------
| explained_variance | -0.221   |
| fps                | 845      |
| nupdates           | 1042800  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.771    |
| fps                | 845      |
| nupdates           | 1045500  |
| policy_entropy     | 2.03     |
| total_timesteps    | 5227500  |
| value_loss         | 0.000119 |
---------------------------------
---------------------------------
| explained_variance | 0.981    |
| fps                | 845      |
| nupdates           | 1045600  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5228000  |
| value_loss         | 1.9e-06  |
---------------------------------
----------------------------------
| explained_variance | -1.02e+03 |
| fps                | 845       |
| nupdates           | 1045700   |
| policy_entropy     | 2.06      |
| total_timesteps    | 5228500   |
| value_loss         | 0.0646    |
----------------------------------
---------------------------------
| explained_variance | 0.664    |
| fps                | 845      |
| nupdates           | 1045800  |
| policy_entropy     | 2.05     |
| tota

---------------------------------
| explained_variance | 0.974    |
| fps                | 845      |
| nupdates           | 1048600  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5243000  |
| value_loss         | 4.03e-06 |
---------------------------------
---------------------------------
| explained_variance | -3.85    |
| fps                | 845      |
| nupdates           | 1048700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5243500  |
| value_loss         | 0.000755 |
---------------------------------
---------------------------------
| explained_variance | 0.352    |
| fps                | 845      |
| nupdates           | 1048800  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5244000  |
| value_loss         | 0.101    |
---------------------------------
---------------------------------
| explained_variance | 0.792    |
| fps                | 845      |
| nupdates           | 1048900  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -25.1    |
| fps                | 844      |
| nupdates           | 1051600  |
| policy_entropy     | 2.04     |
| total_timesteps    | 5258000  |
| value_loss         | 0.00087  |
---------------------------------
---------------------------------
| explained_variance | 0.309    |
| fps                | 844      |
| nupdates           | 1051700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5258500  |
| value_loss         | 2.54e-05 |
---------------------------------
----------------------------------
| explained_variance | -1.87e+03 |
| fps                | 844       |
| nupdates           | 1051800   |
| policy_entropy     | 2.07      |
| total_timesteps    | 5259000   |
| value_loss         | 0.0864    |
----------------------------------
---------------------------------
| explained_variance | -0.996   |
| fps                | 844      |
| nupdates           | 1051900  |
| policy_entropy     | 2.07     |
| tota

---------------------------------
| explained_variance | -0.319   |
| fps                | 845      |
| nupdates           | 1054700  |
| policy_entropy     | 2.04     |
| total_timesteps    | 5273500  |
| value_loss         | 0.000122 |
---------------------------------
---------------------------------
| explained_variance | 0.921    |
| fps                | 845      |
| nupdates           | 1054800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5274000  |
| value_loss         | 1.89e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.0866  |
| fps                | 845      |
| nupdates           | 1054900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5274500  |
| value_loss         | 0.000217 |
---------------------------------
Eval num_timesteps=5275000, episode_reward=-5.00 +/- 0.00
Episode length: 688.60 +/- 177.54
---------------------------------
| explained_variance | -491     |
| fps                | 8

---------------------------------
| explained_variance | -2.27    |
| fps                | 844      |
| nupdates           | 1057700  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5288500  |
| value_loss         | 5.24e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.595    |
| fps                | 844      |
| nupdates           | 1057800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5289000  |
| value_loss         | 1.86e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.833    |
| fps                | 844      |
| nupdates           | 1057900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5289500  |
| value_loss         | 0.000286 |
---------------------------------
---------------------------------
| explained_variance | 0.894    |
| fps                | 844      |
| nupdates           | 1058000  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.224    |
| fps                | 844      |
| nupdates           | 1060700  |
| policy_entropy     | 2.04     |
| total_timesteps    | 5303500  |
| value_loss         | 0.000372 |
---------------------------------
---------------------------------
| explained_variance | -0.15    |
| fps                | 844      |
| nupdates           | 1060800  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5304000  |
| value_loss         | 0.000243 |
---------------------------------
---------------------------------
| explained_variance | 0.457    |
| fps                | 844      |
| nupdates           | 1060900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5304500  |
| value_loss         | 2.8e-05  |
---------------------------------
---------------------------------
| explained_variance | -0.00676 |
| fps                | 844      |
| nupdates           | 1061000  |
| policy_entropy     | 2.02     |
| total_timest

---------------------------------
| explained_variance | 0.444    |
| fps                | 844      |
| nupdates           | 1063800  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5319000  |
| value_loss         | 0.000153 |
---------------------------------
---------------------------------
| explained_variance | 0.587    |
| fps                | 844      |
| nupdates           | 1063900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5319500  |
| value_loss         | 6.98e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.471    |
| fps                | 844      |
| nupdates           | 1064000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5320000  |
| value_loss         | 3.97e-05 |
---------------------------------
----------------------------------
| explained_variance | -2.61e+03 |
| fps                | 844       |
| nupdates           | 1064100   |
| policy_entropy     | 2.07      |
| total_t

---------------------------------
| explained_variance | -5.15    |
| fps                | 844      |
| nupdates           | 1066800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5334000  |
| value_loss         | 0.000735 |
---------------------------------
---------------------------------
| explained_variance | 0.908    |
| fps                | 844      |
| nupdates           | 1066900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5334500  |
| value_loss         | 1.19e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.954    |
| fps                | 844      |
| nupdates           | 1067000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5335000  |
| value_loss         | 1.3e-05  |
---------------------------------
---------------------------------
| explained_variance | -0.7     |
| fps                | 844      |
| nupdates           | 1067100  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -1.06    |
| fps                | 844      |
| nupdates           | 1069900  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5349500  |
| value_loss         | 0.00627  |
---------------------------------
Eval num_timesteps=5350000, episode_reward=-4.80 +/- 0.40
Episode length: 566.60 +/- 68.68
---------------------------------
| explained_variance | 0.784    |
| fps                | 843      |
| nupdates           | 1070000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5350000  |
| value_loss         | 2.98e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.867    |
| fps                | 843      |
| nupdates           | 1070100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5350500  |
| value_loss         | 4.89e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.243    |
| fps                | 84

---------------------------------
| explained_variance | -1.65    |
| fps                | 843      |
| nupdates           | 1072900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5364500  |
| value_loss         | 0.000129 |
---------------------------------
---------------------------------
| explained_variance | 0.308    |
| fps                | 843      |
| nupdates           | 1073000  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5365000  |
| value_loss         | 0.000182 |
---------------------------------
---------------------------------
| explained_variance | 0.287    |
| fps                | 843      |
| nupdates           | 1073100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5365500  |
| value_loss         | 4.82e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.71    |
| fps                | 843      |
| nupdates           | 1073200  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.203    |
| fps                | 841      |
| nupdates           | 1075900  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5379500  |
| value_loss         | 0.000265 |
---------------------------------
---------------------------------
| explained_variance | 0.967    |
| fps                | 841      |
| nupdates           | 1076000  |
| policy_entropy     | 2.02     |
| total_timesteps    | 5380000  |
| value_loss         | 6.27e-07 |
---------------------------------
---------------------------------
| explained_variance | -5.33    |
| fps                | 841      |
| nupdates           | 1076100  |
| policy_entropy     | 2.04     |
| total_timesteps    | 5380500  |
| value_loss         | 0.00978  |
---------------------------------
---------------------------------
| explained_variance | -0.0059  |
| fps                | 841      |
| nupdates           | 1076200  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.473    |
| fps                | 841      |
| nupdates           | 1079000  |
| policy_entropy     | 2.03     |
| total_timesteps    | 5395000  |
| value_loss         | 0.000368 |
---------------------------------
---------------------------------
| explained_variance | 0.791    |
| fps                | 841      |
| nupdates           | 1079100  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5395500  |
| value_loss         | 0.000225 |
---------------------------------
---------------------------------
| explained_variance | 0.243    |
| fps                | 841      |
| nupdates           | 1079200  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5396000  |
| value_loss         | 0.000151 |
---------------------------------
---------------------------------
| explained_variance | 0.979    |
| fps                | 841      |
| nupdates           | 1079300  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.647    |
| fps                | 841      |
| nupdates           | 1082000  |
| policy_entropy     | 2.01     |
| total_timesteps    | 5410000  |
| value_loss         | 0.000173 |
---------------------------------
---------------------------------
| explained_variance | 0.923    |
| fps                | 841      |
| nupdates           | 1082100  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5410500  |
| value_loss         | 1.6e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.991    |
| fps                | 841      |
| nupdates           | 1082200  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5411000  |
| value_loss         | 4.01e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.671    |
| fps                | 841      |
| nupdates           | 1082300  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.872    |
| fps                | 840      |
| nupdates           | 1085100  |
| policy_entropy     | 2.04     |
| total_timesteps    | 5425500  |
| value_loss         | 4.25e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.763    |
| fps                | 840      |
| nupdates           | 1085200  |
| policy_entropy     | 2.04     |
| total_timesteps    | 5426000  |
| value_loss         | 6.89e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.605    |
| fps                | 840      |
| nupdates           | 1085300  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5426500  |
| value_loss         | 2.97e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.09    |
| fps                | 840      |
| nupdates           | 1085400  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -2.07    |
| fps                | 841      |
| nupdates           | 1088200  |
| policy_entropy     | 2.01     |
| total_timesteps    | 5441000  |
| value_loss         | 0.00254  |
---------------------------------
---------------------------------
| explained_variance | -0.786   |
| fps                | 841      |
| nupdates           | 1088300  |
| policy_entropy     | 2.03     |
| total_timesteps    | 5441500  |
| value_loss         | 0.00019  |
---------------------------------
---------------------------------
| explained_variance | 0.893    |
| fps                | 841      |
| nupdates           | 1088400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5442000  |
| value_loss         | 1.94e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.57     |
| fps                | 841      |
| nupdates           | 1088500  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.107    |
| fps                | 840      |
| nupdates           | 1091200  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5456000  |
| value_loss         | 0.000102 |
---------------------------------
---------------------------------
| explained_variance | 0.948    |
| fps                | 840      |
| nupdates           | 1091300  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5456500  |
| value_loss         | 0.000855 |
---------------------------------
---------------------------------
| explained_variance | -6.25    |
| fps                | 840      |
| nupdates           | 1091400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5457000  |
| value_loss         | 0.000796 |
---------------------------------
---------------------------------
| explained_variance | -0.787   |
| fps                | 840      |
| nupdates           | 1091500  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.867    |
| fps                | 841      |
| nupdates           | 1094300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5471500  |
| value_loss         | 7.48e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.56    |
| fps                | 841      |
| nupdates           | 1094400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5472000  |
| value_loss         | 2.06e-05 |
---------------------------------
---------------------------------
| explained_variance | -147     |
| fps                | 841      |
| nupdates           | 1094500  |
| policy_entropy     | 1.84     |
| total_timesteps    | 5472500  |
| value_loss         | 0.000658 |
---------------------------------
---------------------------------
| explained_variance | -0.355   |
| fps                | 841      |
| nupdates           | 1094600  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.232   |
| fps                | 840      |
| nupdates           | 1097300  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5486500  |
| value_loss         | 0.00437  |
---------------------------------
---------------------------------
| explained_variance | 0.792    |
| fps                | 840      |
| nupdates           | 1097400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5487000  |
| value_loss         | 1.68e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.971    |
| fps                | 840      |
| nupdates           | 1097500  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5487500  |
| value_loss         | 2.26e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.515    |
| fps                | 840      |
| nupdates           | 1097600  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -14.4    |
| fps                | 840      |
| nupdates           | 1100300  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5501500  |
| value_loss         | 0.00227  |
---------------------------------
---------------------------------
| explained_variance | -0.852   |
| fps                | 840      |
| nupdates           | 1100400  |
| policy_entropy     | 1.94     |
| total_timesteps    | 5502000  |
| value_loss         | 0.000247 |
---------------------------------
---------------------------------
| explained_variance | 0.673    |
| fps                | 840      |
| nupdates           | 1100500  |
| policy_entropy     | 2.03     |
| total_timesteps    | 5502500  |
| value_loss         | 0.00852  |
---------------------------------
---------------------------------
| explained_variance | 0.905    |
| fps                | 840      |
| nupdates           | 1100600  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.345    |
| fps                | 840      |
| nupdates           | 1103400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5517000  |
| value_loss         | 0.000403 |
---------------------------------
---------------------------------
| explained_variance | 0.931    |
| fps                | 840      |
| nupdates           | 1103500  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5517500  |
| value_loss         | 2.29e-06 |
---------------------------------
---------------------------------
| explained_variance | -7.16    |
| fps                | 840      |
| nupdates           | 1103600  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5518000  |
| value_loss         | 0.00141  |
---------------------------------
---------------------------------
| explained_variance | 0.999    |
| fps                | 840      |
| nupdates           | 1103700  |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | -10.3    |
| fps                | 840      |
| nupdates           | 1106400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5532000  |
| value_loss         | 0.00164  |
---------------------------------
---------------------------------
| explained_variance | 0.972    |
| fps                | 840      |
| nupdates           | 1106500  |
| policy_entropy     | 2.04     |
| total_timesteps    | 5532500  |
| value_loss         | 1.75e-05 |
---------------------------------
---------------------------------
| explained_variance | -10.2    |
| fps                | 840      |
| nupdates           | 1106600  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5533000  |
| value_loss         | 0.00044  |
---------------------------------
---------------------------------
| explained_variance | 0.979    |
| fps                | 840      |
| nupdates           | 1106700  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.716    |
| fps                | 840      |
| nupdates           | 1109500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5547500  |
| value_loss         | 4.08e-05 |
---------------------------------
---------------------------------
| explained_variance | -3.01    |
| fps                | 840      |
| nupdates           | 1109600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5548000  |
| value_loss         | 0.0012   |
---------------------------------
---------------------------------
| explained_variance | 0.94     |
| fps                | 840      |
| nupdates           | 1109700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5548500  |
| value_loss         | 0.000105 |
---------------------------------
---------------------------------
| explained_variance | 0.264    |
| fps                | 840      |
| nupdates           | 1109800  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.0803   |
| fps                | 840      |
| nupdates           | 1112500  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5562500  |
| value_loss         | 0.000345 |
---------------------------------
---------------------------------
| explained_variance | 0.698    |
| fps                | 840      |
| nupdates           | 1112600  |
| policy_entropy     | 2.04     |
| total_timesteps    | 5563000  |
| value_loss         | 0.000249 |
---------------------------------
---------------------------------
| explained_variance | -2.36    |
| fps                | 840      |
| nupdates           | 1112700  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5563500  |
| value_loss         | 0.000103 |
---------------------------------
---------------------------------
| explained_variance | 0.928    |
| fps                | 840      |
| nupdates           | 1112800  |
| policy_entropy     | 2.06     |
| total_timest

----------------------------------
| explained_variance | -3.19e+03 |
| fps                | 840       |
| nupdates           | 1115500   |
| policy_entropy     | 1.97      |
| total_timesteps    | 5577500   |
| value_loss         | 0.0644    |
----------------------------------
---------------------------------
| explained_variance | 0.221    |
| fps                | 840      |
| nupdates           | 1115600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5578000  |
| value_loss         | 1.48e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.845    |
| fps                | 840      |
| nupdates           | 1115700  |
| policy_entropy     | 1.93     |
| total_timesteps    | 5578500  |
| value_loss         | 0.00153  |
---------------------------------
---------------------------------
| explained_variance | 0.991    |
| fps                | 840      |
| nupdates           | 1115800  |
| policy_entropy     | 1.84     |
| tota

---------------------------------
| explained_variance | -0.243   |
| fps                | 840      |
| nupdates           | 1118600  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5593000  |
| value_loss         | 0.000214 |
---------------------------------
---------------------------------
| explained_variance | -0.213   |
| fps                | 840      |
| nupdates           | 1118700  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5593500  |
| value_loss         | 0.000295 |
---------------------------------
---------------------------------
| explained_variance | 0.161    |
| fps                | 840      |
| nupdates           | 1118800  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5594000  |
| value_loss         | 0.000269 |
---------------------------------
---------------------------------
| explained_variance | -0.878   |
| fps                | 840      |
| nupdates           | 1118900  |
| policy_entropy     | 1.59     |
| total_timest

---------------------------------
| explained_variance | -1.39    |
| fps                | 840      |
| nupdates           | 1121600  |
| policy_entropy     | 1.98     |
| total_timesteps    | 5608000  |
| value_loss         | 0.0015   |
---------------------------------
---------------------------------
| explained_variance | 0.382    |
| fps                | 840      |
| nupdates           | 1121700  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5608500  |
| value_loss         | 0.000142 |
---------------------------------
---------------------------------
| explained_variance | -0.111   |
| fps                | 840      |
| nupdates           | 1121800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5609000  |
| value_loss         | 5.3e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.947    |
| fps                | 840      |
| nupdates           | 1121900  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -0.963   |
| fps                | 840      |
| nupdates           | 1124700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5623500  |
| value_loss         | 0.000143 |
---------------------------------
---------------------------------
| explained_variance | 0.532    |
| fps                | 840      |
| nupdates           | 1124800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5624000  |
| value_loss         | 5.81e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.977   |
| fps                | 840      |
| nupdates           | 1124900  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5624500  |
| value_loss         | 0.000745 |
---------------------------------
Eval num_timesteps=5625000, episode_reward=-4.80 +/- 0.40
Episode length: 576.10 +/- 119.90
---------------------------------
| explained_variance | 0.685    |
| fps                | 8

---------------------------------
| explained_variance | 0.993    |
| fps                | 840      |
| nupdates           | 1127700  |
| policy_entropy     | 2.03     |
| total_timesteps    | 5638500  |
| value_loss         | 1.18e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.591    |
| fps                | 840      |
| nupdates           | 1127800  |
| policy_entropy     | 2.01     |
| total_timesteps    | 5639000  |
| value_loss         | 9.23e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.97     |
| fps                | 840      |
| nupdates           | 1127900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5639500  |
| value_loss         | 1.65e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.656    |
| fps                | 840      |
| nupdates           | 1128000  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.152   |
| fps                | 840      |
| nupdates           | 1130700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5653500  |
| value_loss         | 0.000146 |
---------------------------------
---------------------------------
| explained_variance | 0.0847   |
| fps                | 840      |
| nupdates           | 1130800  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5654000  |
| value_loss         | 5.91e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.849    |
| fps                | 840      |
| nupdates           | 1130900  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5654500  |
| value_loss         | 1.51e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.973    |
| fps                | 840      |
| nupdates           | 1131000  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.29     |
| fps                | 840      |
| nupdates           | 1133800  |
| policy_entropy     | 2.01     |
| total_timesteps    | 5669000  |
| value_loss         | 0.229    |
---------------------------------
---------------------------------
| explained_variance | 0.987    |
| fps                | 840      |
| nupdates           | 1133900  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5669500  |
| value_loss         | 3.34e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.812    |
| fps                | 840      |
| nupdates           | 1134000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5670000  |
| value_loss         | 8.72e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.937    |
| fps                | 840      |
| nupdates           | 1134100  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.953    |
| fps                | 840      |
| nupdates           | 1136800  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5684000  |
| value_loss         | 3.87e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.449    |
| fps                | 840      |
| nupdates           | 1136900  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5684500  |
| value_loss         | 0.000334 |
---------------------------------
---------------------------------
| explained_variance | 0.96     |
| fps                | 840      |
| nupdates           | 1137000  |
| policy_entropy     | 2.04     |
| total_timesteps    | 5685000  |
| value_loss         | 8.47e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.895    |
| fps                | 840      |
| nupdates           | 1137100  |
| policy_entropy     | 2.02     |
| total_timest

---------------------------------
| explained_variance | -4.9     |
| fps                | 841      |
| nupdates           | 1139900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5699500  |
| value_loss         | 0.000215 |
---------------------------------
Eval num_timesteps=5700000, episode_reward=-4.80 +/- 0.40
Episode length: 641.80 +/- 185.38
---------------------------------
| explained_variance | 0.0379   |
| fps                | 840      |
| nupdates           | 1140000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5700000  |
| value_loss         | 0.000141 |
---------------------------------
---------------------------------
| explained_variance | -2.94    |
| fps                | 840      |
| nupdates           | 1140100  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5700500  |
| value_loss         | 0.0017   |
---------------------------------
---------------------------------
| explained_variance | 0.27     |
| fps                | 8

---------------------------------
| explained_variance | 0.136    |
| fps                | 840      |
| nupdates           | 1142900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5714500  |
| value_loss         | 0.00015  |
---------------------------------
---------------------------------
| explained_variance | 0.995    |
| fps                | 840      |
| nupdates           | 1143000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5715000  |
| value_loss         | 7.24e-07 |
---------------------------------
---------------------------------
| explained_variance | 0.719    |
| fps                | 840      |
| nupdates           | 1143100  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5715500  |
| value_loss         | 4.51e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.98     |
| fps                | 840      |
| nupdates           | 1143200  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.929    |
| fps                | 840      |
| nupdates           | 1145900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5729500  |
| value_loss         | 4.15e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.843    |
| fps                | 840      |
| nupdates           | 1146000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5730000  |
| value_loss         | 0.000351 |
---------------------------------
---------------------------------
| explained_variance | 0.587    |
| fps                | 840      |
| nupdates           | 1146100  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5730500  |
| value_loss         | 9.17e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.906    |
| fps                | 840      |
| nupdates           | 1146200  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.998    |
| fps                | 841      |
| nupdates           | 1149000  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5745000  |
| value_loss         | 4.27e-07 |
---------------------------------
---------------------------------
| explained_variance | 0.561    |
| fps                | 841      |
| nupdates           | 1149100  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5745500  |
| value_loss         | 0.000198 |
---------------------------------
---------------------------------
| explained_variance | 0.151    |
| fps                | 841      |
| nupdates           | 1149200  |
| policy_entropy     | 2.04     |
| total_timesteps    | 5746000  |
| value_loss         | 2.21e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.13    |
| fps                | 841      |
| nupdates           | 1149300  |
| policy_entropy     | 1.9      |
| total_timest

---------------------------------
| explained_variance | 0.937    |
| fps                | 840      |
| nupdates           | 1152000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5760000  |
| value_loss         | 6.17e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.922    |
| fps                | 840      |
| nupdates           | 1152100  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5760500  |
| value_loss         | 0.000231 |
---------------------------------
---------------------------------
| explained_variance | 0.817    |
| fps                | 840      |
| nupdates           | 1152200  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5761000  |
| value_loss         | 0.000159 |
---------------------------------
---------------------------------
| explained_variance | 0.58     |
| fps                | 840      |
| nupdates           | 1152300  |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | 0.896    |
| fps                | 840      |
| nupdates           | 1155100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5775500  |
| value_loss         | 7.11e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.595    |
| fps                | 840      |
| nupdates           | 1155200  |
| policy_entropy     | 2        |
| total_timesteps    | 5776000  |
| value_loss         | 0.000527 |
---------------------------------
---------------------------------
| explained_variance | -0.13    |
| fps                | 840      |
| nupdates           | 1155300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5776500  |
| value_loss         | 0.000295 |
---------------------------------
---------------------------------
| explained_variance | -535     |
| fps                | 840      |
| nupdates           | 1155400  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.297    |
| fps                | 840      |
| nupdates           | 1158200  |
| policy_entropy     | 2.02     |
| total_timesteps    | 5791000  |
| value_loss         | 0.000233 |
---------------------------------
---------------------------------
| explained_variance | 0.995    |
| fps                | 840      |
| nupdates           | 1158300  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5791500  |
| value_loss         | 7.9e-06  |
---------------------------------
---------------------------------
| explained_variance | -2.49    |
| fps                | 840      |
| nupdates           | 1158400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5792000  |
| value_loss         | 0.000214 |
---------------------------------
---------------------------------
| explained_variance | 0.751    |
| fps                | 840      |
| nupdates           | 1158500  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.699    |
| fps                | 840      |
| nupdates           | 1161200  |
| policy_entropy     | 1.83     |
| total_timesteps    | 5806000  |
| value_loss         | 0.00276  |
---------------------------------
---------------------------------
| explained_variance | 0.982    |
| fps                | 840      |
| nupdates           | 1161300  |
| policy_entropy     | 2.03     |
| total_timesteps    | 5806500  |
| value_loss         | 5.09e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.932    |
| fps                | 840      |
| nupdates           | 1161400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5807000  |
| value_loss         | 5.61e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.617    |
| fps                | 840      |
| nupdates           | 1161500  |
| policy_entropy     | 2.01     |
| total_timest

----------------------------------
| explained_variance | -1.04e+03 |
| fps                | 841       |
| nupdates           | 1164300   |
| policy_entropy     | 2.04      |
| total_timesteps    | 5821500   |
| value_loss         | 0.0877    |
----------------------------------
---------------------------------
| explained_variance | 0.883    |
| fps                | 841      |
| nupdates           | 1164400  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5822000  |
| value_loss         | 3.88e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.949    |
| fps                | 841      |
| nupdates           | 1164500  |
| policy_entropy     | 2.04     |
| total_timesteps    | 5822500  |
| value_loss         | 9.41e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.48     |
| fps                | 841      |
| nupdates           | 1164600  |
| policy_entropy     | 2.03     |
| tota

---------------------------------
| explained_variance | 0.332    |
| fps                | 840      |
| nupdates           | 1167300  |
| policy_entropy     | 1.58     |
| total_timesteps    | 5836500  |
| value_loss         | 0.184    |
---------------------------------
---------------------------------
| explained_variance | 0.981    |
| fps                | 840      |
| nupdates           | 1167400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5837000  |
| value_loss         | 6.53e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.529    |
| fps                | 840      |
| nupdates           | 1167500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5837500  |
| value_loss         | 0.000127 |
---------------------------------
---------------------------------
| explained_variance | 0.802    |
| fps                | 840      |
| nupdates           | 1167600  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -0.379   |
| fps                | 840      |
| nupdates           | 1170300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5851500  |
| value_loss         | 4.64e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.996    |
| fps                | 840      |
| nupdates           | 1170400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5852000  |
| value_loss         | 6.54e-07 |
---------------------------------
---------------------------------
| explained_variance | -7.31    |
| fps                | 840      |
| nupdates           | 1170500  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5852500  |
| value_loss         | 0.00022  |
---------------------------------
---------------------------------
| explained_variance | 0.914    |
| fps                | 840      |
| nupdates           | 1170600  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.56    |
| fps                | 841      |
| nupdates           | 1173400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5867000  |
| value_loss         | 0.000296 |
---------------------------------
---------------------------------
| explained_variance | -6.71    |
| fps                | 841      |
| nupdates           | 1173500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5867500  |
| value_loss         | 0.00109  |
---------------------------------
---------------------------------
| explained_variance | 0.843    |
| fps                | 841      |
| nupdates           | 1173600  |
| policy_entropy     | 2        |
| total_timesteps    | 5868000  |
| value_loss         | 4.4e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.828    |
| fps                | 841      |
| nupdates           | 1173700  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.553    |
| fps                | 841      |
| nupdates           | 1176400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5882000  |
| value_loss         | 5.9e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.692    |
| fps                | 841      |
| nupdates           | 1176500  |
| policy_entropy     | 2.03     |
| total_timesteps    | 5882500  |
| value_loss         | 0.000144 |
---------------------------------
---------------------------------
| explained_variance | 0.832    |
| fps                | 841      |
| nupdates           | 1176600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5883000  |
| value_loss         | 5.39e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.823    |
| fps                | 841      |
| nupdates           | 1176700  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.869    |
| fps                | 841      |
| nupdates           | 1179500  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5897500  |
| value_loss         | 3.26e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.671    |
| fps                | 841      |
| nupdates           | 1179600  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5898000  |
| value_loss         | 4.23e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.118    |
| fps                | 841      |
| nupdates           | 1179700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5898500  |
| value_loss         | 0.000754 |
---------------------------------
---------------------------------
| explained_variance | 0.895    |
| fps                | 841      |
| nupdates           | 1179800  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.984    |
| fps                | 841      |
| nupdates           | 1182500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5912500  |
| value_loss         | 2.22e-05 |
---------------------------------
---------------------------------
| explained_variance | -39.5    |
| fps                | 841      |
| nupdates           | 1182600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5913000  |
| value_loss         | 0.0198   |
---------------------------------
---------------------------------
| explained_variance | -14.5    |
| fps                | 841      |
| nupdates           | 1182700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5913500  |
| value_loss         | 0.00458  |
---------------------------------
---------------------------------
| explained_variance | -0.214   |
| fps                | 841      |
| nupdates           | 1182800  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -1.1     |
| fps                | 840      |
| nupdates           | 1185500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5927500  |
| value_loss         | 3.23e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.605    |
| fps                | 840      |
| nupdates           | 1185600  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5928000  |
| value_loss         | 0.000131 |
---------------------------------
---------------------------------
| explained_variance | 0.544    |
| fps                | 840      |
| nupdates           | 1185700  |
| policy_entropy     | 2.04     |
| total_timesteps    | 5928500  |
| value_loss         | 5.31e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.718    |
| fps                | 840      |
| nupdates           | 1185800  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.802    |
| fps                | 841      |
| nupdates           | 1188600  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5943000  |
| value_loss         | 0.000154 |
---------------------------------
---------------------------------
| explained_variance | 0.756    |
| fps                | 841      |
| nupdates           | 1188700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5943500  |
| value_loss         | 2.34e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.964    |
| fps                | 841      |
| nupdates           | 1188800  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5944000  |
| value_loss         | 9.94e-07 |
---------------------------------
---------------------------------
| explained_variance | -8.91    |
| fps                | 841      |
| nupdates           | 1188900  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.813    |
| fps                | 841      |
| nupdates           | 1191600  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5958000  |
| value_loss         | 8.78e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.958    |
| fps                | 841      |
| nupdates           | 1191700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5958500  |
| value_loss         | 2.99e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.376    |
| fps                | 841      |
| nupdates           | 1191800  |
| policy_entropy     | 2.02     |
| total_timesteps    | 5959000  |
| value_loss         | 0.145    |
---------------------------------
---------------------------------
| explained_variance | 0.324    |
| fps                | 841      |
| nupdates           | 1191900  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.643    |
| fps                | 841      |
| nupdates           | 1194700  |
| policy_entropy     | 1.99     |
| total_timesteps    | 5973500  |
| value_loss         | 0.00241  |
---------------------------------
---------------------------------
| explained_variance | 0.896    |
| fps                | 841      |
| nupdates           | 1194800  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5974000  |
| value_loss         | 8.57e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.774    |
| fps                | 841      |
| nupdates           | 1194900  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5974500  |
| value_loss         | 0.000221 |
---------------------------------
Eval num_timesteps=5975000, episode_reward=-5.00 +/- 0.00
Episode length: 603.60 +/- 71.08
---------------------------------
| explained_variance | -1.16    |
| fps                | 84

---------------------------------
| explained_variance | 0.781    |
| fps                | 841      |
| nupdates           | 1197700  |
| policy_entropy     | 2.04     |
| total_timesteps    | 5988500  |
| value_loss         | 0.00012  |
---------------------------------
---------------------------------
| explained_variance | 0.744    |
| fps                | 841      |
| nupdates           | 1197800  |
| policy_entropy     | 2.04     |
| total_timesteps    | 5989000  |
| value_loss         | 1.63e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.585    |
| fps                | 841      |
| nupdates           | 1197900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5989500  |
| value_loss         | 0.000654 |
---------------------------------
---------------------------------
| explained_variance | 0.211    |
| fps                | 841      |
| nupdates           | 1198000  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.895    |
| fps                | 841      |
| nupdates           | 1200700  |
| policy_entropy     | 2.04     |
| total_timesteps    | 6003500  |
| value_loss         | 3.59e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.152    |
| fps                | 841      |
| nupdates           | 1200800  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6004000  |
| value_loss         | 0.000308 |
---------------------------------
---------------------------------
| explained_variance | 0.957    |
| fps                | 841      |
| nupdates           | 1200900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6004500  |
| value_loss         | 8.37e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.755    |
| fps                | 841      |
| nupdates           | 1201000  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.164    |
| fps                | 841      |
| nupdates           | 1203800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6019000  |
| value_loss         | 0.000181 |
---------------------------------
---------------------------------
| explained_variance | -0.335   |
| fps                | 841      |
| nupdates           | 1203900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6019500  |
| value_loss         | 0.000106 |
---------------------------------
---------------------------------
| explained_variance | 0.97     |
| fps                | 841      |
| nupdates           | 1204000  |
| policy_entropy     | 2.08     |
| total_timesteps    | 6020000  |
| value_loss         | 6.07e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.756    |
| fps                | 841      |
| nupdates           | 1204100  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.0318  |
| fps                | 841      |
| nupdates           | 1206800  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6034000  |
| value_loss         | 0.000304 |
---------------------------------
---------------------------------
| explained_variance | 0.785    |
| fps                | 841      |
| nupdates           | 1206900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6034500  |
| value_loss         | 1.61e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.674    |
| fps                | 841      |
| nupdates           | 1207000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6035000  |
| value_loss         | 0.000315 |
---------------------------------
---------------------------------
| explained_variance | 0.963    |
| fps                | 841      |
| nupdates           | 1207100  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -0.136   |
| fps                | 841      |
| nupdates           | 1209900  |
| policy_entropy     | 2.03     |
| total_timesteps    | 6049500  |
| value_loss         | 0.000135 |
---------------------------------
Eval num_timesteps=6050000, episode_reward=-4.90 +/- 0.30
Episode length: 700.20 +/- 144.94
---------------------------------
| explained_variance | 0.021    |
| fps                | 840      |
| nupdates           | 1210000  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6050000  |
| value_loss         | 0.000378 |
---------------------------------
---------------------------------
| explained_variance | 0.358    |
| fps                | 841      |
| nupdates           | 1210100  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6050500  |
| value_loss         | 0.000264 |
---------------------------------
---------------------------------
| explained_variance | 0.979    |
| fps                | 8

---------------------------------
| explained_variance | 0.828    |
| fps                | 841      |
| nupdates           | 1212900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6064500  |
| value_loss         | 1.4e-05  |
---------------------------------
---------------------------------
| explained_variance | -0.126   |
| fps                | 841      |
| nupdates           | 1213000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6065000  |
| value_loss         | 0.00027  |
---------------------------------
---------------------------------
| explained_variance | 0.723    |
| fps                | 841      |
| nupdates           | 1213100  |
| policy_entropy     | 2.04     |
| total_timesteps    | 6065500  |
| value_loss         | 1.44e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.921    |
| fps                | 841      |
| nupdates           | 1213200  |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | -5.72    |
| fps                | 841      |
| nupdates           | 1215900  |
| policy_entropy     | 2.04     |
| total_timesteps    | 6079500  |
| value_loss         | 0.000433 |
---------------------------------
---------------------------------
| explained_variance | 0.689    |
| fps                | 841      |
| nupdates           | 1216000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6080000  |
| value_loss         | 9.92e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.169    |
| fps                | 841      |
| nupdates           | 1216100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6080500  |
| value_loss         | 2.59e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.27    |
| fps                | 841      |
| nupdates           | 1216200  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.967    |
| fps                | 841      |
| nupdates           | 1219000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6095000  |
| value_loss         | 0.000384 |
---------------------------------
---------------------------------
| explained_variance | 0.993    |
| fps                | 841      |
| nupdates           | 1219100  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6095500  |
| value_loss         | 1.55e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.0499   |
| fps                | 841      |
| nupdates           | 1219200  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6096000  |
| value_loss         | 0.000276 |
---------------------------------
---------------------------------
| explained_variance | 0.808    |
| fps                | 841      |
| nupdates           | 1219300  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.378   |
| fps                | 841      |
| nupdates           | 1222000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6110000  |
| value_loss         | 0.00138  |
---------------------------------
---------------------------------
| explained_variance | 0.286    |
| fps                | 841      |
| nupdates           | 1222100  |
| policy_entropy     | 1.94     |
| total_timesteps    | 6110500  |
| value_loss         | 0.000448 |
---------------------------------
---------------------------------
| explained_variance | -0.588   |
| fps                | 841      |
| nupdates           | 1222200  |
| policy_entropy     | 2.04     |
| total_timesteps    | 6111000  |
| value_loss         | 7.2e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.864    |
| fps                | 841      |
| nupdates           | 1222300  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -4.74    |
| fps                | 841      |
| nupdates           | 1225100  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6125500  |
| value_loss         | 0.00563  |
---------------------------------
---------------------------------
| explained_variance | -28.5    |
| fps                | 841      |
| nupdates           | 1225200  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6126000  |
| value_loss         | 0.000661 |
---------------------------------
---------------------------------
| explained_variance | 0.816    |
| fps                | 841      |
| nupdates           | 1225300  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6126500  |
| value_loss         | 0.000173 |
---------------------------------
---------------------------------
| explained_variance | 0.956    |
| fps                | 841      |
| nupdates           | 1225400  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.606    |
| fps                | 841      |
| nupdates           | 1228200  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6141000  |
| value_loss         | 0.000585 |
---------------------------------
---------------------------------
| explained_variance | 0.646    |
| fps                | 841      |
| nupdates           | 1228300  |
| policy_entropy     | 2.04     |
| total_timesteps    | 6141500  |
| value_loss         | 6.46e-06 |
---------------------------------
---------------------------------
| explained_variance | -1.55    |
| fps                | 841      |
| nupdates           | 1228400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6142000  |
| value_loss         | 0.000905 |
---------------------------------
---------------------------------
| explained_variance | 0.919    |
| fps                | 841      |
| nupdates           | 1228500  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -3.44    |
| fps                | 841      |
| nupdates           | 1231200  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6156000  |
| value_loss         | 2.75e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.995    |
| fps                | 841      |
| nupdates           | 1231300  |
| policy_entropy     | 2.08     |
| total_timesteps    | 6156500  |
| value_loss         | 8.32e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.507    |
| fps                | 841      |
| nupdates           | 1231400  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6157000  |
| value_loss         | 0.000169 |
---------------------------------
---------------------------------
| explained_variance | 0.998    |
| fps                | 841      |
| nupdates           | 1231500  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.865    |
| fps                | 842      |
| nupdates           | 1234300  |
| policy_entropy     | 2.02     |
| total_timesteps    | 6171500  |
| value_loss         | 7.77e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.636    |
| fps                | 842      |
| nupdates           | 1234400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6172000  |
| value_loss         | 0.000166 |
---------------------------------
---------------------------------
| explained_variance | -1.15    |
| fps                | 842      |
| nupdates           | 1234500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6172500  |
| value_loss         | 0.000805 |
---------------------------------
---------------------------------
| explained_variance | 0.864    |
| fps                | 842      |
| nupdates           | 1234600  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.8      |
| fps                | 842      |
| nupdates           | 1237300  |
| policy_entropy     | 2.02     |
| total_timesteps    | 6186500  |
| value_loss         | 6.68e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.541    |
| fps                | 842      |
| nupdates           | 1237400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6187000  |
| value_loss         | 6.6e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.537    |
| fps                | 842      |
| nupdates           | 1237500  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6187500  |
| value_loss         | 0.935    |
---------------------------------
---------------------------------
| explained_variance | 0.163    |
| fps                | 842      |
| nupdates           | 1237600  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -177     |
| fps                | 841      |
| nupdates           | 1240300  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6201500  |
| value_loss         | 0.0528   |
---------------------------------
---------------------------------
| explained_variance | -0.378   |
| fps                | 841      |
| nupdates           | 1240400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6202000  |
| value_loss         | 0.000204 |
---------------------------------
---------------------------------
| explained_variance | 0.444    |
| fps                | 841      |
| nupdates           | 1240500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6202500  |
| value_loss         | 3.41e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.276   |
| fps                | 842      |
| nupdates           | 1240600  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.297    |
| fps                | 842      |
| nupdates           | 1243400  |
| policy_entropy     | 2.03     |
| total_timesteps    | 6217000  |
| value_loss         | 0.000539 |
---------------------------------
---------------------------------
| explained_variance | 0.336    |
| fps                | 842      |
| nupdates           | 1243500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6217500  |
| value_loss         | 0.00014  |
---------------------------------
---------------------------------
| explained_variance | 0.958    |
| fps                | 842      |
| nupdates           | 1243600  |
| policy_entropy     | 2.08     |
| total_timesteps    | 6218000  |
| value_loss         | 9.93e-06 |
---------------------------------
---------------------------------
| explained_variance | -0.355   |
| fps                | 842      |
| nupdates           | 1243700  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.858    |
| fps                | 842      |
| nupdates           | 1246400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6232000  |
| value_loss         | 8.93e-06 |
---------------------------------
---------------------------------
| explained_variance | -0.361   |
| fps                | 842      |
| nupdates           | 1246500  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6232500  |
| value_loss         | 1.51e-05 |
---------------------------------
---------------------------------
| explained_variance | -13.8    |
| fps                | 842      |
| nupdates           | 1246600  |
| policy_entropy     | 2.08     |
| total_timesteps    | 6233000  |
| value_loss         | 0.00438  |
---------------------------------
---------------------------------
| explained_variance | 0.162    |
| fps                | 842      |
| nupdates           | 1246700  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.675    |
| fps                | 842      |
| nupdates           | 1249500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6247500  |
| value_loss         | 1.53e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.825    |
| fps                | 842      |
| nupdates           | 1249600  |
| policy_entropy     | 2.04     |
| total_timesteps    | 6248000  |
| value_loss         | 8.79e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.988    |
| fps                | 842      |
| nupdates           | 1249700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6248500  |
| value_loss         | 3.1e-05  |
---------------------------------
---------------------------------
| explained_variance | -0.463   |
| fps                | 842      |
| nupdates           | 1249800  |
| policy_entropy     | 2.01     |
| total_timest

---------------------------------
| explained_variance | -9.87    |
| fps                | 842      |
| nupdates           | 1252500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6262500  |
| value_loss         | 0.0025   |
---------------------------------
---------------------------------
| explained_variance | 0.881    |
| fps                | 842      |
| nupdates           | 1252600  |
| policy_entropy     | 2.08     |
| total_timesteps    | 6263000  |
| value_loss         | 2.67e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.222   |
| fps                | 842      |
| nupdates           | 1252700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6263500  |
| value_loss         | 0.000432 |
---------------------------------
---------------------------------
| explained_variance | 0.917    |
| fps                | 842      |
| nupdates           | 1252800  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -43.3    |
| fps                | 842      |
| nupdates           | 1255500  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6277500  |
| value_loss         | 0.00381  |
---------------------------------
---------------------------------
| explained_variance | 0.955    |
| fps                | 842      |
| nupdates           | 1255600  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6278000  |
| value_loss         | 4.91e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.231    |
| fps                | 842      |
| nupdates           | 1255700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6278500  |
| value_loss         | 0.000236 |
---------------------------------
---------------------------------
| explained_variance | 0.724    |
| fps                | 842      |
| nupdates           | 1255800  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.973    |
| fps                | 842      |
| nupdates           | 1258600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6293000  |
| value_loss         | 3.04e-06 |
---------------------------------
---------------------------------
| explained_variance | -1.17    |
| fps                | 842      |
| nupdates           | 1258700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6293500  |
| value_loss         | 0.000211 |
---------------------------------
---------------------------------
| explained_variance | -0.887   |
| fps                | 842      |
| nupdates           | 1258800  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6294000  |
| value_loss         | 6.07e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.246    |
| fps                | 842      |
| nupdates           | 1258900  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.917    |
| fps                | 842      |
| nupdates           | 1261600  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6308000  |
| value_loss         | 0.000169 |
---------------------------------
---------------------------------
| explained_variance | 0.833    |
| fps                | 842      |
| nupdates           | 1261700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6308500  |
| value_loss         | 4.49e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.909    |
| fps                | 842      |
| nupdates           | 1261800  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6309000  |
| value_loss         | 2.05e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.973    |
| fps                | 842      |
| nupdates           | 1261900  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.709    |
| fps                | 842      |
| nupdates           | 1264700  |
| policy_entropy     | 2.03     |
| total_timesteps    | 6323500  |
| value_loss         | 5.85e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.986    |
| fps                | 842      |
| nupdates           | 1264800  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6324000  |
| value_loss         | 4.25e-06 |
---------------------------------
---------------------------------
| explained_variance | -2.28    |
| fps                | 842      |
| nupdates           | 1264900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6324500  |
| value_loss         | 7.65e-05 |
---------------------------------
Eval num_timesteps=6325000, episode_reward=-5.00 +/- 0.00
Episode length: 605.30 +/- 122.15
---------------------------------
| explained_variance | 0.857    |
| fps                | 8

---------------------------------
| explained_variance | 0.212    |
| fps                | 842      |
| nupdates           | 1267700  |
| policy_entropy     | 2.04     |
| total_timesteps    | 6338500  |
| value_loss         | 7.85e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.685    |
| fps                | 842      |
| nupdates           | 1267800  |
| policy_entropy     | 2.02     |
| total_timesteps    | 6339000  |
| value_loss         | 6.33e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.414    |
| fps                | 842      |
| nupdates           | 1267900  |
| policy_entropy     | 1.97     |
| total_timesteps    | 6339500  |
| value_loss         | 5.02e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.977    |
| fps                | 842      |
| nupdates           | 1268000  |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | -0.382   |
| fps                | 842      |
| nupdates           | 1270700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6353500  |
| value_loss         | 7.43e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.279    |
| fps                | 842      |
| nupdates           | 1270800  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6354000  |
| value_loss         | 0.00059  |
---------------------------------
---------------------------------
| explained_variance | 0.987    |
| fps                | 842      |
| nupdates           | 1270900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6354500  |
| value_loss         | 3.99e-06 |
---------------------------------
---------------------------------
| explained_variance | -59.6    |
| fps                | 842      |
| nupdates           | 1271000  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.578    |
| fps                | 843      |
| nupdates           | 1273800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6369000  |
| value_loss         | 0.000485 |
---------------------------------
---------------------------------
| explained_variance | 0.974    |
| fps                | 843      |
| nupdates           | 1273900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6369500  |
| value_loss         | 4.28e-06 |
---------------------------------
---------------------------------
| explained_variance | -0.0923  |
| fps                | 843      |
| nupdates           | 1274000  |
| policy_entropy     | 2.08     |
| total_timesteps    | 6370000  |
| value_loss         | 0.000289 |
---------------------------------
---------------------------------
| explained_variance | 0.772    |
| fps                | 843      |
| nupdates           | 1274100  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.699    |
| fps                | 843      |
| nupdates           | 1276800  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6384000  |
| value_loss         | 0.000122 |
---------------------------------
---------------------------------
| explained_variance | 0.759    |
| fps                | 843      |
| nupdates           | 1276900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6384500  |
| value_loss         | 0.000163 |
---------------------------------
---------------------------------
| explained_variance | -6.14    |
| fps                | 843      |
| nupdates           | 1277000  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6385000  |
| value_loss         | 0.000448 |
---------------------------------
---------------------------------
| explained_variance | 0.899    |
| fps                | 843      |
| nupdates           | 1277100  |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | 0.863    |
| fps                | 843      |
| nupdates           | 1279900  |
| policy_entropy     | 2.08     |
| total_timesteps    | 6399500  |
| value_loss         | 5.87e-05 |
---------------------------------
Eval num_timesteps=6400000, episode_reward=-4.80 +/- 0.40
Episode length: 735.20 +/- 175.08
---------------------------------
| explained_variance | 0.809    |
| fps                | 842      |
| nupdates           | 1280000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6400000  |
| value_loss         | 0.00114  |
---------------------------------
---------------------------------
| explained_variance | -68.4    |
| fps                | 842      |
| nupdates           | 1280100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6400500  |
| value_loss         | 0.00451  |
---------------------------------
---------------------------------
| explained_variance | 0.836    |
| fps                | 8

---------------------------------
| explained_variance | 0.725    |
| fps                | 843      |
| nupdates           | 1282900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6414500  |
| value_loss         | 0.000265 |
---------------------------------
---------------------------------
| explained_variance | -0.717   |
| fps                | 843      |
| nupdates           | 1283000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6415000  |
| value_loss         | 0.00061  |
---------------------------------
---------------------------------
| explained_variance | 0.936    |
| fps                | 843      |
| nupdates           | 1283100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6415500  |
| value_loss         | 1.7e-05  |
---------------------------------
---------------------------------
| explained_variance | -5.33    |
| fps                | 843      |
| nupdates           | 1283200  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.41     |
| fps                | 842      |
| nupdates           | 1285900  |
| policy_entropy     | 2.08     |
| total_timesteps    | 6429500  |
| value_loss         | 0.0001   |
---------------------------------
---------------------------------
| explained_variance | -0.0395  |
| fps                | 842      |
| nupdates           | 1286000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6430000  |
| value_loss         | 0.000167 |
---------------------------------
---------------------------------
| explained_variance | 0.994    |
| fps                | 842      |
| nupdates           | 1286100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6430500  |
| value_loss         | 2.59e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.98     |
| fps                | 842      |
| nupdates           | 1286200  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.921    |
| fps                | 843      |
| nupdates           | 1289000  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6445000  |
| value_loss         | 9.14e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.539    |
| fps                | 843      |
| nupdates           | 1289100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6445500  |
| value_loss         | 0.000109 |
---------------------------------
---------------------------------
| explained_variance | -0.551   |
| fps                | 843      |
| nupdates           | 1289200  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6446000  |
| value_loss         | 4.56e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.985    |
| fps                | 843      |
| nupdates           | 1289300  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.859    |
| fps                | 843      |
| nupdates           | 1292000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6460000  |
| value_loss         | 2.6e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.247    |
| fps                | 843      |
| nupdates           | 1292100  |
| policy_entropy     | 2.04     |
| total_timesteps    | 6460500  |
| value_loss         | 0.000396 |
---------------------------------
---------------------------------
| explained_variance | -21.4    |
| fps                | 843      |
| nupdates           | 1292200  |
| policy_entropy     | 1.92     |
| total_timesteps    | 6461000  |
| value_loss         | 0.0012   |
---------------------------------
---------------------------------
| explained_variance | -0.0058  |
| fps                | 843      |
| nupdates           | 1292300  |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | -2.55    |
| fps                | 843      |
| nupdates           | 1295100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6475500  |
| value_loss         | 0.000147 |
---------------------------------
---------------------------------
| explained_variance | 0.474    |
| fps                | 843      |
| nupdates           | 1295200  |
| policy_entropy     | 2.04     |
| total_timesteps    | 6476000  |
| value_loss         | 0.000505 |
---------------------------------
---------------------------------
| explained_variance | -29.8    |
| fps                | 843      |
| nupdates           | 1295300  |
| policy_entropy     | 2.03     |
| total_timesteps    | 6476500  |
| value_loss         | 0.00347  |
---------------------------------
---------------------------------
| explained_variance | 0.865    |
| fps                | 843      |
| nupdates           | 1295400  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.121    |
| fps                | 843      |
| nupdates           | 1298200  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6491000  |
| value_loss         | 0.00013  |
---------------------------------
---------------------------------
| explained_variance | 0.966    |
| fps                | 843      |
| nupdates           | 1298300  |
| policy_entropy     | 2.01     |
| total_timesteps    | 6491500  |
| value_loss         | 3.8e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.365    |
| fps                | 843      |
| nupdates           | 1298400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6492000  |
| value_loss         | 0.0991   |
---------------------------------
---------------------------------
| explained_variance | 0.782    |
| fps                | 843      |
| nupdates           | 1298500  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -1.12    |
| fps                | 843      |
| nupdates           | 1301200  |
| policy_entropy     | 2.02     |
| total_timesteps    | 6506000  |
| value_loss         | 0.000411 |
---------------------------------
---------------------------------
| explained_variance | -2.18    |
| fps                | 843      |
| nupdates           | 1301300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6506500  |
| value_loss         | 0.000779 |
---------------------------------
---------------------------------
| explained_variance | -5.75    |
| fps                | 843      |
| nupdates           | 1301400  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6507000  |
| value_loss         | 0.00502  |
---------------------------------
---------------------------------
| explained_variance | -0.298   |
| fps                | 843      |
| nupdates           | 1301500  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.118   |
| fps                | 843      |
| nupdates           | 1304300  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6521500  |
| value_loss         | 0.000579 |
---------------------------------
---------------------------------
| explained_variance | -1.73    |
| fps                | 843      |
| nupdates           | 1304400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6522000  |
| value_loss         | 0.00119  |
---------------------------------
---------------------------------
| explained_variance | 0.485    |
| fps                | 843      |
| nupdates           | 1304500  |
| policy_entropy     | 2.04     |
| total_timesteps    | 6522500  |
| value_loss         | 2.93e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.203   |
| fps                | 843      |
| nupdates           | 1304600  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.134    |
| fps                | 843      |
| nupdates           | 1307300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6536500  |
| value_loss         | 4.61e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.0352   |
| fps                | 843      |
| nupdates           | 1307400  |
| policy_entropy     | 2.08     |
| total_timesteps    | 6537000  |
| value_loss         | 4.24e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.804    |
| fps                | 843      |
| nupdates           | 1307500  |
| policy_entropy     | 2.08     |
| total_timesteps    | 6537500  |
| value_loss         | 1.14e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.505    |
| fps                | 843      |
| nupdates           | 1307600  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.767    |
| fps                | 843      |
| nupdates           | 1310300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6551500  |
| value_loss         | 4.83e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.886    |
| fps                | 843      |
| nupdates           | 1310400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6552000  |
| value_loss         | 1.49e-06 |
---------------------------------
---------------------------------
| explained_variance | -39.3    |
| fps                | 843      |
| nupdates           | 1310500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6552500  |
| value_loss         | 0.00264  |
---------------------------------
---------------------------------
| explained_variance | 0.869    |
| fps                | 843      |
| nupdates           | 1310600  |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | -1.2     |
| fps                | 844      |
| nupdates           | 1313400  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6567000  |
| value_loss         | 0.00108  |
---------------------------------
---------------------------------
| explained_variance | 0.842    |
| fps                | 844      |
| nupdates           | 1313500  |
| policy_entropy     | 2.04     |
| total_timesteps    | 6567500  |
| value_loss         | 7.95e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.96    |
| fps                | 844      |
| nupdates           | 1313600  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6568000  |
| value_loss         | 0.000121 |
---------------------------------
---------------------------------
| explained_variance | 0.998    |
| fps                | 844      |
| nupdates           | 1313700  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.533   |
| fps                | 843      |
| nupdates           | 1316400  |
| policy_entropy     | 2.08     |
| total_timesteps    | 6582000  |
| value_loss         | 0.000155 |
---------------------------------
---------------------------------
| explained_variance | 0.704    |
| fps                | 843      |
| nupdates           | 1316500  |
| policy_entropy     | 2        |
| total_timesteps    | 6582500  |
| value_loss         | 3.13e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.8      |
| fps                | 843      |
| nupdates           | 1316600  |
| policy_entropy     | 2.03     |
| total_timesteps    | 6583000  |
| value_loss         | 0.000131 |
---------------------------------
---------------------------------
| explained_variance | -3.1     |
| fps                | 844      |
| nupdates           | 1316700  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.516    |
| fps                | 844      |
| nupdates           | 1319500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6597500  |
| value_loss         | 6.07e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.146   |
| fps                | 844      |
| nupdates           | 1319600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6598000  |
| value_loss         | 0.000209 |
---------------------------------
---------------------------------
| explained_variance | 0.979    |
| fps                | 844      |
| nupdates           | 1319700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6598500  |
| value_loss         | 8.2e-06  |
---------------------------------
---------------------------------
| explained_variance | -0.0487  |
| fps                | 844      |
| nupdates           | 1319800  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.549    |
| fps                | 844      |
| nupdates           | 1322500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6612500  |
| value_loss         | 2.95e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.13    |
| fps                | 844      |
| nupdates           | 1322600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6613000  |
| value_loss         | 4.97e-05 |
---------------------------------
---------------------------------
| explained_variance | -8.23    |
| fps                | 844      |
| nupdates           | 1322700  |
| policy_entropy     | 2.02     |
| total_timesteps    | 6613500  |
| value_loss         | 0.00106  |
---------------------------------
---------------------------------
| explained_variance | 0.982    |
| fps                | 844      |
| nupdates           | 1322800  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.935    |
| fps                | 844      |
| nupdates           | 1325500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6627500  |
| value_loss         | 8.48e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.945    |
| fps                | 844      |
| nupdates           | 1325600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6628000  |
| value_loss         | 1.03e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.348    |
| fps                | 844      |
| nupdates           | 1325700  |
| policy_entropy     | 2.01     |
| total_timesteps    | 6628500  |
| value_loss         | 0.174    |
---------------------------------
---------------------------------
| explained_variance | -4.95    |
| fps                | 844      |
| nupdates           | 1325800  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.905    |
| fps                | 844      |
| nupdates           | 1328600  |
| policy_entropy     | 1.92     |
| total_timesteps    | 6643000  |
| value_loss         | 0.00021  |
---------------------------------
---------------------------------
| explained_variance | 0.887    |
| fps                | 844      |
| nupdates           | 1328700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6643500  |
| value_loss         | 4.85e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.881    |
| fps                | 844      |
| nupdates           | 1328800  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6644000  |
| value_loss         | 7.83e-05 |
---------------------------------
---------------------------------
| explained_variance | -5.72    |
| fps                | 844      |
| nupdates           | 1328900  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.0804  |
| fps                | 844      |
| nupdates           | 1331600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6658000  |
| value_loss         | 0.000235 |
---------------------------------
---------------------------------
| explained_variance | 0.899    |
| fps                | 844      |
| nupdates           | 1331700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6658500  |
| value_loss         | 1.46e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.557   |
| fps                | 844      |
| nupdates           | 1331800  |
| policy_entropy     | 1.99     |
| total_timesteps    | 6659000  |
| value_loss         | 0.000258 |
---------------------------------
---------------------------------
| explained_variance | -0.478   |
| fps                | 844      |
| nupdates           | 1331900  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.686    |
| fps                | 844      |
| nupdates           | 1334700  |
| policy_entropy     | 2.02     |
| total_timesteps    | 6673500  |
| value_loss         | 2.92e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.981    |
| fps                | 844      |
| nupdates           | 1334800  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6674000  |
| value_loss         | 7.07e-07 |
---------------------------------
---------------------------------
| explained_variance | -1.18    |
| fps                | 844      |
| nupdates           | 1334900  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6674500  |
| value_loss         | 0.00135  |
---------------------------------
Eval num_timesteps=6675000, episode_reward=-4.60 +/- 0.66
Episode length: 593.60 +/- 118.42
---------------------------------
| explained_variance | 0.99     |
| fps                | 8

---------------------------------
| explained_variance | -18.6    |
| fps                | 844      |
| nupdates           | 1337700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6688500  |
| value_loss         | 0.0007   |
---------------------------------
---------------------------------
| explained_variance | 0.787    |
| fps                | 844      |
| nupdates           | 1337800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6689000  |
| value_loss         | 0.00013  |
---------------------------------
---------------------------------
| explained_variance | 0.997    |
| fps                | 844      |
| nupdates           | 1337900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6689500  |
| value_loss         | 3.9e-06  |
---------------------------------
---------------------------------
| explained_variance | 0.99     |
| fps                | 844      |
| nupdates           | 1338000  |
| policy_entropy     | 1.97     |
| total_timest

---------------------------------
| explained_variance | -4.96    |
| fps                | 844      |
| nupdates           | 1340700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6703500  |
| value_loss         | 0.000904 |
---------------------------------
---------------------------------
| explained_variance | 0.668    |
| fps                | 844      |
| nupdates           | 1340800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6704000  |
| value_loss         | 1.1e-05  |
---------------------------------
---------------------------------
| explained_variance | -0.991   |
| fps                | 844      |
| nupdates           | 1340900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6704500  |
| value_loss         | 7.96e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.00667 |
| fps                | 844      |
| nupdates           | 1341000  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.0395   |
| fps                | 844      |
| nupdates           | 1343800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6719000  |
| value_loss         | 0.000306 |
---------------------------------
---------------------------------
| explained_variance | 0.962    |
| fps                | 844      |
| nupdates           | 1343900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6719500  |
| value_loss         | 6.52e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.958    |
| fps                | 844      |
| nupdates           | 1344000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6720000  |
| value_loss         | 3.96e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.841    |
| fps                | 844      |
| nupdates           | 1344100  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.858    |
| fps                | 844      |
| nupdates           | 1346800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6734000  |
| value_loss         | 0.00019  |
---------------------------------
---------------------------------
| explained_variance | -343     |
| fps                | 844      |
| nupdates           | 1346900  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6734500  |
| value_loss         | 0.0357   |
---------------------------------
---------------------------------
| explained_variance | -6.61    |
| fps                | 844      |
| nupdates           | 1347000  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6735000  |
| value_loss         | 0.00433  |
---------------------------------
---------------------------------
| explained_variance | 0.833    |
| fps                | 844      |
| nupdates           | 1347100  |
| policy_entropy     | 2.02     |
| total_timest

---------------------------------
| explained_variance | 0.441    |
| fps                | 844      |
| nupdates           | 1349900  |
| policy_entropy     | 2.02     |
| total_timesteps    | 6749500  |
| value_loss         | 0.135    |
---------------------------------
Eval num_timesteps=6750000, episode_reward=-4.80 +/- 0.40
Episode length: 762.80 +/- 125.80
---------------------------------
| explained_variance | 0.977    |
| fps                | 844      |
| nupdates           | 1350000  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6750000  |
| value_loss         | 1.7e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.818    |
| fps                | 844      |
| nupdates           | 1350100  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6750500  |
| value_loss         | 2.14e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.826    |
| fps                | 8

---------------------------------
| explained_variance | 0.573    |
| fps                | 844      |
| nupdates           | 1352900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6764500  |
| value_loss         | 0.000216 |
---------------------------------
---------------------------------
| explained_variance | 0.992    |
| fps                | 844      |
| nupdates           | 1353000  |
| policy_entropy     | 2.02     |
| total_timesteps    | 6765000  |
| value_loss         | 2.01e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.882    |
| fps                | 844      |
| nupdates           | 1353100  |
| policy_entropy     | 1.95     |
| total_timesteps    | 6765500  |
| value_loss         | 0.000218 |
---------------------------------
---------------------------------
| explained_variance | 0.749    |
| fps                | 844      |
| nupdates           | 1353200  |
| policy_entropy     | 2.02     |
| total_timest

---------------------------------
| explained_variance | 0.977    |
| fps                | 844      |
| nupdates           | 1355900  |
| policy_entropy     | 2.08     |
| total_timesteps    | 6779500  |
| value_loss         | 6.34e-06 |
---------------------------------
---------------------------------
| explained_variance | -1.1     |
| fps                | 844      |
| nupdates           | 1356000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6780000  |
| value_loss         | 0.000177 |
---------------------------------
---------------------------------
| explained_variance | 0.169    |
| fps                | 844      |
| nupdates           | 1356100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6780500  |
| value_loss         | 0.000337 |
---------------------------------
---------------------------------
| explained_variance | -2.04    |
| fps                | 844      |
| nupdates           | 1356200  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.938    |
| fps                | 845      |
| nupdates           | 1359000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6795000  |
| value_loss         | 4.47e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.788    |
| fps                | 845      |
| nupdates           | 1359100  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6795500  |
| value_loss         | 1.48e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.499    |
| fps                | 845      |
| nupdates           | 1359200  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6796000  |
| value_loss         | 0.000146 |
---------------------------------
---------------------------------
| explained_variance | -0.743   |
| fps                | 845      |
| nupdates           | 1359300  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.225    |
| fps                | 845      |
| nupdates           | 1362000  |
| policy_entropy     | 2.04     |
| total_timesteps    | 6810000  |
| value_loss         | 1.98e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.398   |
| fps                | 845      |
| nupdates           | 1362100  |
| policy_entropy     | 2.02     |
| total_timesteps    | 6810500  |
| value_loss         | 0.000539 |
---------------------------------
---------------------------------
| explained_variance | 0.98     |
| fps                | 845      |
| nupdates           | 1362200  |
| policy_entropy     | 1.95     |
| total_timesteps    | 6811000  |
| value_loss         | 1.07e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.536   |
| fps                | 845      |
| nupdates           | 1362300  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -0.739   |
| fps                | 844      |
| nupdates           | 1365100  |
| policy_entropy     | 2.02     |
| total_timesteps    | 6825500  |
| value_loss         | 0.000222 |
---------------------------------
---------------------------------
| explained_variance | 0.882    |
| fps                | 844      |
| nupdates           | 1365200  |
| policy_entropy     | 2.03     |
| total_timesteps    | 6826000  |
| value_loss         | 4.11e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.959    |
| fps                | 844      |
| nupdates           | 1365300  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6826500  |
| value_loss         | 7.83e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.744    |
| fps                | 844      |
| nupdates           | 1365400  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.963    |
| fps                | 845      |
| nupdates           | 1368200  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6841000  |
| value_loss         | 1.38e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.695    |
| fps                | 845      |
| nupdates           | 1368300  |
| policy_entropy     | 2.08     |
| total_timesteps    | 6841500  |
| value_loss         | 3.76e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.986    |
| fps                | 845      |
| nupdates           | 1368400  |
| policy_entropy     | 2.08     |
| total_timesteps    | 6842000  |
| value_loss         | 3.46e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.356    |
| fps                | 845      |
| nupdates           | 1368500  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.996    |
| fps                | 845      |
| nupdates           | 1371200  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6856000  |
| value_loss         | 7.42e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.683    |
| fps                | 845      |
| nupdates           | 1371300  |
| policy_entropy     | 1.8      |
| total_timesteps    | 6856500  |
| value_loss         | 5.4e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.561    |
| fps                | 845      |
| nupdates           | 1371400  |
| policy_entropy     | 2.03     |
| total_timesteps    | 6857000  |
| value_loss         | 0.000106 |
---------------------------------
---------------------------------
| explained_variance | -0.0823  |
| fps                | 845      |
| nupdates           | 1371500  |
| policy_entropy     | 2        |
| total_timest

---------------------------------
| explained_variance | 0.962    |
| fps                | 845      |
| nupdates           | 1374300  |
| policy_entropy     | 2.04     |
| total_timesteps    | 6871500  |
| value_loss         | 6.14e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.599    |
| fps                | 845      |
| nupdates           | 1374400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6872000  |
| value_loss         | 2.83e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.41    |
| fps                | 845      |
| nupdates           | 1374500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6872500  |
| value_loss         | 0.000637 |
---------------------------------
---------------------------------
| explained_variance | 0.867    |
| fps                | 845      |
| nupdates           | 1374600  |
| policy_entropy     | 1.76     |
| total_timest

---------------------------------
| explained_variance | 0.777    |
| fps                | 845      |
| nupdates           | 1377300  |
| policy_entropy     | 2.08     |
| total_timesteps    | 6886500  |
| value_loss         | 9.7e-06  |
---------------------------------
---------------------------------
| explained_variance | 0.884    |
| fps                | 845      |
| nupdates           | 1377400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6887000  |
| value_loss         | 1.19e-05 |
---------------------------------
---------------------------------
| explained_variance | -20.7    |
| fps                | 845      |
| nupdates           | 1377500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6887500  |
| value_loss         | 0.00216  |
---------------------------------
---------------------------------
| explained_variance | -0.466   |
| fps                | 845      |
| nupdates           | 1377600  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.369    |
| fps                | 845      |
| nupdates           | 1380300  |
| policy_entropy     | 1.94     |
| total_timesteps    | 6901500  |
| value_loss         | 0.149    |
---------------------------------
---------------------------------
| explained_variance | -5.61    |
| fps                | 845      |
| nupdates           | 1380400  |
| policy_entropy     | 2.08     |
| total_timesteps    | 6902000  |
| value_loss         | 0.00271  |
---------------------------------
---------------------------------
| explained_variance | 0.715    |
| fps                | 845      |
| nupdates           | 1380500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6902500  |
| value_loss         | 4.3e-05  |
---------------------------------
---------------------------------
| explained_variance | -0.361   |
| fps                | 845      |
| nupdates           | 1380600  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.935    |
| fps                | 845      |
| nupdates           | 1383400  |
| policy_entropy     | 2.04     |
| total_timesteps    | 6917000  |
| value_loss         | 1.76e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.447    |
| fps                | 845      |
| nupdates           | 1383500  |
| policy_entropy     | 2.02     |
| total_timesteps    | 6917500  |
| value_loss         | 0.000189 |
---------------------------------
---------------------------------
| explained_variance | 0.0433   |
| fps                | 845      |
| nupdates           | 1383600  |
| policy_entropy     | 2.03     |
| total_timesteps    | 6918000  |
| value_loss         | 0.000222 |
---------------------------------
---------------------------------
| explained_variance | 0.873    |
| fps                | 845      |
| nupdates           | 1383700  |
| policy_entropy     | 1.81     |
| total_timest

---------------------------------
| explained_variance | 0.761    |
| fps                | 845      |
| nupdates           | 1386400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6932000  |
| value_loss         | 4.36e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.174    |
| fps                | 845      |
| nupdates           | 1386500  |
| policy_entropy     | 2.08     |
| total_timesteps    | 6932500  |
| value_loss         | 0.000342 |
---------------------------------
---------------------------------
| explained_variance | 0.985    |
| fps                | 845      |
| nupdates           | 1386600  |
| policy_entropy     | 2.02     |
| total_timesteps    | 6933000  |
| value_loss         | 4.56e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.806    |
| fps                | 845      |
| nupdates           | 1386700  |
| policy_entropy     | 1.81     |
| total_timest

---------------------------------
| explained_variance | 0.886    |
| fps                | 846      |
| nupdates           | 1389500  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6947500  |
| value_loss         | 3.74e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.86     |
| fps                | 846      |
| nupdates           | 1389600  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6948000  |
| value_loss         | 1.31e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.538    |
| fps                | 846      |
| nupdates           | 1389700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6948500  |
| value_loss         | 0.000348 |
---------------------------------
---------------------------------
| explained_variance | 0.445    |
| fps                | 846      |
| nupdates           | 1389800  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.652   |
| fps                | 846      |
| nupdates           | 1392500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6962500  |
| value_loss         | 0.000153 |
---------------------------------
---------------------------------
| explained_variance | 0.463    |
| fps                | 846      |
| nupdates           | 1392600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6963000  |
| value_loss         | 6.99e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.675    |
| fps                | 846      |
| nupdates           | 1392700  |
| policy_entropy     | 1.6      |
| total_timesteps    | 6963500  |
| value_loss         | 0.000447 |
---------------------------------
---------------------------------
| explained_variance | 0.985    |
| fps                | 846      |
| nupdates           | 1392800  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.0384  |
| fps                | 846      |
| nupdates           | 1395500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6977500  |
| value_loss         | 0.000374 |
---------------------------------
---------------------------------
| explained_variance | 0.47     |
| fps                | 846      |
| nupdates           | 1395600  |
| policy_entropy     | 1.57     |
| total_timesteps    | 6978000  |
| value_loss         | 0.0002   |
---------------------------------
---------------------------------
| explained_variance | 0.836    |
| fps                | 846      |
| nupdates           | 1395700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6978500  |
| value_loss         | 2.98e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.935    |
| fps                | 846      |
| nupdates           | 1395800  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -1.5     |
| fps                | 846      |
| nupdates           | 1398600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6993000  |
| value_loss         | 0.000265 |
---------------------------------
---------------------------------
| explained_variance | -0.265   |
| fps                | 846      |
| nupdates           | 1398700  |
| policy_entropy     | 1.49     |
| total_timesteps    | 6993500  |
| value_loss         | 0.88     |
---------------------------------
---------------------------------
| explained_variance | -0.738   |
| fps                | 846      |
| nupdates           | 1398800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6994000  |
| value_loss         | 0.000256 |
---------------------------------
---------------------------------
| explained_variance | 0.829    |
| fps                | 846      |
| nupdates           | 1398900  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -1.48    |
| fps                | 846      |
| nupdates           | 1401600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7008000  |
| value_loss         | 2.74e-05 |
---------------------------------
---------------------------------
| explained_variance | -66.7    |
| fps                | 846      |
| nupdates           | 1401700  |
| policy_entropy     | 2.03     |
| total_timesteps    | 7008500  |
| value_loss         | 0.00436  |
---------------------------------
---------------------------------
| explained_variance | -212     |
| fps                | 846      |
| nupdates           | 1401800  |
| policy_entropy     | 1.64     |
| total_timesteps    | 7009000  |
| value_loss         | 0.0145   |
---------------------------------
---------------------------------
| explained_variance | 0.764    |
| fps                | 846      |
| nupdates           | 1401900  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.603    |
| fps                | 846      |
| nupdates           | 1404700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7023500  |
| value_loss         | 6.76e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.498    |
| fps                | 846      |
| nupdates           | 1404800  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7024000  |
| value_loss         | 0.000592 |
---------------------------------
---------------------------------
| explained_variance | 0.701    |
| fps                | 846      |
| nupdates           | 1404900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7024500  |
| value_loss         | 7.29e-05 |
---------------------------------
Eval num_timesteps=7025000, episode_reward=-5.00 +/- 0.00
Episode length: 573.40 +/- 69.68
---------------------------------
| explained_variance | -0.422   |
| fps                | 84

---------------------------------
| explained_variance | 0.451    |
| fps                | 846      |
| nupdates           | 1407700  |
| policy_entropy     | 2.03     |
| total_timesteps    | 7038500  |
| value_loss         | 0.000282 |
---------------------------------
---------------------------------
| explained_variance | 0.99     |
| fps                | 846      |
| nupdates           | 1407800  |
| policy_entropy     | 2.08     |
| total_timesteps    | 7039000  |
| value_loss         | 1.14e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.0484   |
| fps                | 846      |
| nupdates           | 1407900  |
| policy_entropy     | 1.82     |
| total_timesteps    | 7039500  |
| value_loss         | 0.000759 |
---------------------------------
---------------------------------
| explained_variance | 0.892    |
| fps                | 846      |
| nupdates           | 1408000  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.788    |
| fps                | 846      |
| nupdates           | 1410700  |
| policy_entropy     | 2.04     |
| total_timesteps    | 7053500  |
| value_loss         | 4.02e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.434    |
| fps                | 846      |
| nupdates           | 1410800  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7054000  |
| value_loss         | 8.78e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.868    |
| fps                | 846      |
| nupdates           | 1410900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7054500  |
| value_loss         | 0.000223 |
---------------------------------
---------------------------------
| explained_variance | -3.62    |
| fps                | 846      |
| nupdates           | 1411000  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.82     |
| fps                | 846      |
| nupdates           | 1413800  |
| policy_entropy     | 2.04     |
| total_timesteps    | 7069000  |
| value_loss         | 0.000181 |
---------------------------------
---------------------------------
| explained_variance | -0.165   |
| fps                | 846      |
| nupdates           | 1413900  |
| policy_entropy     | 2.04     |
| total_timesteps    | 7069500  |
| value_loss         | 0.000146 |
---------------------------------
---------------------------------
| explained_variance | 0.968    |
| fps                | 846      |
| nupdates           | 1414000  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7070000  |
| value_loss         | 2.24e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.585   |
| fps                | 847      |
| nupdates           | 1414100  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -5.44    |
| fps                | 846      |
| nupdates           | 1416800  |
| policy_entropy     | 2.04     |
| total_timesteps    | 7084000  |
| value_loss         | 0.00061  |
---------------------------------
---------------------------------
| explained_variance | 0.564    |
| fps                | 846      |
| nupdates           | 1416900  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7084500  |
| value_loss         | 0.000383 |
---------------------------------
---------------------------------
| explained_variance | 0.933    |
| fps                | 846      |
| nupdates           | 1417000  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7085000  |
| value_loss         | 6.16e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.168    |
| fps                | 846      |
| nupdates           | 1417100  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.89     |
| fps                | 847      |
| nupdates           | 1419900  |
| policy_entropy     | 2.08     |
| total_timesteps    | 7099500  |
| value_loss         | 2.71e-05 |
---------------------------------
Eval num_timesteps=7100000, episode_reward=-4.70 +/- 0.46
Episode length: 557.90 +/- 91.60
---------------------------------
| explained_variance | 0.992    |
| fps                | 846      |
| nupdates           | 1420000  |
| policy_entropy     | 2        |
| total_timesteps    | 7100000  |
| value_loss         | 2.99e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.805    |
| fps                | 846      |
| nupdates           | 1420100  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7100500  |
| value_loss         | 0.000154 |
---------------------------------
---------------------------------
| explained_variance | -42.4    |
| fps                | 84

---------------------------------
| explained_variance | 0.411    |
| fps                | 847      |
| nupdates           | 1422900  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7114500  |
| value_loss         | 0.153    |
---------------------------------
---------------------------------
| explained_variance | 0.82     |
| fps                | 847      |
| nupdates           | 1423000  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7115000  |
| value_loss         | 3.3e-05  |
---------------------------------
---------------------------------
| explained_variance | -0.366   |
| fps                | 847      |
| nupdates           | 1423100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7115500  |
| value_loss         | 0.000336 |
---------------------------------
---------------------------------
| explained_variance | 0.984    |
| fps                | 847      |
| nupdates           | 1423200  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.57     |
| fps                | 847      |
| nupdates           | 1425900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7129500  |
| value_loss         | 2.47e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.811    |
| fps                | 847      |
| nupdates           | 1426000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7130000  |
| value_loss         | 8.73e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.967    |
| fps                | 847      |
| nupdates           | 1426100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7130500  |
| value_loss         | 2.52e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.272    |
| fps                | 847      |
| nupdates           | 1426200  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.469    |
| fps                | 847      |
| nupdates           | 1429000  |
| policy_entropy     | 2.03     |
| total_timesteps    | 7145000  |
| value_loss         | 0.0001   |
---------------------------------
---------------------------------
| explained_variance | -1.87    |
| fps                | 847      |
| nupdates           | 1429100  |
| policy_entropy     | 2        |
| total_timesteps    | 7145500  |
| value_loss         | 0.000117 |
---------------------------------
---------------------------------
| explained_variance | -4.68    |
| fps                | 847      |
| nupdates           | 1429200  |
| policy_entropy     | 2.03     |
| total_timesteps    | 7146000  |
| value_loss         | 0.000261 |
---------------------------------
---------------------------------
| explained_variance | -4.54    |
| fps                | 847      |
| nupdates           | 1429300  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -1.41    |
| fps                | 847      |
| nupdates           | 1432000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7160000  |
| value_loss         | 2.88e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.23     |
| fps                | 847      |
| nupdates           | 1432100  |
| policy_entropy     | 2.08     |
| total_timesteps    | 7160500  |
| value_loss         | 0.000112 |
---------------------------------
---------------------------------
| explained_variance | -0.614   |
| fps                | 847      |
| nupdates           | 1432200  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7161000  |
| value_loss         | 0.000699 |
---------------------------------
---------------------------------
| explained_variance | 0.75     |
| fps                | 847      |
| nupdates           | 1432300  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.559    |
| fps                | 847      |
| nupdates           | 1435100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7175500  |
| value_loss         | 3e-05    |
---------------------------------
---------------------------------
| explained_variance | 0.885    |
| fps                | 847      |
| nupdates           | 1435200  |
| policy_entropy     | 2.04     |
| total_timesteps    | 7176000  |
| value_loss         | 4.18e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.607   |
| fps                | 847      |
| nupdates           | 1435300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7176500  |
| value_loss         | 0.000229 |
---------------------------------
---------------------------------
| explained_variance | -49.3    |
| fps                | 847      |
| nupdates           | 1435400  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -0.47    |
| fps                | 847      |
| nupdates           | 1438200  |
| policy_entropy     | 2.04     |
| total_timesteps    | 7191000  |
| value_loss         | 0.000275 |
---------------------------------
---------------------------------
| explained_variance | -7.22    |
| fps                | 847      |
| nupdates           | 1438300  |
| policy_entropy     | 2.08     |
| total_timesteps    | 7191500  |
| value_loss         | 0.000217 |
---------------------------------
---------------------------------
| explained_variance | -11.2    |
| fps                | 847      |
| nupdates           | 1438400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7192000  |
| value_loss         | 0.00794  |
---------------------------------
---------------------------------
| explained_variance | 0.572    |
| fps                | 847      |
| nupdates           | 1438500  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.859    |
| fps                | 847      |
| nupdates           | 1441200  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7206000  |
| value_loss         | 6.81e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.386    |
| fps                | 847      |
| nupdates           | 1441300  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7206500  |
| value_loss         | 5.01e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.896    |
| fps                | 847      |
| nupdates           | 1441400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7207000  |
| value_loss         | 2.15e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.52    |
| fps                | 847      |
| nupdates           | 1441500  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.782    |
| fps                | 847      |
| nupdates           | 1444300  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7221500  |
| value_loss         | 0.000194 |
---------------------------------
---------------------------------
| explained_variance | 0.313    |
| fps                | 847      |
| nupdates           | 1444400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7222000  |
| value_loss         | 3.81e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.96     |
| fps                | 847      |
| nupdates           | 1444500  |
| policy_entropy     | 2.08     |
| total_timesteps    | 7222500  |
| value_loss         | 5.68e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.983    |
| fps                | 847      |
| nupdates           | 1444600  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -30.9    |
| fps                | 847      |
| nupdates           | 1447300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7236500  |
| value_loss         | 0.0069   |
---------------------------------
---------------------------------
| explained_variance | 0.999    |
| fps                | 847      |
| nupdates           | 1447400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7237000  |
| value_loss         | 7.39e-08 |
---------------------------------
---------------------------------
| explained_variance | 0.993    |
| fps                | 847      |
| nupdates           | 1447500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7237500  |
| value_loss         | 9.69e-07 |
---------------------------------
---------------------------------
| explained_variance | 0.943    |
| fps                | 847      |
| nupdates           | 1447600  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.995    |
| fps                | 847      |
| nupdates           | 1450300  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7251500  |
| value_loss         | 7.93e-07 |
---------------------------------
---------------------------------
| explained_variance | 0.568    |
| fps                | 847      |
| nupdates           | 1450400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7252000  |
| value_loss         | 0.000284 |
---------------------------------
---------------------------------
| explained_variance | 0.613    |
| fps                | 847      |
| nupdates           | 1450500  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7252500  |
| value_loss         | 1.04e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.22    |
| fps                | 847      |
| nupdates           | 1450600  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.958    |
| fps                | 848      |
| nupdates           | 1453400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7267000  |
| value_loss         | 5.26e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.365    |
| fps                | 848      |
| nupdates           | 1453500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7267500  |
| value_loss         | 0.000225 |
---------------------------------
---------------------------------
| explained_variance | 0.748    |
| fps                | 848      |
| nupdates           | 1453600  |
| policy_entropy     | 2.02     |
| total_timesteps    | 7268000  |
| value_loss         | 3.32e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.977    |
| fps                | 848      |
| nupdates           | 1453700  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -5.99    |
| fps                | 847      |
| nupdates           | 1456400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7282000  |
| value_loss         | 0.00181  |
---------------------------------
---------------------------------
| explained_variance | -2.44    |
| fps                | 847      |
| nupdates           | 1456500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7282500  |
| value_loss         | 0.000185 |
---------------------------------
---------------------------------
| explained_variance | 0.737    |
| fps                | 847      |
| nupdates           | 1456600  |
| policy_entropy     | 1.99     |
| total_timesteps    | 7283000  |
| value_loss         | 0.000178 |
---------------------------------
---------------------------------
| explained_variance | -0.579   |
| fps                | 847      |
| nupdates           | 1456700  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -0.589   |
| fps                | 848      |
| nupdates           | 1459500  |
| policy_entropy     | 2.02     |
| total_timesteps    | 7297500  |
| value_loss         | 0.000359 |
---------------------------------
---------------------------------
| explained_variance | 0.196    |
| fps                | 848      |
| nupdates           | 1459600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7298000  |
| value_loss         | 4.19e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.213    |
| fps                | 848      |
| nupdates           | 1459700  |
| policy_entropy     | 2.08     |
| total_timesteps    | 7298500  |
| value_loss         | 0.000299 |
---------------------------------
---------------------------------
| explained_variance | 0.922    |
| fps                | 848      |
| nupdates           | 1459800  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -74.9    |
| fps                | 848      |
| nupdates           | 1462500  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7312500  |
| value_loss         | 0.00958  |
---------------------------------
---------------------------------
| explained_variance | -2.22    |
| fps                | 848      |
| nupdates           | 1462600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7313000  |
| value_loss         | 3.5e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.994    |
| fps                | 848      |
| nupdates           | 1462700  |
| policy_entropy     | 2.08     |
| total_timesteps    | 7313500  |
| value_loss         | 7.07e-06 |
---------------------------------
---------------------------------
| explained_variance | -0.513   |
| fps                | 848      |
| nupdates           | 1462800  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.651    |
| fps                | 848      |
| nupdates           | 1465500  |
| policy_entropy     | 2.08     |
| total_timesteps    | 7327500  |
| value_loss         | 4.34e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.652    |
| fps                | 848      |
| nupdates           | 1465600  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7328000  |
| value_loss         | 0.000223 |
---------------------------------
---------------------------------
| explained_variance | 0.885    |
| fps                | 848      |
| nupdates           | 1465700  |
| policy_entropy     | 1.97     |
| total_timesteps    | 7328500  |
| value_loss         | 1.06e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.027    |
| fps                | 848      |
| nupdates           | 1465800  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -109     |
| fps                | 848      |
| nupdates           | 1468600  |
| policy_entropy     | 2.08     |
| total_timesteps    | 7343000  |
| value_loss         | 0.000992 |
---------------------------------
---------------------------------
| explained_variance | -0.359   |
| fps                | 848      |
| nupdates           | 1468700  |
| policy_entropy     | 2.08     |
| total_timesteps    | 7343500  |
| value_loss         | 0.000321 |
---------------------------------
---------------------------------
| explained_variance | 0.951    |
| fps                | 848      |
| nupdates           | 1468800  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7344000  |
| value_loss         | 4.12e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.917    |
| fps                | 848      |
| nupdates           | 1468900  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.0936   |
| fps                | 848      |
| nupdates           | 1471600  |
| policy_entropy     | 1.53     |
| total_timesteps    | 7358000  |
| value_loss         | 0.904    |
---------------------------------
---------------------------------
| explained_variance | -43      |
| fps                | 848      |
| nupdates           | 1471700  |
| policy_entropy     | 1.94     |
| total_timesteps    | 7358500  |
| value_loss         | 0.00647  |
---------------------------------
---------------------------------
| explained_variance | 0.984    |
| fps                | 848      |
| nupdates           | 1471800  |
| policy_entropy     | 2.03     |
| total_timesteps    | 7359000  |
| value_loss         | 3.35e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.0116   |
| fps                | 848      |
| nupdates           | 1471900  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.167    |
| fps                | 848      |
| nupdates           | 1474700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7373500  |
| value_loss         | 3.02e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.2      |
| fps                | 848      |
| nupdates           | 1474800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7374000  |
| value_loss         | 3.08e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.185    |
| fps                | 848      |
| nupdates           | 1474900  |
| policy_entropy     | 1.9      |
| total_timesteps    | 7374500  |
| value_loss         | 0.312    |
---------------------------------
Eval num_timesteps=7375000, episode_reward=-4.90 +/- 0.30
Episode length: 661.90 +/- 111.40
---------------------------------
| explained_variance | -0.641   |
| fps                | 8

---------------------------------
| explained_variance | 0.991    |
| fps                | 848      |
| nupdates           | 1477700  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7388500  |
| value_loss         | 2.23e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.0984   |
| fps                | 848      |
| nupdates           | 1477800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7389000  |
| value_loss         | 4.88e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.48    |
| fps                | 848      |
| nupdates           | 1477900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7389500  |
| value_loss         | 0.00122  |
---------------------------------
---------------------------------
| explained_variance | 0.101    |
| fps                | 848      |
| nupdates           | 1478000  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.284    |
| fps                | 848      |
| nupdates           | 1480700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7403500  |
| value_loss         | 2.21e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.0957   |
| fps                | 848      |
| nupdates           | 1480800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7404000  |
| value_loss         | 0.000394 |
---------------------------------
---------------------------------
| explained_variance | 0.989    |
| fps                | 848      |
| nupdates           | 1480900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7404500  |
| value_loss         | 6.35e-06 |
---------------------------------
---------------------------------
| explained_variance | -6.14    |
| fps                | 848      |
| nupdates           | 1481000  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.493    |
| fps                | 848      |
| nupdates           | 1483800  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7419000  |
| value_loss         | 0.000339 |
---------------------------------
---------------------------------
| explained_variance | 0.896    |
| fps                | 848      |
| nupdates           | 1483900  |
| policy_entropy     | 2.03     |
| total_timesteps    | 7419500  |
| value_loss         | 1.5e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.87     |
| fps                | 848      |
| nupdates           | 1484000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7420000  |
| value_loss         | 4.15e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.293    |
| fps                | 848      |
| nupdates           | 1484100  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.397    |
| fps                | 848      |
| nupdates           | 1486800  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7434000  |
| value_loss         | 0.000362 |
---------------------------------
---------------------------------
| explained_variance | -0.939   |
| fps                | 848      |
| nupdates           | 1486900  |
| policy_entropy     | 2.02     |
| total_timesteps    | 7434500  |
| value_loss         | 0.00136  |
---------------------------------
---------------------------------
| explained_variance | 0.967    |
| fps                | 848      |
| nupdates           | 1487000  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7435000  |
| value_loss         | 4.49e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.842    |
| fps                | 848      |
| nupdates           | 1487100  |
| policy_entropy     | 2.01     |
| total_timest

---------------------------------
| explained_variance | 0.953    |
| fps                | 848      |
| nupdates           | 1489900  |
| policy_entropy     | 2.02     |
| total_timesteps    | 7449500  |
| value_loss         | 3.97e-05 |
---------------------------------
Eval num_timesteps=7450000, episode_reward=-5.00 +/- 0.00
Episode length: 559.90 +/- 120.27
---------------------------------
| explained_variance | 0.625    |
| fps                | 848      |
| nupdates           | 1490000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7450000  |
| value_loss         | 2.99e-06 |
---------------------------------
---------------------------------
| explained_variance | -7.47    |
| fps                | 848      |
| nupdates           | 1490100  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7450500  |
| value_loss         | 0.00237  |
---------------------------------
---------------------------------
| explained_variance | 0.992    |
| fps                | 8

---------------------------------
| explained_variance | 0.0836   |
| fps                | 848      |
| nupdates           | 1492900  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7464500  |
| value_loss         | 7.64e-05 |
---------------------------------
---------------------------------
| explained_variance | -3.3     |
| fps                | 848      |
| nupdates           | 1493000  |
| policy_entropy     | 2.02     |
| total_timesteps    | 7465000  |
| value_loss         | 5.77e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.197   |
| fps                | 848      |
| nupdates           | 1493100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7465500  |
| value_loss         | 0.000243 |
---------------------------------
---------------------------------
| explained_variance | 0.625    |
| fps                | 848      |
| nupdates           | 1493200  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -2.52    |
| fps                | 848      |
| nupdates           | 1495900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7479500  |
| value_loss         | 0.000276 |
---------------------------------
---------------------------------
| explained_variance | 0.719    |
| fps                | 848      |
| nupdates           | 1496000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7480000  |
| value_loss         | 0.000263 |
---------------------------------
---------------------------------
| explained_variance | -3.05    |
| fps                | 848      |
| nupdates           | 1496100  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7480500  |
| value_loss         | 0.00107  |
---------------------------------
---------------------------------
| explained_variance | 0.583    |
| fps                | 848      |
| nupdates           | 1496200  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -3.72    |
| fps                | 848      |
| nupdates           | 1499000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7495000  |
| value_loss         | 6.81e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.0843  |
| fps                | 848      |
| nupdates           | 1499100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7495500  |
| value_loss         | 0.0003   |
---------------------------------
---------------------------------
| explained_variance | 0.913    |
| fps                | 848      |
| nupdates           | 1499200  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7496000  |
| value_loss         | 3.69e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.0958   |
| fps                | 848      |
| nupdates           | 1499300  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.964    |
| fps                | 848      |
| nupdates           | 1502000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7510000  |
| value_loss         | 6.71e-06 |
---------------------------------
---------------------------------
| explained_variance | -9.16    |
| fps                | 848      |
| nupdates           | 1502100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7510500  |
| value_loss         | 0.00311  |
---------------------------------
---------------------------------
| explained_variance | 0.6      |
| fps                | 848      |
| nupdates           | 1502200  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7511000  |
| value_loss         | 0.00014  |
---------------------------------
---------------------------------
| explained_variance | -3.74    |
| fps                | 848      |
| nupdates           | 1502300  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.963    |
| fps                | 848      |
| nupdates           | 1505100  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7525500  |
| value_loss         | 2.84e-06 |
---------------------------------
---------------------------------
| explained_variance | -0.326   |
| fps                | 848      |
| nupdates           | 1505200  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7526000  |
| value_loss         | 9.56e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.273    |
| fps                | 848      |
| nupdates           | 1505300  |
| policy_entropy     | 2.01     |
| total_timesteps    | 7526500  |
| value_loss         | 0.000741 |
---------------------------------
---------------------------------
| explained_variance | -12.4    |
| fps                | 848      |
| nupdates           | 1505400  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -1       |
| fps                | 848      |
| nupdates           | 1508200  |
| policy_entropy     | 2.04     |
| total_timesteps    | 7541000  |
| value_loss         | 9.23e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.0148   |
| fps                | 848      |
| nupdates           | 1508300  |
| policy_entropy     | 2.01     |
| total_timesteps    | 7541500  |
| value_loss         | 0.156    |
---------------------------------
---------------------------------
| explained_variance | -0.288   |
| fps                | 848      |
| nupdates           | 1508400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7542000  |
| value_loss         | 2.54e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.022   |
| fps                | 848      |
| nupdates           | 1508500  |
| policy_entropy     | 1.7      |
| total_timest

---------------------------------
| explained_variance | -1.43    |
| fps                | 848      |
| nupdates           | 1511200  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7556000  |
| value_loss         | 0.00012  |
---------------------------------
---------------------------------
| explained_variance | 0.56     |
| fps                | 848      |
| nupdates           | 1511300  |
| policy_entropy     | 1.77     |
| total_timesteps    | 7556500  |
| value_loss         | 2.85e-05 |
---------------------------------
---------------------------------
| explained_variance | -40.9    |
| fps                | 848      |
| nupdates           | 1511400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7557000  |
| value_loss         | 0.00572  |
---------------------------------
---------------------------------
| explained_variance | -0.0753  |
| fps                | 848      |
| nupdates           | 1511500  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.898    |
| fps                | 848      |
| nupdates           | 1514300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7571500  |
| value_loss         | 2.94e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.233    |
| fps                | 848      |
| nupdates           | 1514400  |
| policy_entropy     | 2.01     |
| total_timesteps    | 7572000  |
| value_loss         | 0.000115 |
---------------------------------
---------------------------------
| explained_variance | -7.47    |
| fps                | 848      |
| nupdates           | 1514500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7572500  |
| value_loss         | 0.00112  |
---------------------------------
---------------------------------
| explained_variance | 0.963    |
| fps                | 848      |
| nupdates           | 1514600  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.797    |
| fps                | 848      |
| nupdates           | 1517300  |
| policy_entropy     | 2.04     |
| total_timesteps    | 7586500  |
| value_loss         | 6.81e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.933    |
| fps                | 848      |
| nupdates           | 1517400  |
| policy_entropy     | 2.08     |
| total_timesteps    | 7587000  |
| value_loss         | 5.76e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.349    |
| fps                | 848      |
| nupdates           | 1517500  |
| policy_entropy     | 2.02     |
| total_timesteps    | 7587500  |
| value_loss         | 0.171    |
---------------------------------
---------------------------------
| explained_variance | 0.997    |
| fps                | 848      |
| nupdates           | 1517600  |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | 0.958    |
| fps                | 848      |
| nupdates           | 1520300  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7601500  |
| value_loss         | 2e-05    |
---------------------------------
---------------------------------
| explained_variance | 0.197    |
| fps                | 848      |
| nupdates           | 1520400  |
| policy_entropy     | 2.03     |
| total_timesteps    | 7602000  |
| value_loss         | 5.44e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.985    |
| fps                | 848      |
| nupdates           | 1520500  |
| policy_entropy     | 2.01     |
| total_timesteps    | 7602500  |
| value_loss         | 1.6e-05  |
---------------------------------
---------------------------------
| explained_variance | -4.92    |
| fps                | 848      |
| nupdates           | 1520600  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.999    |
| fps                | 848      |
| nupdates           | 1523400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7617000  |
| value_loss         | 1.53e-06 |
---------------------------------
---------------------------------
| explained_variance | -2.75    |
| fps                | 848      |
| nupdates           | 1523500  |
| policy_entropy     | 2.02     |
| total_timesteps    | 7617500  |
| value_loss         | 0.000233 |
---------------------------------
---------------------------------
| explained_variance | 0.681    |
| fps                | 848      |
| nupdates           | 1523600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7618000  |
| value_loss         | 4.72e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.996   |
| fps                | 848      |
| nupdates           | 1523700  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.869    |
| fps                | 848      |
| nupdates           | 1526400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7632000  |
| value_loss         | 2.43e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.963    |
| fps                | 848      |
| nupdates           | 1526500  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7632500  |
| value_loss         | 6.05e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.703    |
| fps                | 848      |
| nupdates           | 1526600  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7633000  |
| value_loss         | 3.33e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.537    |
| fps                | 848      |
| nupdates           | 1526700  |
| policy_entropy     | 2.01     |
| total_timest

---------------------------------
| explained_variance | 0.7      |
| fps                | 848      |
| nupdates           | 1529500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7647500  |
| value_loss         | 6.32e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.992    |
| fps                | 848      |
| nupdates           | 1529600  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7648000  |
| value_loss         | 1.41e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.157    |
| fps                | 849      |
| nupdates           | 1529700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7648500  |
| value_loss         | 0.000254 |
---------------------------------
---------------------------------
| explained_variance | 0.92     |
| fps                | 849      |
| nupdates           | 1529800  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.918    |
| fps                | 848      |
| nupdates           | 1532500  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7662500  |
| value_loss         | 3.81e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.988    |
| fps                | 848      |
| nupdates           | 1532600  |
| policy_entropy     | 1.97     |
| total_timesteps    | 7663000  |
| value_loss         | 1.87e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.77     |
| fps                | 848      |
| nupdates           | 1532700  |
| policy_entropy     | 1.99     |
| total_timesteps    | 7663500  |
| value_loss         | 0.000545 |
---------------------------------
---------------------------------
| explained_variance | 0.983    |
| fps                | 848      |
| nupdates           | 1532800  |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | 0.138    |
| fps                | 848      |
| nupdates           | 1535500  |
| policy_entropy     | 1.99     |
| total_timesteps    | 7677500  |
| value_loss         | 0.000125 |
---------------------------------
---------------------------------
| explained_variance | 0.905    |
| fps                | 848      |
| nupdates           | 1535600  |
| policy_entropy     | 2.01     |
| total_timesteps    | 7678000  |
| value_loss         | 1.32e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.31    |
| fps                | 848      |
| nupdates           | 1535700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7678500  |
| value_loss         | 0.000993 |
---------------------------------
---------------------------------
| explained_variance | -12.9    |
| fps                | 848      |
| nupdates           | 1535800  |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | 0.302    |
| fps                | 849      |
| nupdates           | 1538600  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7693000  |
| value_loss         | 3.6e-05  |
---------------------------------
---------------------------------
| explained_variance | -2.56    |
| fps                | 849      |
| nupdates           | 1538700  |
| policy_entropy     | 1.98     |
| total_timesteps    | 7693500  |
| value_loss         | 0.00259  |
---------------------------------
---------------------------------
| explained_variance | 0.955    |
| fps                | 849      |
| nupdates           | 1538800  |
| policy_entropy     | 2.03     |
| total_timesteps    | 7694000  |
| value_loss         | 6.48e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.217    |
| fps                | 849      |
| nupdates           | 1538900  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -0.485   |
| fps                | 848      |
| nupdates           | 1541600  |
| policy_entropy     | 1.93     |
| total_timesteps    | 7708000  |
| value_loss         | 0.00048  |
---------------------------------
---------------------------------
| explained_variance | -0.437   |
| fps                | 848      |
| nupdates           | 1541700  |
| policy_entropy     | 2.04     |
| total_timesteps    | 7708500  |
| value_loss         | 0.000605 |
---------------------------------
---------------------------------
| explained_variance | 0.889    |
| fps                | 848      |
| nupdates           | 1541800  |
| policy_entropy     | 2.02     |
| total_timesteps    | 7709000  |
| value_loss         | 1.27e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.502   |
| fps                | 848      |
| nupdates           | 1541900  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.0721   |
| fps                | 849      |
| nupdates           | 1544700  |
| policy_entropy     | 2.04     |
| total_timesteps    | 7723500  |
| value_loss         | 0.000184 |
---------------------------------
---------------------------------
| explained_variance | 0.489    |
| fps                | 849      |
| nupdates           | 1544800  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7724000  |
| value_loss         | 0.000335 |
---------------------------------
---------------------------------
| explained_variance | 0.13     |
| fps                | 849      |
| nupdates           | 1544900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7724500  |
| value_loss         | 7.72e-05 |
---------------------------------
Eval num_timesteps=7725000, episode_reward=-4.80 +/- 0.40
Episode length: 650.60 +/- 111.86
---------------------------------
| explained_variance | -2.26    |
| fps                | 8

---------------------------------
| explained_variance | 0.689    |
| fps                | 849      |
| nupdates           | 1547700  |
| policy_entropy     | 2.01     |
| total_timesteps    | 7738500  |
| value_loss         | 0.000299 |
---------------------------------
---------------------------------
| explained_variance | 0.452    |
| fps                | 849      |
| nupdates           | 1547800  |
| policy_entropy     | 2.04     |
| total_timesteps    | 7739000  |
| value_loss         | 4.27e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.16    |
| fps                | 849      |
| nupdates           | 1547900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7739500  |
| value_loss         | 2.7e-05  |
---------------------------------
---------------------------------
| explained_variance | -3       |
| fps                | 849      |
| nupdates           | 1548000  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.747    |
| fps                | 849      |
| nupdates           | 1550700  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7753500  |
| value_loss         | 5.14e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.0259  |
| fps                | 849      |
| nupdates           | 1550800  |
| policy_entropy     | 2.03     |
| total_timesteps    | 7754000  |
| value_loss         | 0.000396 |
---------------------------------
---------------------------------
| explained_variance | 0.999    |
| fps                | 849      |
| nupdates           | 1550900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7754500  |
| value_loss         | 3.95e-07 |
---------------------------------
---------------------------------
| explained_variance | 0.942    |
| fps                | 849      |
| nupdates           | 1551000  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.77    |
| fps                | 849      |
| nupdates           | 1553800  |
| policy_entropy     | 2.02     |
| total_timesteps    | 7769000  |
| value_loss         | 4.01e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.361    |
| fps                | 849      |
| nupdates           | 1553900  |
| policy_entropy     | 2.04     |
| total_timesteps    | 7769500  |
| value_loss         | 3.95e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.193    |
| fps                | 849      |
| nupdates           | 1554000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7770000  |
| value_loss         | 5.21e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.737    |
| fps                | 849      |
| nupdates           | 1554100  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.0893   |
| fps                | 849      |
| nupdates           | 1556800  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7784000  |
| value_loss         | 0.000413 |
---------------------------------
---------------------------------
| explained_variance | -0.0832  |
| fps                | 849      |
| nupdates           | 1556900  |
| policy_entropy     | 2.02     |
| total_timesteps    | 7784500  |
| value_loss         | 0.0944   |
---------------------------------
---------------------------------
| explained_variance | -0.441   |
| fps                | 849      |
| nupdates           | 1557000  |
| policy_entropy     | 1.99     |
| total_timesteps    | 7785000  |
| value_loss         | 0.000182 |
---------------------------------
---------------------------------
| explained_variance | -0.00836 |
| fps                | 849      |
| nupdates           | 1557100  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.943    |
| fps                | 849      |
| nupdates           | 1559900  |
| policy_entropy     | 1.92     |
| total_timesteps    | 7799500  |
| value_loss         | 0.000132 |
---------------------------------
Eval num_timesteps=7800000, episode_reward=-5.00 +/- 0.00
Episode length: 589.20 +/- 122.52
---------------------------------
| explained_variance | 0.954    |
| fps                | 849      |
| nupdates           | 1560000  |
| policy_entropy     | 1.98     |
| total_timesteps    | 7800000  |
| value_loss         | 0.000131 |
---------------------------------
---------------------------------
| explained_variance | 0.575    |
| fps                | 849      |
| nupdates           | 1560100  |
| policy_entropy     | 2.04     |
| total_timesteps    | 7800500  |
| value_loss         | 0.000196 |
---------------------------------
---------------------------------
| explained_variance | -22.6    |
| fps                | 8

---------------------------------
| explained_variance | -0.922   |
| fps                | 849      |
| nupdates           | 1562900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7814500  |
| value_loss         | 0.000202 |
---------------------------------
---------------------------------
| explained_variance | 0.0149   |
| fps                | 849      |
| nupdates           | 1563000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7815000  |
| value_loss         | 0.000534 |
---------------------------------
---------------------------------
| explained_variance | -14.2    |
| fps                | 849      |
| nupdates           | 1563100  |
| policy_entropy     | 2.04     |
| total_timesteps    | 7815500  |
| value_loss         | 0.000958 |
---------------------------------
---------------------------------
| explained_variance | 0.95     |
| fps                | 849      |
| nupdates           | 1563200  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.324    |
| fps                | 849      |
| nupdates           | 1565900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7829500  |
| value_loss         | 0.000195 |
---------------------------------
---------------------------------
| explained_variance | 0.996    |
| fps                | 849      |
| nupdates           | 1566000  |
| policy_entropy     | 1.98     |
| total_timesteps    | 7830000  |
| value_loss         | 6.46e-07 |
---------------------------------
---------------------------------
| explained_variance | -2.6     |
| fps                | 849      |
| nupdates           | 1566100  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7830500  |
| value_loss         | 0.000282 |
---------------------------------
---------------------------------
| explained_variance | 0.718    |
| fps                | 849      |
| nupdates           | 1566200  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -0.954   |
| fps                | 849      |
| nupdates           | 1569000  |
| policy_entropy     | 2.08     |
| total_timesteps    | 7845000  |
| value_loss         | 0.000113 |
---------------------------------
---------------------------------
| explained_variance | 0.955    |
| fps                | 849      |
| nupdates           | 1569100  |
| policy_entropy     | 2.02     |
| total_timesteps    | 7845500  |
| value_loss         | 6.74e-05 |
---------------------------------
---------------------------------
| explained_variance | -13.2    |
| fps                | 849      |
| nupdates           | 1569200  |
| policy_entropy     | 2.01     |
| total_timesteps    | 7846000  |
| value_loss         | 0.00323  |
---------------------------------
---------------------------------
| explained_variance | 0.938    |
| fps                | 849      |
| nupdates           | 1569300  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -190     |
| fps                | 849      |
| nupdates           | 1572000  |
| policy_entropy     | 2.03     |
| total_timesteps    | 7860000  |
| value_loss         | 0.0273   |
---------------------------------
---------------------------------
| explained_variance | 0.929    |
| fps                | 849      |
| nupdates           | 1572100  |
| policy_entropy     | 2.02     |
| total_timesteps    | 7860500  |
| value_loss         | 8.29e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.623    |
| fps                | 849      |
| nupdates           | 1572200  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7861000  |
| value_loss         | 7.96e-05 |
---------------------------------
---------------------------------
| explained_variance | -7.37    |
| fps                | 849      |
| nupdates           | 1572300  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.743    |
| fps                | 849      |
| nupdates           | 1575100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7875500  |
| value_loss         | 1.14e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.993    |
| fps                | 849      |
| nupdates           | 1575200  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7876000  |
| value_loss         | 8.7e-06  |
---------------------------------
---------------------------------
| explained_variance | -1.89    |
| fps                | 849      |
| nupdates           | 1575300  |
| policy_entropy     | 2.08     |
| total_timesteps    | 7876500  |
| value_loss         | 0.00276  |
---------------------------------
---------------------------------
| explained_variance | -0.682   |
| fps                | 849      |
| nupdates           | 1575400  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -11.1    |
| fps                | 849      |
| nupdates           | 1578200  |
| policy_entropy     | 2.03     |
| total_timesteps    | 7891000  |
| value_loss         | 0.00355  |
---------------------------------
---------------------------------
| explained_variance | 0.651    |
| fps                | 849      |
| nupdates           | 1578300  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7891500  |
| value_loss         | 3.52e-06 |
---------------------------------
---------------------------------
| explained_variance | -17.2    |
| fps                | 849      |
| nupdates           | 1578400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7892000  |
| value_loss         | 0.00236  |
---------------------------------
---------------------------------
| explained_variance | 0.618    |
| fps                | 849      |
| nupdates           | 1578500  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -23.8    |
| fps                | 849      |
| nupdates           | 1581200  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7906000  |
| value_loss         | 0.00323  |
---------------------------------
---------------------------------
| explained_variance | -2.59    |
| fps                | 849      |
| nupdates           | 1581300  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7906500  |
| value_loss         | 0.00138  |
---------------------------------
---------------------------------
| explained_variance | 0.648    |
| fps                | 849      |
| nupdates           | 1581400  |
| policy_entropy     | 2.04     |
| total_timesteps    | 7907000  |
| value_loss         | 0.000584 |
---------------------------------
---------------------------------
| explained_variance | 0.886    |
| fps                | 849      |
| nupdates           | 1581500  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.703    |
| fps                | 849      |
| nupdates           | 1584300  |
| policy_entropy     | 2.08     |
| total_timesteps    | 7921500  |
| value_loss         | 5.65e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.0533   |
| fps                | 849      |
| nupdates           | 1584400  |
| policy_entropy     | 2.08     |
| total_timesteps    | 7922000  |
| value_loss         | 3.03e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.179   |
| fps                | 849      |
| nupdates           | 1584500  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7922500  |
| value_loss         | 0.000438 |
---------------------------------
---------------------------------
| explained_variance | 0.948    |
| fps                | 849      |
| nupdates           | 1584600  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.7      |
| fps                | 849      |
| nupdates           | 1587300  |
| policy_entropy     | 2.01     |
| total_timesteps    | 7936500  |
| value_loss         | 0.000233 |
---------------------------------
---------------------------------
| explained_variance | -3.82    |
| fps                | 849      |
| nupdates           | 1587400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7937000  |
| value_loss         | 0.00168  |
---------------------------------
---------------------------------
| explained_variance | -0.18    |
| fps                | 849      |
| nupdates           | 1587500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7937500  |
| value_loss         | 6.16e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.277   |
| fps                | 849      |
| nupdates           | 1587600  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.971    |
| fps                | 849      |
| nupdates           | 1590300  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7951500  |
| value_loss         | 3.88e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.762    |
| fps                | 849      |
| nupdates           | 1590400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7952000  |
| value_loss         | 1.04e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.947    |
| fps                | 849      |
| nupdates           | 1590500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7952500  |
| value_loss         | 5.5e-06  |
---------------------------------
---------------------------------
| explained_variance | 0.84     |
| fps                | 849      |
| nupdates           | 1590600  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.931    |
| fps                | 849      |
| nupdates           | 1593400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7967000  |
| value_loss         | 2.51e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.554    |
| fps                | 849      |
| nupdates           | 1593500  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7967500  |
| value_loss         | 6.97e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.908    |
| fps                | 849      |
| nupdates           | 1593600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7968000  |
| value_loss         | 2.42e-06 |
---------------------------------
---------------------------------
| explained_variance | -0.331   |
| fps                | 849      |
| nupdates           | 1593700  |
| policy_entropy     | 2.02     |
| total_timest

---------------------------------
| explained_variance | -18.3    |
| fps                | 849      |
| nupdates           | 1596400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7982000  |
| value_loss         | 0.0022   |
---------------------------------
---------------------------------
| explained_variance | 0.78     |
| fps                | 849      |
| nupdates           | 1596500  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7982500  |
| value_loss         | 0.000152 |
---------------------------------
---------------------------------
| explained_variance | 0.623    |
| fps                | 849      |
| nupdates           | 1596600  |
| policy_entropy     | 2.08     |
| total_timesteps    | 7983000  |
| value_loss         | 0.000182 |
---------------------------------
---------------------------------
| explained_variance | 0.643    |
| fps                | 849      |
| nupdates           | 1596700  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.684    |
| fps                | 849      |
| nupdates           | 1599500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7997500  |
| value_loss         | 2.03e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.0321   |
| fps                | 849      |
| nupdates           | 1599600  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7998000  |
| value_loss         | 0.000164 |
---------------------------------
---------------------------------
| explained_variance | 0.292    |
| fps                | 849      |
| nupdates           | 1599700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7998500  |
| value_loss         | 0.00039  |
---------------------------------
---------------------------------
| explained_variance | -2.78    |
| fps                | 849      |
| nupdates           | 1599800  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.998    |
| fps                | 849      |
| nupdates           | 1602500  |
| policy_entropy     | 2.03     |
| total_timesteps    | 8012500  |
| value_loss         | 2.72e-07 |
---------------------------------
---------------------------------
| explained_variance | 0.928    |
| fps                | 849      |
| nupdates           | 1602600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8013000  |
| value_loss         | 1.73e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.961    |
| fps                | 849      |
| nupdates           | 1602700  |
| policy_entropy     | 2.08     |
| total_timesteps    | 8013500  |
| value_loss         | 5.97e-06 |
---------------------------------
---------------------------------
| explained_variance | -54.7    |
| fps                | 849      |
| nupdates           | 1602800  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -86.9    |
| fps                | 849      |
| nupdates           | 1605500  |
| policy_entropy     | 2.04     |
| total_timesteps    | 8027500  |
| value_loss         | 0.0114   |
---------------------------------
----------------------------------
| explained_variance | -1.26e+03 |
| fps                | 849       |
| nupdates           | 1605600   |
| policy_entropy     | 2.05      |
| total_timesteps    | 8028000   |
| value_loss         | 0.189     |
----------------------------------
---------------------------------
| explained_variance | -0.439   |
| fps                | 849      |
| nupdates           | 1605700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8028500  |
| value_loss         | 0.000276 |
---------------------------------
---------------------------------
| explained_variance | -0.33    |
| fps                | 849      |
| nupdates           | 1605800  |
| policy_entropy     | 2.06     |
| tota

---------------------------------
| explained_variance | 0.0194   |
| fps                | 849      |
| nupdates           | 1608600  |
| policy_entropy     | 2.03     |
| total_timesteps    | 8043000  |
| value_loss         | 0.000734 |
---------------------------------
---------------------------------
| explained_variance | 0.972    |
| fps                | 849      |
| nupdates           | 1608700  |
| policy_entropy     | 2.05     |
| total_timesteps    | 8043500  |
| value_loss         | 1.72e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.926    |
| fps                | 849      |
| nupdates           | 1608800  |
| policy_entropy     | 2.04     |
| total_timesteps    | 8044000  |
| value_loss         | 5.81e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.652    |
| fps                | 849      |
| nupdates           | 1608900  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -6.82    |
| fps                | 849      |
| nupdates           | 1611600  |
| policy_entropy     | 2.08     |
| total_timesteps    | 8058000  |
| value_loss         | 0.00226  |
---------------------------------
---------------------------------
| explained_variance | 0.911    |
| fps                | 849      |
| nupdates           | 1611700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8058500  |
| value_loss         | 5.5e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.35     |
| fps                | 849      |
| nupdates           | 1611800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8059000  |
| value_loss         | 0.000133 |
---------------------------------
---------------------------------
| explained_variance | -0.505   |
| fps                | 849      |
| nupdates           | 1611900  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.581    |
| fps                | 850      |
| nupdates           | 1614700  |
| policy_entropy     | 2.08     |
| total_timesteps    | 8073500  |
| value_loss         | 2.09e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.972    |
| fps                | 850      |
| nupdates           | 1614800  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8074000  |
| value_loss         | 5.81e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.998    |
| fps                | 850      |
| nupdates           | 1614900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8074500  |
| value_loss         | 1e-05    |
---------------------------------
Eval num_timesteps=8075000, episode_reward=-4.90 +/- 0.30
Episode length: 560.10 +/- 146.16
---------------------------------
| explained_variance | -4.07    |
| fps                | 8

---------------------------------
| explained_variance | -15.9    |
| fps                | 850      |
| nupdates           | 1617700  |
| policy_entropy     | 2.05     |
| total_timesteps    | 8088500  |
| value_loss         | 0.000409 |
---------------------------------
---------------------------------
| explained_variance | 0.902    |
| fps                | 850      |
| nupdates           | 1617800  |
| policy_entropy     | 2.04     |
| total_timesteps    | 8089000  |
| value_loss         | 7.84e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.186   |
| fps                | 850      |
| nupdates           | 1617900  |
| policy_entropy     | 2.03     |
| total_timesteps    | 8089500  |
| value_loss         | 9.1e-05  |
---------------------------------
---------------------------------
| explained_variance | -7.7     |
| fps                | 850      |
| nupdates           | 1618000  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.511    |
| fps                | 850      |
| nupdates           | 1620700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8103500  |
| value_loss         | 0.000109 |
---------------------------------
---------------------------------
| explained_variance | -1.4     |
| fps                | 850      |
| nupdates           | 1620800  |
| policy_entropy     | 2.02     |
| total_timesteps    | 8104000  |
| value_loss         | 0.00179  |
---------------------------------
---------------------------------
| explained_variance | 0.938    |
| fps                | 850      |
| nupdates           | 1620900  |
| policy_entropy     | 2.03     |
| total_timesteps    | 8104500  |
| value_loss         | 2.75e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.456   |
| fps                | 850      |
| nupdates           | 1621000  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -0.231   |
| fps                | 850      |
| nupdates           | 1623800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8119000  |
| value_loss         | 0.000168 |
---------------------------------
----------------------------------
| explained_variance | -1.35e+03 |
| fps                | 850       |
| nupdates           | 1623900   |
| policy_entropy     | 1.82      |
| total_timesteps    | 8119500   |
| value_loss         | 0.0827    |
----------------------------------
---------------------------------
| explained_variance | -6.21    |
| fps                | 850      |
| nupdates           | 1624000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8120000  |
| value_loss         | 0.00326  |
---------------------------------
---------------------------------
| explained_variance | -4.77    |
| fps                | 850      |
| nupdates           | 1624100  |
| policy_entropy     | 2.07     |
| tota

---------------------------------
| explained_variance | -0.228   |
| fps                | 850      |
| nupdates           | 1626800  |
| policy_entropy     | 2.08     |
| total_timesteps    | 8134000  |
| value_loss         | 0.000156 |
---------------------------------
---------------------------------
| explained_variance | 0.702    |
| fps                | 850      |
| nupdates           | 1626900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8134500  |
| value_loss         | 7.86e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.987    |
| fps                | 850      |
| nupdates           | 1627000  |
| policy_entropy     | 2.05     |
| total_timesteps    | 8135000  |
| value_loss         | 3.7e-06  |
---------------------------------
---------------------------------
| explained_variance | -0.00464 |
| fps                | 850      |
| nupdates           | 1627100  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.393    |
| fps                | 850      |
| nupdates           | 1629900  |
| policy_entropy     | 2.05     |
| total_timesteps    | 8149500  |
| value_loss         | 0.00053  |
---------------------------------
Eval num_timesteps=8150000, episode_reward=-4.90 +/- 0.30
Episode length: 603.60 +/- 129.17
---------------------------------
| explained_variance | -0.00103 |
| fps                | 850      |
| nupdates           | 1630000  |
| policy_entropy     | 0.817    |
| total_timesteps    | 8150000  |
| value_loss         | 0.157    |
---------------------------------
---------------------------------
| explained_variance | -1.17    |
| fps                | 850      |
| nupdates           | 1630100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8150500  |
| value_loss         | 5.07e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.269    |
| fps                | 8

---------------------------------
| explained_variance | 0.793    |
| fps                | 850      |
| nupdates           | 1632900  |
| policy_entropy     | 1.82     |
| total_timesteps    | 8164500  |
| value_loss         | 0.0003   |
---------------------------------
---------------------------------
| explained_variance | 0.785    |
| fps                | 850      |
| nupdates           | 1633000  |
| policy_entropy     | 2.05     |
| total_timesteps    | 8165000  |
| value_loss         | 1.81e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.747    |
| fps                | 850      |
| nupdates           | 1633100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8165500  |
| value_loss         | 6.97e-06 |
---------------------------------
---------------------------------
| explained_variance | -47.7    |
| fps                | 850      |
| nupdates           | 1633200  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.808    |
| fps                | 850      |
| nupdates           | 1635900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8179500  |
| value_loss         | 3.31e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.857    |
| fps                | 850      |
| nupdates           | 1636000  |
| policy_entropy     | 2.05     |
| total_timesteps    | 8180000  |
| value_loss         | 2.73e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.246    |
| fps                | 850      |
| nupdates           | 1636100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8180500  |
| value_loss         | 0.000173 |
---------------------------------
---------------------------------
| explained_variance | 0.953    |
| fps                | 850      |
| nupdates           | 1636200  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -0.0358  |
| fps                | 850      |
| nupdates           | 1639000  |
| policy_entropy     | 1.98     |
| total_timesteps    | 8195000  |
| value_loss         | 0.00132  |
---------------------------------
---------------------------------
| explained_variance | 0.897    |
| fps                | 850      |
| nupdates           | 1639100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8195500  |
| value_loss         | 1.51e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.713    |
| fps                | 850      |
| nupdates           | 1639200  |
| policy_entropy     | 2.01     |
| total_timesteps    | 8196000  |
| value_loss         | 0.000426 |
---------------------------------
---------------------------------
| explained_variance | 0.978    |
| fps                | 850      |
| nupdates           | 1639300  |
| policy_entropy     | 2.01     |
| total_timest

---------------------------------
| explained_variance | 0.424    |
| fps                | 850      |
| nupdates           | 1642000  |
| policy_entropy     | 1.82     |
| total_timesteps    | 8210000  |
| value_loss         | 0.15     |
---------------------------------
---------------------------------
| explained_variance | 0.972    |
| fps                | 850      |
| nupdates           | 1642100  |
| policy_entropy     | 2.05     |
| total_timesteps    | 8210500  |
| value_loss         | 7.28e-06 |
---------------------------------
---------------------------------
| explained_variance | -0.0067  |
| fps                | 850      |
| nupdates           | 1642200  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8211000  |
| value_loss         | 0.000313 |
---------------------------------
---------------------------------
| explained_variance | -7.76    |
| fps                | 850      |
| nupdates           | 1642300  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.395    |
| fps                | 850      |
| nupdates           | 1645100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8225500  |
| value_loss         | 0.000724 |
---------------------------------
---------------------------------
| explained_variance | -25      |
| fps                | 850      |
| nupdates           | 1645200  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8226000  |
| value_loss         | 0.00693  |
---------------------------------
---------------------------------
| explained_variance | -38.1    |
| fps                | 850      |
| nupdates           | 1645300  |
| policy_entropy     | 2.05     |
| total_timesteps    | 8226500  |
| value_loss         | 0.00212  |
---------------------------------
---------------------------------
| explained_variance | 0.358    |
| fps                | 850      |
| nupdates           | 1645400  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.243    |
| fps                | 850      |
| nupdates           | 1648200  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8241000  |
| value_loss         | 0.000171 |
---------------------------------
---------------------------------
| explained_variance | 0.966    |
| fps                | 850      |
| nupdates           | 1648300  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8241500  |
| value_loss         | 0.000753 |
---------------------------------
---------------------------------
| explained_variance | -45.3    |
| fps                | 850      |
| nupdates           | 1648400  |
| policy_entropy     | 2.05     |
| total_timesteps    | 8242000  |
| value_loss         | 0.00342  |
---------------------------------
---------------------------------
| explained_variance | 0.583    |
| fps                | 850      |
| nupdates           | 1648500  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.737    |
| fps                | 850      |
| nupdates           | 1651200  |
| policy_entropy     | 2.08     |
| total_timesteps    | 8256000  |
| value_loss         | 5.02e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.89    |
| fps                | 850      |
| nupdates           | 1651300  |
| policy_entropy     | 2.05     |
| total_timesteps    | 8256500  |
| value_loss         | 0.00124  |
---------------------------------
---------------------------------
| explained_variance | -3.78    |
| fps                | 850      |
| nupdates           | 1651400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8257000  |
| value_loss         | 0.000141 |
---------------------------------
---------------------------------
| explained_variance | -332     |
| fps                | 850      |
| nupdates           | 1651500  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.927    |
| fps                | 851      |
| nupdates           | 1654300  |
| policy_entropy     | 2.08     |
| total_timesteps    | 8271500  |
| value_loss         | 6.78e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.899    |
| fps                | 851      |
| nupdates           | 1654400  |
| policy_entropy     | 2.08     |
| total_timesteps    | 8272000  |
| value_loss         | 1.69e-05 |
---------------------------------
---------------------------------
| explained_variance | -3.4     |
| fps                | 851      |
| nupdates           | 1654500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8272500  |
| value_loss         | 0.00077  |
---------------------------------
---------------------------------
| explained_variance | -21.5    |
| fps                | 851      |
| nupdates           | 1654600  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.152   |
| fps                | 851      |
| nupdates           | 1657300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8286500  |
| value_loss         | 0.000367 |
---------------------------------
---------------------------------
| explained_variance | 0.219    |
| fps                | 851      |
| nupdates           | 1657400  |
| policy_entropy     | 2.05     |
| total_timesteps    | 8287000  |
| value_loss         | 0.141    |
---------------------------------
---------------------------------
| explained_variance | 0.752    |
| fps                | 851      |
| nupdates           | 1657500  |
| policy_entropy     | 2.04     |
| total_timesteps    | 8287500  |
| value_loss         | 0.000136 |
---------------------------------
---------------------------------
| explained_variance | -12.6    |
| fps                | 851      |
| nupdates           | 1657600  |
| policy_entropy     | 1.55     |
| total_timest

---------------------------------
| explained_variance | -0.814   |
| fps                | 850      |
| nupdates           | 1660300  |
| policy_entropy     | 2.04     |
| total_timesteps    | 8301500  |
| value_loss         | 0.00011  |
---------------------------------
---------------------------------
| explained_variance | 0.601    |
| fps                | 851      |
| nupdates           | 1660400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8302000  |
| value_loss         | 2.21e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.359   |
| fps                | 851      |
| nupdates           | 1660500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8302500  |
| value_loss         | 0.000348 |
---------------------------------
---------------------------------
| explained_variance | 0.162    |
| fps                | 851      |
| nupdates           | 1660600  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.493    |
| fps                | 851      |
| nupdates           | 1663400  |
| policy_entropy     | 1.4      |
| total_timesteps    | 8317000  |
| value_loss         | 0.00117  |
---------------------------------
---------------------------------
| explained_variance | 0.965    |
| fps                | 851      |
| nupdates           | 1663500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8317500  |
| value_loss         | 7.36e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.177    |
| fps                | 851      |
| nupdates           | 1663600  |
| policy_entropy     | 2.02     |
| total_timesteps    | 8318000  |
| value_loss         | 0.00133  |
---------------------------------
---------------------------------
| explained_variance | 0.371    |
| fps                | 851      |
| nupdates           | 1663700  |
| policy_entropy     | 0.72     |
| total_timest

---------------------------------
| explained_variance | -4.01    |
| fps                | 851      |
| nupdates           | 1666400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8332000  |
| value_loss         | 0.000317 |
---------------------------------
----------------------------------
| explained_variance | -1.03e+03 |
| fps                | 851       |
| nupdates           | 1666500   |
| policy_entropy     | 2.06      |
| total_timesteps    | 8332500   |
| value_loss         | 0.0798    |
----------------------------------
---------------------------------
| explained_variance | 0.871    |
| fps                | 851      |
| nupdates           | 1666600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8333000  |
| value_loss         | 8.58e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.824    |
| fps                | 851      |
| nupdates           | 1666700  |
| policy_entropy     | 2.08     |
| tota

---------------------------------
| explained_variance | -0.355   |
| fps                | 851      |
| nupdates           | 1669500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8347500  |
| value_loss         | 0.000915 |
---------------------------------
---------------------------------
| explained_variance | 0.859    |
| fps                | 851      |
| nupdates           | 1669600  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8348000  |
| value_loss         | 5.11e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.954    |
| fps                | 851      |
| nupdates           | 1669700  |
| policy_entropy     | 2.05     |
| total_timesteps    | 8348500  |
| value_loss         | 3.04e-05 |
---------------------------------
---------------------------------
| explained_variance | -5.72    |
| fps                | 851      |
| nupdates           | 1669800  |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | 0.508    |
| fps                | 851      |
| nupdates           | 1672500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8362500  |
| value_loss         | 0.000251 |
---------------------------------
---------------------------------
| explained_variance | 0.967    |
| fps                | 851      |
| nupdates           | 1672600  |
| policy_entropy     | 2.01     |
| total_timesteps    | 8363000  |
| value_loss         | 1.12e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.0191  |
| fps                | 851      |
| nupdates           | 1672700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8363500  |
| value_loss         | 0.000301 |
---------------------------------
---------------------------------
| explained_variance | 0.112    |
| fps                | 851      |
| nupdates           | 1672800  |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | -18.1    |
| fps                | 851      |
| nupdates           | 1675500  |
| policy_entropy     | 1.97     |
| total_timesteps    | 8377500  |
| value_loss         | 0.00462  |
---------------------------------
---------------------------------
| explained_variance | 0.996    |
| fps                | 851      |
| nupdates           | 1675600  |
| policy_entropy     | 2.03     |
| total_timesteps    | 8378000  |
| value_loss         | 1.81e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.986    |
| fps                | 851      |
| nupdates           | 1675700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8378500  |
| value_loss         | 7.11e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.947    |
| fps                | 851      |
| nupdates           | 1675800  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.973    |
| fps                | 851      |
| nupdates           | 1678600  |
| policy_entropy     | 2.08     |
| total_timesteps    | 8393000  |
| value_loss         | 1.98e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.365    |
| fps                | 851      |
| nupdates           | 1678700  |
| policy_entropy     | 1.86     |
| total_timesteps    | 8393500  |
| value_loss         | 0.151    |
---------------------------------
---------------------------------
| explained_variance | 0.629    |
| fps                | 851      |
| nupdates           | 1678800  |
| policy_entropy     | 1.62     |
| total_timesteps    | 8394000  |
| value_loss         | 0.000707 |
---------------------------------
---------------------------------
| explained_variance | 0.949    |
| fps                | 851      |
| nupdates           | 1678900  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.993    |
| fps                | 851      |
| nupdates           | 1681600  |
| policy_entropy     | 2.05     |
| total_timesteps    | 8408000  |
| value_loss         | 4.06e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.924    |
| fps                | 851      |
| nupdates           | 1681700  |
| policy_entropy     | 2.08     |
| total_timesteps    | 8408500  |
| value_loss         | 6.08e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.935    |
| fps                | 851      |
| nupdates           | 1681800  |
| policy_entropy     | 2.08     |
| total_timesteps    | 8409000  |
| value_loss         | 8.63e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.973    |
| fps                | 851      |
| nupdates           | 1681900  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.674    |
| fps                | 851      |
| nupdates           | 1684700  |
| policy_entropy     | 2.05     |
| total_timesteps    | 8423500  |
| value_loss         | 4.56e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.25    |
| fps                | 851      |
| nupdates           | 1684800  |
| policy_entropy     | 2.05     |
| total_timesteps    | 8424000  |
| value_loss         | 0.000927 |
---------------------------------
---------------------------------
| explained_variance | 0.809    |
| fps                | 851      |
| nupdates           | 1684900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8424500  |
| value_loss         | 0.000357 |
---------------------------------
Eval num_timesteps=8425000, episode_reward=-5.00 +/- 0.00
Episode length: 595.10 +/- 161.52
---------------------------------
| explained_variance | -0.794   |
| fps                | 8

---------------------------------
| explained_variance | -0.697   |
| fps                | 851      |
| nupdates           | 1687700  |
| policy_entropy     | 2.04     |
| total_timesteps    | 8438500  |
| value_loss         | 8.41e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.421   |
| fps                | 851      |
| nupdates           | 1687800  |
| policy_entropy     | 1.74     |
| total_timesteps    | 8439000  |
| value_loss         | 0.000272 |
---------------------------------
---------------------------------
| explained_variance | -0.00163 |
| fps                | 851      |
| nupdates           | 1687900  |
| policy_entropy     | 1.94     |
| total_timesteps    | 8439500  |
| value_loss         | 0.155    |
---------------------------------
---------------------------------
| explained_variance | 0.0369   |
| fps                | 851      |
| nupdates           | 1688000  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -1.01    |
| fps                | 851      |
| nupdates           | 1690700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8453500  |
| value_loss         | 0.000134 |
---------------------------------
---------------------------------
| explained_variance | 0.625    |
| fps                | 851      |
| nupdates           | 1690800  |
| policy_entropy     | 2.05     |
| total_timesteps    | 8454000  |
| value_loss         | 0.000201 |
---------------------------------
---------------------------------
| explained_variance | -6.3     |
| fps                | 851      |
| nupdates           | 1690900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8454500  |
| value_loss         | 0.00438  |
---------------------------------
---------------------------------
| explained_variance | -5.13    |
| fps                | 851      |
| nupdates           | 1691000  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.678    |
| fps                | 851      |
| nupdates           | 1693800  |
| policy_entropy     | 2.04     |
| total_timesteps    | 8469000  |
| value_loss         | 1.79e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.838    |
| fps                | 851      |
| nupdates           | 1693900  |
| policy_entropy     | 2.03     |
| total_timesteps    | 8469500  |
| value_loss         | 0.00113  |
---------------------------------
---------------------------------
| explained_variance | 0.837    |
| fps                | 851      |
| nupdates           | 1694000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8470000  |
| value_loss         | 1.05e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.961    |
| fps                | 851      |
| nupdates           | 1694100  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.321    |
| fps                | 851      |
| nupdates           | 1696800  |
| policy_entropy     | 2.05     |
| total_timesteps    | 8484000  |
| value_loss         | 3.89e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.995    |
| fps                | 851      |
| nupdates           | 1696900  |
| policy_entropy     | 2.03     |
| total_timesteps    | 8484500  |
| value_loss         | 1.58e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.678    |
| fps                | 851      |
| nupdates           | 1697000  |
| policy_entropy     | 2.04     |
| total_timesteps    | 8485000  |
| value_loss         | 1.5e-05  |
---------------------------------
---------------------------------
| explained_variance | -0.496   |
| fps                | 851      |
| nupdates           | 1697100  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -6.17    |
| fps                | 851      |
| nupdates           | 1699900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8499500  |
| value_loss         | 0.000202 |
---------------------------------
Eval num_timesteps=8500000, episode_reward=-4.90 +/- 0.30
Episode length: 607.00 +/- 127.90
---------------------------------
| explained_variance | -1.07    |
| fps                | 851      |
| nupdates           | 1700000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8500000  |
| value_loss         | 0.000108 |
---------------------------------
---------------------------------
| explained_variance | 0.893    |
| fps                | 851      |
| nupdates           | 1700100  |
| policy_entropy     | 2.08     |
| total_timesteps    | 8500500  |
| value_loss         | 0.000146 |
---------------------------------
---------------------------------
| explained_variance | 0.694    |
| fps                | 8

---------------------------------
| explained_variance | -0.293   |
| fps                | 851      |
| nupdates           | 1702900  |
| policy_entropy     | 2.05     |
| total_timesteps    | 8514500  |
| value_loss         | 0.000442 |
---------------------------------
---------------------------------
| explained_variance | -46.6    |
| fps                | 851      |
| nupdates           | 1703000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8515000  |
| value_loss         | 0.00217  |
---------------------------------
---------------------------------
| explained_variance | 0.914    |
| fps                | 851      |
| nupdates           | 1703100  |
| policy_entropy     | 2.02     |
| total_timesteps    | 8515500  |
| value_loss         | 1.94e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.78     |
| fps                | 851      |
| nupdates           | 1703200  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.946    |
| fps                | 851      |
| nupdates           | 1705900  |
| policy_entropy     | 2.08     |
| total_timesteps    | 8529500  |
| value_loss         | 9.72e-06 |
---------------------------------
---------------------------------
| explained_variance | -2.13    |
| fps                | 851      |
| nupdates           | 1706000  |
| policy_entropy     | 2.04     |
| total_timesteps    | 8530000  |
| value_loss         | 0.00055  |
---------------------------------
---------------------------------
| explained_variance | 0.879    |
| fps                | 851      |
| nupdates           | 1706100  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8530500  |
| value_loss         | 3.78e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.91    |
| fps                | 851      |
| nupdates           | 1706200  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -0.37    |
| fps                | 851      |
| nupdates           | 1709000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8545000  |
| value_loss         | 0.000492 |
---------------------------------
---------------------------------
| explained_variance | 0.19     |
| fps                | 851      |
| nupdates           | 1709100  |
| policy_entropy     | 2.04     |
| total_timesteps    | 8545500  |
| value_loss         | 6.72e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.33     |
| fps                | 851      |
| nupdates           | 1709200  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8546000  |
| value_loss         | 2.75e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.871    |
| fps                | 851      |
| nupdates           | 1709300  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.438    |
| fps                | 851      |
| nupdates           | 1712000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8560000  |
| value_loss         | 0.000117 |
---------------------------------
---------------------------------
| explained_variance | 0.982    |
| fps                | 851      |
| nupdates           | 1712100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8560500  |
| value_loss         | 4.04e-05 |
---------------------------------
---------------------------------
| explained_variance | -3.05    |
| fps                | 851      |
| nupdates           | 1712200  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8561000  |
| value_loss         | 0.00013  |
---------------------------------
---------------------------------
| explained_variance | 0.902    |
| fps                | 851      |
| nupdates           | 1712300  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -4.31    |
| fps                | 851      |
| nupdates           | 1715100  |
| policy_entropy     | 2.03     |
| total_timesteps    | 8575500  |
| value_loss         | 0.0012   |
---------------------------------
---------------------------------
| explained_variance | 0.975    |
| fps                | 851      |
| nupdates           | 1715200  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8576000  |
| value_loss         | 5.65e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.59     |
| fps                | 851      |
| nupdates           | 1715300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8576500  |
| value_loss         | 0.000155 |
---------------------------------
---------------------------------
| explained_variance | 0.93     |
| fps                | 851      |
| nupdates           | 1715400  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -0.00285 |
| fps                | 851      |
| nupdates           | 1718200  |
| policy_entropy     | 1.99     |
| total_timesteps    | 8591000  |
| value_loss         | 0.22     |
---------------------------------
---------------------------------
| explained_variance | -37.4    |
| fps                | 851      |
| nupdates           | 1718300  |
| policy_entropy     | 2.03     |
| total_timesteps    | 8591500  |
| value_loss         | 0.00367  |
---------------------------------
---------------------------------
| explained_variance | 0.838    |
| fps                | 851      |
| nupdates           | 1718400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8592000  |
| value_loss         | 0.000131 |
---------------------------------
---------------------------------
| explained_variance | -3.66    |
| fps                | 851      |
| nupdates           | 1718500  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -3.21    |
| fps                | 851      |
| nupdates           | 1721200  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8606000  |
| value_loss         | 0.00117  |
---------------------------------
---------------------------------
| explained_variance | 0.252    |
| fps                | 851      |
| nupdates           | 1721300  |
| policy_entropy     | 2.05     |
| total_timesteps    | 8606500  |
| value_loss         | 0.000151 |
---------------------------------
---------------------------------
| explained_variance | 0.922    |
| fps                | 851      |
| nupdates           | 1721400  |
| policy_entropy     | 1.99     |
| total_timesteps    | 8607000  |
| value_loss         | 0.000192 |
---------------------------------
---------------------------------
| explained_variance | -0.554   |
| fps                | 851      |
| nupdates           | 1721500  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -0.66    |
| fps                | 851      |
| nupdates           | 1724300  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8621500  |
| value_loss         | 0.000177 |
---------------------------------
---------------------------------
| explained_variance | -62.4    |
| fps                | 851      |
| nupdates           | 1724400  |
| policy_entropy     | 2        |
| total_timesteps    | 8622000  |
| value_loss         | 0.0096   |
---------------------------------
---------------------------------
| explained_variance | 0.118    |
| fps                | 851      |
| nupdates           | 1724500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8622500  |
| value_loss         | 0.000282 |
---------------------------------
---------------------------------
| explained_variance | -0.795   |
| fps                | 851      |
| nupdates           | 1724600  |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | 0.958    |
| fps                | 851      |
| nupdates           | 1727300  |
| policy_entropy     | 2.03     |
| total_timesteps    | 8636500  |
| value_loss         | 7.15e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.786    |
| fps                | 851      |
| nupdates           | 1727400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8637000  |
| value_loss         | 0.000152 |
---------------------------------
---------------------------------
| explained_variance | 0.827    |
| fps                | 851      |
| nupdates           | 1727500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8637500  |
| value_loss         | 0.000127 |
---------------------------------
---------------------------------
| explained_variance | 0.348    |
| fps                | 851      |
| nupdates           | 1727600  |
| policy_entropy     | 2.01     |
| total_timest

---------------------------------
| explained_variance | 0.617    |
| fps                | 851      |
| nupdates           | 1730300  |
| policy_entropy     | 2.01     |
| total_timesteps    | 8651500  |
| value_loss         | 0.00053  |
---------------------------------
---------------------------------
| explained_variance | -50.6    |
| fps                | 851      |
| nupdates           | 1730400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8652000  |
| value_loss         | 0.000859 |
---------------------------------
---------------------------------
| explained_variance | 0.993    |
| fps                | 851      |
| nupdates           | 1730500  |
| policy_entropy     | 2.04     |
| total_timesteps    | 8652500  |
| value_loss         | 4.12e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.899    |
| fps                | 851      |
| nupdates           | 1730600  |
| policy_entropy     | 1.94     |
| total_timest

---------------------------------
| explained_variance | 0.878    |
| fps                | 851      |
| nupdates           | 1733400  |
| policy_entropy     | 2.08     |
| total_timesteps    | 8667000  |
| value_loss         | 0.000154 |
---------------------------------
---------------------------------
| explained_variance | 0.268    |
| fps                | 851      |
| nupdates           | 1733500  |
| policy_entropy     | 2.05     |
| total_timesteps    | 8667500  |
| value_loss         | 0.000716 |
---------------------------------
---------------------------------
| explained_variance | 0.255    |
| fps                | 851      |
| nupdates           | 1733600  |
| policy_entropy     | 2        |
| total_timesteps    | 8668000  |
| value_loss         | 0.00304  |
---------------------------------
---------------------------------
| explained_variance | 0.655    |
| fps                | 851      |
| nupdates           | 1733700  |
| policy_entropy     | 1.93     |
| total_timest

---------------------------------
| explained_variance | 0.715    |
| fps                | 851      |
| nupdates           | 1736400  |
| policy_entropy     | 1.8      |
| total_timesteps    | 8682000  |
| value_loss         | 0.000368 |
---------------------------------
----------------------------------
| explained_variance | -0.000319 |
| fps                | 851       |
| nupdates           | 1736500   |
| policy_entropy     | 1.85      |
| total_timesteps    | 8682500   |
| value_loss         | 0.00104   |
----------------------------------
---------------------------------
| explained_variance | -0.255   |
| fps                | 851      |
| nupdates           | 1736600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8683000  |
| value_loss         | 9.69e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.517    |
| fps                | 851      |
| nupdates           | 1736700  |
| policy_entropy     | 2.07     |
| tota

---------------------------------
| explained_variance | -0.0186  |
| fps                | 852      |
| nupdates           | 1739500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8697500  |
| value_loss         | 0.323    |
---------------------------------
---------------------------------
| explained_variance | 0.998    |
| fps                | 852      |
| nupdates           | 1739600  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8698000  |
| value_loss         | 4.57e-07 |
---------------------------------
---------------------------------
| explained_variance | 0.663    |
| fps                | 852      |
| nupdates           | 1739700  |
| policy_entropy     | 2.04     |
| total_timesteps    | 8698500  |
| value_loss         | 6.93e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.08    |
| fps                | 852      |
| nupdates           | 1739800  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -45.2    |
| fps                | 851      |
| nupdates           | 1742500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8712500  |
| value_loss         | 0.00198  |
---------------------------------
---------------------------------
| explained_variance | 0.976    |
| fps                | 851      |
| nupdates           | 1742600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8713000  |
| value_loss         | 1.78e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.382    |
| fps                | 851      |
| nupdates           | 1742700  |
| policy_entropy     | 2.05     |
| total_timesteps    | 8713500  |
| value_loss         | 0.000527 |
---------------------------------
---------------------------------
| explained_variance | 0.831    |
| fps                | 851      |
| nupdates           | 1742800  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -3.34    |
| fps                | 851      |
| nupdates           | 1745500  |
| policy_entropy     | 1.96     |
| total_timesteps    | 8727500  |
| value_loss         | 0.00314  |
---------------------------------
---------------------------------
| explained_variance | -0.212   |
| fps                | 851      |
| nupdates           | 1745600  |
| policy_entropy     | 2.04     |
| total_timesteps    | 8728000  |
| value_loss         | 0.000156 |
---------------------------------
---------------------------------
| explained_variance | 0.464    |
| fps                | 851      |
| nupdates           | 1745700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8728500  |
| value_loss         | 0.000164 |
---------------------------------
---------------------------------
| explained_variance | 0.71     |
| fps                | 851      |
| nupdates           | 1745800  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -1.09    |
| fps                | 852      |
| nupdates           | 1748600  |
| policy_entropy     | 2.08     |
| total_timesteps    | 8743000  |
| value_loss         | 0.000695 |
---------------------------------
---------------------------------
| explained_variance | 0.374    |
| fps                | 852      |
| nupdates           | 1748700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8743500  |
| value_loss         | 3.37e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.989    |
| fps                | 852      |
| nupdates           | 1748800  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8744000  |
| value_loss         | 1.37e-06 |
---------------------------------
---------------------------------
| explained_variance | -0.317   |
| fps                | 852      |
| nupdates           | 1748900  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.992    |
| fps                | 852      |
| nupdates           | 1751600  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8758000  |
| value_loss         | 9.65e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.978    |
| fps                | 852      |
| nupdates           | 1751700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8758500  |
| value_loss         | 5.26e-07 |
---------------------------------
---------------------------------
| explained_variance | 0.878    |
| fps                | 852      |
| nupdates           | 1751800  |
| policy_entropy     | 2.04     |
| total_timesteps    | 8759000  |
| value_loss         | 2.84e-06 |
---------------------------------
---------------------------------
| explained_variance | -21.4    |
| fps                | 852      |
| nupdates           | 1751900  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.595    |
| fps                | 852      |
| nupdates           | 1754700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8773500  |
| value_loss         | 0.000233 |
---------------------------------
---------------------------------
| explained_variance | 0.914    |
| fps                | 852      |
| nupdates           | 1754800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8774000  |
| value_loss         | 6.03e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.945    |
| fps                | 852      |
| nupdates           | 1754900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8774500  |
| value_loss         | 4.53e-05 |
---------------------------------
Eval num_timesteps=8775000, episode_reward=-4.60 +/- 0.80
Episode length: 657.80 +/- 141.53
---------------------------------
| explained_variance | 0.351    |
| fps                | 8

---------------------------------
| explained_variance | 0.976    |
| fps                | 852      |
| nupdates           | 1757700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8788500  |
| value_loss         | 1.31e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.952    |
| fps                | 852      |
| nupdates           | 1757800  |
| policy_entropy     | 2.08     |
| total_timesteps    | 8789000  |
| value_loss         | 3.83e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.546    |
| fps                | 852      |
| nupdates           | 1757900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8789500  |
| value_loss         | 3.67e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.041    |
| fps                | 852      |
| nupdates           | 1758000  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.929    |
| fps                | 852      |
| nupdates           | 1760700  |
| policy_entropy     | 2.04     |
| total_timesteps    | 8803500  |
| value_loss         | 0.000101 |
---------------------------------
---------------------------------
| explained_variance | 0.435    |
| fps                | 852      |
| nupdates           | 1760800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8804000  |
| value_loss         | 6.13e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.821    |
| fps                | 852      |
| nupdates           | 1760900  |
| policy_entropy     | 2.03     |
| total_timesteps    | 8804500  |
| value_loss         | 0.000278 |
---------------------------------
---------------------------------
| explained_variance | 0.0819   |
| fps                | 852      |
| nupdates           | 1761000  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.948    |
| fps                | 852      |
| nupdates           | 1763800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8819000  |
| value_loss         | 7.48e-06 |
---------------------------------
---------------------------------
| explained_variance | -40.8    |
| fps                | 852      |
| nupdates           | 1763900  |
| policy_entropy     | 1.89     |
| total_timesteps    | 8819500  |
| value_loss         | 0.121    |
---------------------------------
---------------------------------
| explained_variance | 0.748    |
| fps                | 852      |
| nupdates           | 1764000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8820000  |
| value_loss         | 1.28e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.743    |
| fps                | 852      |
| nupdates           | 1764100  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.628    |
| fps                | 852      |
| nupdates           | 1766800  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8834000  |
| value_loss         | 4.64e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.691   |
| fps                | 852      |
| nupdates           | 1766900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8834500  |
| value_loss         | 0.00058  |
---------------------------------
---------------------------------
| explained_variance | -6.72    |
| fps                | 852      |
| nupdates           | 1767000  |
| policy_entropy     | 2.08     |
| total_timesteps    | 8835000  |
| value_loss         | 0.00013  |
---------------------------------
---------------------------------
| explained_variance | 0.118    |
| fps                | 852      |
| nupdates           | 1767100  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.147   |
| fps                | 852      |
| nupdates           | 1769900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8849500  |
| value_loss         | 0.00483  |
---------------------------------
Eval num_timesteps=8850000, episode_reward=-4.80 +/- 0.40
Episode length: 637.20 +/- 149.35
---------------------------------
| explained_variance | 0.775    |
| fps                | 852      |
| nupdates           | 1770000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8850000  |
| value_loss         | 3.32e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.807    |
| fps                | 852      |
| nupdates           | 1770100  |
| policy_entropy     | 2.08     |
| total_timesteps    | 8850500  |
| value_loss         | 1.08e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.87    |
| fps                | 8

---------------------------------
| explained_variance | 0.427    |
| fps                | 852      |
| nupdates           | 1772900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8864500  |
| value_loss         | 5.39e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.783    |
| fps                | 852      |
| nupdates           | 1773000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8865000  |
| value_loss         | 1.69e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.909    |
| fps                | 852      |
| nupdates           | 1773100  |
| policy_entropy     | 2.08     |
| total_timesteps    | 8865500  |
| value_loss         | 4.11e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.151   |
| fps                | 852      |
| nupdates           | 1773200  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.982    |
| fps                | 852      |
| nupdates           | 1775900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8879500  |
| value_loss         | 3.46e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.884    |
| fps                | 852      |
| nupdates           | 1776000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8880000  |
| value_loss         | 2.65e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.851    |
| fps                | 852      |
| nupdates           | 1776100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8880500  |
| value_loss         | 0.000215 |
---------------------------------
---------------------------------
| explained_variance | 0.737    |
| fps                | 852      |
| nupdates           | 1776200  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.29    |
| fps                | 852      |
| nupdates           | 1779000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8895000  |
| value_loss         | 0.000388 |
---------------------------------
---------------------------------
| explained_variance | 0.968    |
| fps                | 852      |
| nupdates           | 1779100  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8895500  |
| value_loss         | 4.07e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.68    |
| fps                | 852      |
| nupdates           | 1779200  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8896000  |
| value_loss         | 1.64e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.544    |
| fps                | 852      |
| nupdates           | 1779300  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.956    |
| fps                | 852      |
| nupdates           | 1782000  |
| policy_entropy     | 2.03     |
| total_timesteps    | 8910000  |
| value_loss         | 0.000139 |
---------------------------------
---------------------------------
| explained_variance | 0.301    |
| fps                | 852      |
| nupdates           | 1782100  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8910500  |
| value_loss         | 9.19e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.587    |
| fps                | 852      |
| nupdates           | 1782200  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8911000  |
| value_loss         | 0.000194 |
---------------------------------
---------------------------------
| explained_variance | 0.948    |
| fps                | 852      |
| nupdates           | 1782300  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.308    |
| fps                | 852      |
| nupdates           | 1785100  |
| policy_entropy     | 2        |
| total_timesteps    | 8925500  |
| value_loss         | 0.000123 |
---------------------------------
---------------------------------
| explained_variance | 0.761    |
| fps                | 852      |
| nupdates           | 1785200  |
| policy_entropy     | 2.04     |
| total_timesteps    | 8926000  |
| value_loss         | 1.07e-05 |
---------------------------------
---------------------------------
| explained_variance | -13.1    |
| fps                | 852      |
| nupdates           | 1785300  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8926500  |
| value_loss         | 0.000157 |
---------------------------------
---------------------------------
| explained_variance | -0.55    |
| fps                | 852      |
| nupdates           | 1785400  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.895    |
| fps                | 852      |
| nupdates           | 1788200  |
| policy_entropy     | 2.02     |
| total_timesteps    | 8941000  |
| value_loss         | 1.54e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.405   |
| fps                | 852      |
| nupdates           | 1788300  |
| policy_entropy     | 2.03     |
| total_timesteps    | 8941500  |
| value_loss         | 0.00102  |
---------------------------------
---------------------------------
| explained_variance | 0.341    |
| fps                | 852      |
| nupdates           | 1788400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8942000  |
| value_loss         | 0.000217 |
---------------------------------
---------------------------------
| explained_variance | 0.99     |
| fps                | 852      |
| nupdates           | 1788500  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.122    |
| fps                | 852      |
| nupdates           | 1791200  |
| policy_entropy     | 1.86     |
| total_timesteps    | 8956000  |
| value_loss         | 0.903    |
---------------------------------
---------------------------------
| explained_variance | 0.917    |
| fps                | 852      |
| nupdates           | 1791300  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8956500  |
| value_loss         | 1.16e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.121    |
| fps                | 852      |
| nupdates           | 1791400  |
| policy_entropy     | 2.05     |
| total_timesteps    | 8957000  |
| value_loss         | 3.55e-05 |
---------------------------------
---------------------------------
| explained_variance | -12.6    |
| fps                | 852      |
| nupdates           | 1791500  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.0886   |
| fps                | 852      |
| nupdates           | 1794300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8971500  |
| value_loss         | 0.00525  |
---------------------------------
---------------------------------
| explained_variance | 0.744    |
| fps                | 853      |
| nupdates           | 1794400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8972000  |
| value_loss         | 2.75e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.158    |
| fps                | 853      |
| nupdates           | 1794500  |
| policy_entropy     | 2.05     |
| total_timesteps    | 8972500  |
| value_loss         | 3.77e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.455    |
| fps                | 853      |
| nupdates           | 1794600  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.922    |
| fps                | 852      |
| nupdates           | 1797300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8986500  |
| value_loss         | 0.000127 |
---------------------------------
---------------------------------
| explained_variance | -1.05    |
| fps                | 852      |
| nupdates           | 1797400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 8987000  |
| value_loss         | 0.000102 |
---------------------------------
---------------------------------
| explained_variance | 0.47     |
| fps                | 852      |
| nupdates           | 1797500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 8987500  |
| value_loss         | 6.08e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.08    |
| fps                | 852      |
| nupdates           | 1797600  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.494    |
| fps                | 852      |
| nupdates           | 1800300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9001500  |
| value_loss         | 0.000113 |
---------------------------------
---------------------------------
| explained_variance | 0.672    |
| fps                | 852      |
| nupdates           | 1800400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9002000  |
| value_loss         | 0.000209 |
---------------------------------
---------------------------------
| explained_variance | 0.776    |
| fps                | 852      |
| nupdates           | 1800500  |
| policy_entropy     | 2.05     |
| total_timesteps    | 9002500  |
| value_loss         | 2.45e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.727    |
| fps                | 852      |
| nupdates           | 1800600  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -1.97    |
| fps                | 852      |
| nupdates           | 1803400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9017000  |
| value_loss         | 0.000562 |
---------------------------------
---------------------------------
| explained_variance | -5.22    |
| fps                | 852      |
| nupdates           | 1803500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9017500  |
| value_loss         | 0.00897  |
---------------------------------
---------------------------------
| explained_variance | 0.813    |
| fps                | 852      |
| nupdates           | 1803600  |
| policy_entropy     | 2.02     |
| total_timesteps    | 9018000  |
| value_loss         | 9.58e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.672    |
| fps                | 852      |
| nupdates           | 1803700  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.354   |
| fps                | 852      |
| nupdates           | 1806400  |
| policy_entropy     | 1.98     |
| total_timesteps    | 9032000  |
| value_loss         | 0.000544 |
---------------------------------
---------------------------------
| explained_variance | -0.717   |
| fps                | 852      |
| nupdates           | 1806500  |
| policy_entropy     | 2.02     |
| total_timesteps    | 9032500  |
| value_loss         | 0.000541 |
---------------------------------
---------------------------------
| explained_variance | 0.969    |
| fps                | 852      |
| nupdates           | 1806600  |
| policy_entropy     | 2.02     |
| total_timesteps    | 9033000  |
| value_loss         | 8.83e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.164    |
| fps                | 852      |
| nupdates           | 1806700  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.795    |
| fps                | 852      |
| nupdates           | 1809500  |
| policy_entropy     | 2.08     |
| total_timesteps    | 9047500  |
| value_loss         | 1.91e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.763    |
| fps                | 852      |
| nupdates           | 1809600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9048000  |
| value_loss         | 1.14e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.647    |
| fps                | 852      |
| nupdates           | 1809700  |
| policy_entropy     | 2.05     |
| total_timesteps    | 9048500  |
| value_loss         | 4.87e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.762    |
| fps                | 852      |
| nupdates           | 1809800  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.874    |
| fps                | 852      |
| nupdates           | 1812500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9062500  |
| value_loss         | 3.91e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.879    |
| fps                | 852      |
| nupdates           | 1812600  |
| policy_entropy     | 2.04     |
| total_timesteps    | 9063000  |
| value_loss         | 5.34e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.0179  |
| fps                | 852      |
| nupdates           | 1812700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9063500  |
| value_loss         | 0.000551 |
---------------------------------
---------------------------------
| explained_variance | 0.383    |
| fps                | 852      |
| nupdates           | 1812800  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -2.71    |
| fps                | 852      |
| nupdates           | 1815500  |
| policy_entropy     | 2.04     |
| total_timesteps    | 9077500  |
| value_loss         | 7.18e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.56    |
| fps                | 852      |
| nupdates           | 1815600  |
| policy_entropy     | 2.05     |
| total_timesteps    | 9078000  |
| value_loss         | 2.29e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.614    |
| fps                | 852      |
| nupdates           | 1815700  |
| policy_entropy     | 2.04     |
| total_timesteps    | 9078500  |
| value_loss         | 3.43e-05 |
---------------------------------
---------------------------------
| explained_variance | -100     |
| fps                | 853      |
| nupdates           | 1815800  |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | -1.38    |
| fps                | 853      |
| nupdates           | 1818600  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9093000  |
| value_loss         | 0.000458 |
---------------------------------
---------------------------------
| explained_variance | 0.901    |
| fps                | 853      |
| nupdates           | 1818700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9093500  |
| value_loss         | 6.51e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.0011   |
| fps                | 853      |
| nupdates           | 1818800  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9094000  |
| value_loss         | 3.8e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.414    |
| fps                | 853      |
| nupdates           | 1818900  |
| policy_entropy     | 2        |
| total_timest

---------------------------------
| explained_variance | 0.191    |
| fps                | 853      |
| nupdates           | 1821600  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9108000  |
| value_loss         | 8.15e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.855    |
| fps                | 853      |
| nupdates           | 1821700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9108500  |
| value_loss         | 6.18e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.659    |
| fps                | 853      |
| nupdates           | 1821800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9109000  |
| value_loss         | 9.71e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.666    |
| fps                | 853      |
| nupdates           | 1821900  |
| policy_entropy     | 2        |
| total_timest

---------------------------------
| explained_variance | 0.974    |
| fps                | 853      |
| nupdates           | 1824700  |
| policy_entropy     | 2.04     |
| total_timesteps    | 9123500  |
| value_loss         | 5.73e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.992    |
| fps                | 853      |
| nupdates           | 1824800  |
| policy_entropy     | 0.997    |
| total_timesteps    | 9124000  |
| value_loss         | 0.0075   |
---------------------------------
---------------------------------
| explained_variance | -1.23    |
| fps                | 853      |
| nupdates           | 1824900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9124500  |
| value_loss         | 5.88e-05 |
---------------------------------
Eval num_timesteps=9125000, episode_reward=-4.90 +/- 0.30
Episode length: 564.40 +/- 100.37
---------------------------------
| explained_variance | 0.943    |
| fps                | 8

---------------------------------
| explained_variance | 0.74     |
| fps                | 853      |
| nupdates           | 1827700  |
| policy_entropy     | 2.05     |
| total_timesteps    | 9138500  |
| value_loss         | 3.34e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.777    |
| fps                | 853      |
| nupdates           | 1827800  |
| policy_entropy     | 2.05     |
| total_timesteps    | 9139000  |
| value_loss         | 4.69e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.147    |
| fps                | 853      |
| nupdates           | 1827900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9139500  |
| value_loss         | 8.71e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.997    |
| fps                | 853      |
| nupdates           | 1828000  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.928    |
| fps                | 853      |
| nupdates           | 1830700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9153500  |
| value_loss         | 0.000724 |
---------------------------------
---------------------------------
| explained_variance | 0.994    |
| fps                | 853      |
| nupdates           | 1830800  |
| policy_entropy     | 2.05     |
| total_timesteps    | 9154000  |
| value_loss         | 3.82e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.201    |
| fps                | 853      |
| nupdates           | 1830900  |
| policy_entropy     | 2.05     |
| total_timesteps    | 9154500  |
| value_loss         | 0.00148  |
---------------------------------
---------------------------------
| explained_variance | -0.605   |
| fps                | 853      |
| nupdates           | 1831000  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.223   |
| fps                | 853      |
| nupdates           | 1833800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9169000  |
| value_loss         | 0.000432 |
---------------------------------
---------------------------------
| explained_variance | -0.09    |
| fps                | 853      |
| nupdates           | 1833900  |
| policy_entropy     | 2.04     |
| total_timesteps    | 9169500  |
| value_loss         | 0.000189 |
---------------------------------
---------------------------------
| explained_variance | -8.73    |
| fps                | 853      |
| nupdates           | 1834000  |
| policy_entropy     | 2.04     |
| total_timesteps    | 9170000  |
| value_loss         | 0.00139  |
---------------------------------
---------------------------------
| explained_variance | 0.913    |
| fps                | 853      |
| nupdates           | 1834100  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -0.446   |
| fps                | 853      |
| nupdates           | 1836800  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9184000  |
| value_loss         | 0.000417 |
---------------------------------
---------------------------------
| explained_variance | 0.975    |
| fps                | 853      |
| nupdates           | 1836900  |
| policy_entropy     | 2.05     |
| total_timesteps    | 9184500  |
| value_loss         | 3.81e-06 |
---------------------------------
---------------------------------
| explained_variance | -0.226   |
| fps                | 853      |
| nupdates           | 1837000  |
| policy_entropy     | 2.02     |
| total_timesteps    | 9185000  |
| value_loss         | 0.000624 |
---------------------------------
---------------------------------
| explained_variance | -3.39    |
| fps                | 853      |
| nupdates           | 1837100  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -3.38    |
| fps                | 854      |
| nupdates           | 1839900  |
| policy_entropy     | 2.03     |
| total_timesteps    | 9199500  |
| value_loss         | 0.000115 |
---------------------------------
Eval num_timesteps=9200000, episode_reward=-4.60 +/- 0.49
Episode length: 594.40 +/- 150.62
---------------------------------
| explained_variance | 0.952    |
| fps                | 853      |
| nupdates           | 1840000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9200000  |
| value_loss         | 0.000362 |
---------------------------------
---------------------------------
| explained_variance | 0.902    |
| fps                | 853      |
| nupdates           | 1840100  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9200500  |
| value_loss         | 0.000116 |
---------------------------------
---------------------------------
| explained_variance | -0.351   |
| fps                | 8

---------------------------------
| explained_variance | -2.53    |
| fps                | 854      |
| nupdates           | 1842900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9214500  |
| value_loss         | 0.000285 |
---------------------------------
---------------------------------
| explained_variance | 0.352    |
| fps                | 854      |
| nupdates           | 1843000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9215000  |
| value_loss         | 4.54e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.386    |
| fps                | 854      |
| nupdates           | 1843100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9215500  |
| value_loss         | 0.000584 |
---------------------------------
---------------------------------
| explained_variance | 0.0981   |
| fps                | 854      |
| nupdates           | 1843200  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.994    |
| fps                | 853      |
| nupdates           | 1845900  |
| policy_entropy     | 2.08     |
| total_timesteps    | 9229500  |
| value_loss         | 1.41e-06 |
---------------------------------
---------------------------------
| explained_variance | -2.25    |
| fps                | 853      |
| nupdates           | 1846000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9230000  |
| value_loss         | 0.000807 |
---------------------------------
---------------------------------
| explained_variance | -2.21    |
| fps                | 853      |
| nupdates           | 1846100  |
| policy_entropy     | 2.05     |
| total_timesteps    | 9230500  |
| value_loss         | 7.08e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.765    |
| fps                | 853      |
| nupdates           | 1846200  |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | -5.91    |
| fps                | 854      |
| nupdates           | 1849000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9245000  |
| value_loss         | 0.000406 |
---------------------------------
---------------------------------
| explained_variance | 0.0465   |
| fps                | 854      |
| nupdates           | 1849100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9245500  |
| value_loss         | 0.000418 |
---------------------------------
---------------------------------
| explained_variance | 0.604    |
| fps                | 854      |
| nupdates           | 1849200  |
| policy_entropy     | 2.01     |
| total_timesteps    | 9246000  |
| value_loss         | 0.000929 |
---------------------------------
---------------------------------
| explained_variance | 0.969    |
| fps                | 854      |
| nupdates           | 1849300  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.418    |
| fps                | 854      |
| nupdates           | 1852000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9260000  |
| value_loss         | 8.37e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.979    |
| fps                | 854      |
| nupdates           | 1852100  |
| policy_entropy     | 2.08     |
| total_timesteps    | 9260500  |
| value_loss         | 5.66e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.878    |
| fps                | 854      |
| nupdates           | 1852200  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9261000  |
| value_loss         | 1.07e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.522    |
| fps                | 854      |
| nupdates           | 1852300  |
| policy_entropy     | 2        |
| total_timest

---------------------------------
| explained_variance | 0.519    |
| fps                | 854      |
| nupdates           | 1855100  |
| policy_entropy     | 2.08     |
| total_timesteps    | 9275500  |
| value_loss         | 0.000126 |
---------------------------------
---------------------------------
| explained_variance | -1.96    |
| fps                | 854      |
| nupdates           | 1855200  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9276000  |
| value_loss         | 0.000196 |
---------------------------------
---------------------------------
| explained_variance | 0.121    |
| fps                | 854      |
| nupdates           | 1855300  |
| policy_entropy     | 2.05     |
| total_timesteps    | 9276500  |
| value_loss         | 0.000123 |
---------------------------------
---------------------------------
| explained_variance | 0.758    |
| fps                | 854      |
| nupdates           | 1855400  |
| policy_entropy     | 1.97     |
| total_timest

---------------------------------
| explained_variance | 0.35     |
| fps                | 854      |
| nupdates           | 1858200  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9291000  |
| value_loss         | 0.000332 |
---------------------------------
---------------------------------
| explained_variance | 0.412    |
| fps                | 854      |
| nupdates           | 1858300  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9291500  |
| value_loss         | 0.000172 |
---------------------------------
---------------------------------
| explained_variance | 0.992    |
| fps                | 854      |
| nupdates           | 1858400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9292000  |
| value_loss         | 1.91e-06 |
---------------------------------
---------------------------------
| explained_variance | -19.2    |
| fps                | 854      |
| nupdates           | 1858500  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.335    |
| fps                | 854      |
| nupdates           | 1861200  |
| policy_entropy     | 2.04     |
| total_timesteps    | 9306000  |
| value_loss         | 2.23e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.87    |
| fps                | 854      |
| nupdates           | 1861300  |
| policy_entropy     | 2.01     |
| total_timesteps    | 9306500  |
| value_loss         | 6.12e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.921    |
| fps                | 854      |
| nupdates           | 1861400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9307000  |
| value_loss         | 2.5e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.0807   |
| fps                | 854      |
| nupdates           | 1861500  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.778    |
| fps                | 854      |
| nupdates           | 1864300  |
| policy_entropy     | 1.94     |
| total_timesteps    | 9321500  |
| value_loss         | 0.000166 |
---------------------------------
---------------------------------
| explained_variance | -1.44    |
| fps                | 854      |
| nupdates           | 1864400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9322000  |
| value_loss         | 0.000405 |
---------------------------------
---------------------------------
| explained_variance | 0.891    |
| fps                | 854      |
| nupdates           | 1864500  |
| policy_entropy     | 2.04     |
| total_timesteps    | 9322500  |
| value_loss         | 1.12e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.883    |
| fps                | 854      |
| nupdates           | 1864600  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.999    |
| fps                | 854      |
| nupdates           | 1867300  |
| policy_entropy     | 2.08     |
| total_timesteps    | 9336500  |
| value_loss         | 6.15e-07 |
---------------------------------
---------------------------------
| explained_variance | 0.542    |
| fps                | 854      |
| nupdates           | 1867400  |
| policy_entropy     | 2.08     |
| total_timesteps    | 9337000  |
| value_loss         | 0.000514 |
---------------------------------
---------------------------------
| explained_variance | 0.503    |
| fps                | 854      |
| nupdates           | 1867500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9337500  |
| value_loss         | 0.000139 |
---------------------------------
---------------------------------
| explained_variance | 0.000495 |
| fps                | 854      |
| nupdates           | 1867600  |
| policy_entropy     | 0.954    |
| total_timest

---------------------------------
| explained_variance | 0.965    |
| fps                | 854      |
| nupdates           | 1870300  |
| policy_entropy     | 2.05     |
| total_timesteps    | 9351500  |
| value_loss         | 5.09e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.0967   |
| fps                | 854      |
| nupdates           | 1870400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9352000  |
| value_loss         | 0.000315 |
---------------------------------
---------------------------------
| explained_variance | 0.438    |
| fps                | 854      |
| nupdates           | 1870500  |
| policy_entropy     | 1.98     |
| total_timesteps    | 9352500  |
| value_loss         | 0.131    |
---------------------------------
---------------------------------
| explained_variance | -2.37    |
| fps                | 854      |
| nupdates           | 1870600  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.992    |
| fps                | 854      |
| nupdates           | 1873400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9367000  |
| value_loss         | 1.74e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.904    |
| fps                | 854      |
| nupdates           | 1873500  |
| policy_entropy     | 2.01     |
| total_timesteps    | 9367500  |
| value_loss         | 0.00102  |
---------------------------------
---------------------------------
| explained_variance | -12      |
| fps                | 854      |
| nupdates           | 1873600  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9368000  |
| value_loss         | 0.00107  |
---------------------------------
---------------------------------
| explained_variance | 0.186    |
| fps                | 854      |
| nupdates           | 1873700  |
| policy_entropy     | 1.98     |
| total_timest

---------------------------------
| explained_variance | -1.46    |
| fps                | 854      |
| nupdates           | 1876400  |
| policy_entropy     | 2.08     |
| total_timesteps    | 9382000  |
| value_loss         | 7.56e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.12    |
| fps                | 854      |
| nupdates           | 1876500  |
| policy_entropy     | 2.08     |
| total_timesteps    | 9382500  |
| value_loss         | 0.000353 |
---------------------------------
---------------------------------
| explained_variance | 0.158    |
| fps                | 854      |
| nupdates           | 1876600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9383000  |
| value_loss         | 0.000296 |
---------------------------------
---------------------------------
| explained_variance | 0.564    |
| fps                | 854      |
| nupdates           | 1876700  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.967    |
| fps                | 854      |
| nupdates           | 1879500  |
| policy_entropy     | 2.03     |
| total_timesteps    | 9397500  |
| value_loss         | 6.21e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.982    |
| fps                | 854      |
| nupdates           | 1879600  |
| policy_entropy     | 2.01     |
| total_timesteps    | 9398000  |
| value_loss         | 2.73e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.968    |
| fps                | 854      |
| nupdates           | 1879700  |
| policy_entropy     | 1.95     |
| total_timesteps    | 9398500  |
| value_loss         | 0.000111 |
---------------------------------
---------------------------------
| explained_variance | -8.27    |
| fps                | 854      |
| nupdates           | 1879800  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.668    |
| fps                | 854      |
| nupdates           | 1882500  |
| policy_entropy     | 2.04     |
| total_timesteps    | 9412500  |
| value_loss         | 3.24e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.874    |
| fps                | 854      |
| nupdates           | 1882600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9413000  |
| value_loss         | 4.51e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.98     |
| fps                | 854      |
| nupdates           | 1882700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9413500  |
| value_loss         | 1.28e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.8     |
| fps                | 854      |
| nupdates           | 1882800  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.938    |
| fps                | 853      |
| nupdates           | 1885500  |
| policy_entropy     | 2.01     |
| total_timesteps    | 9427500  |
| value_loss         | 0.000166 |
---------------------------------
---------------------------------
| explained_variance | 0.142    |
| fps                | 853      |
| nupdates           | 1885600  |
| policy_entropy     | 2.01     |
| total_timesteps    | 9428000  |
| value_loss         | 5.47e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.215    |
| fps                | 853      |
| nupdates           | 1885700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9428500  |
| value_loss         | 4.95e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.47     |
| fps                | 853      |
| nupdates           | 1885800  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -4.17    |
| fps                | 854      |
| nupdates           | 1888600  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9443000  |
| value_loss         | 0.000589 |
---------------------------------
---------------------------------
| explained_variance | 0.326    |
| fps                | 854      |
| nupdates           | 1888700  |
| policy_entropy     | 1.3      |
| total_timesteps    | 9443500  |
| value_loss         | 0.112    |
---------------------------------
---------------------------------
| explained_variance | 0.896    |
| fps                | 854      |
| nupdates           | 1888800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9444000  |
| value_loss         | 1.51e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.796    |
| fps                | 854      |
| nupdates           | 1888900  |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | -5.83    |
| fps                | 853      |
| nupdates           | 1891600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9458000  |
| value_loss         | 0.00222  |
---------------------------------
---------------------------------
| explained_variance | -68      |
| fps                | 853      |
| nupdates           | 1891700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9458500  |
| value_loss         | 0.0084   |
---------------------------------
---------------------------------
| explained_variance | 0.679    |
| fps                | 853      |
| nupdates           | 1891800  |
| policy_entropy     | 2.04     |
| total_timesteps    | 9459000  |
| value_loss         | 0.000109 |
---------------------------------
---------------------------------
| explained_variance | -0.433   |
| fps                | 853      |
| nupdates           | 1891900  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.954    |
| fps                | 854      |
| nupdates           | 1894700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9473500  |
| value_loss         | 3e-05    |
---------------------------------
---------------------------------
| explained_variance | -269     |
| fps                | 854      |
| nupdates           | 1894800  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9474000  |
| value_loss         | 0.0913   |
---------------------------------
---------------------------------
| explained_variance | -15.7    |
| fps                | 854      |
| nupdates           | 1894900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9474500  |
| value_loss         | 0.00186  |
---------------------------------
Eval num_timesteps=9475000, episode_reward=-4.80 +/- 0.40
Episode length: 705.60 +/- 94.52
---------------------------------
| explained_variance | 0.492    |
| fps                | 85

---------------------------------
| explained_variance | -0.981   |
| fps                | 853      |
| nupdates           | 1897700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9488500  |
| value_loss         | 0.00112  |
---------------------------------
---------------------------------
| explained_variance | 0.946    |
| fps                | 853      |
| nupdates           | 1897800  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9489000  |
| value_loss         | 0.000246 |
---------------------------------
---------------------------------
| explained_variance | -0.00816 |
| fps                | 854      |
| nupdates           | 1897900  |
| policy_entropy     | 2.03     |
| total_timesteps    | 9489500  |
| value_loss         | 0.158    |
---------------------------------
---------------------------------
| explained_variance | 0.671    |
| fps                | 854      |
| nupdates           | 1898000  |
| policy_entropy     | 2        |
| total_timest

---------------------------------
| explained_variance | 0.967    |
| fps                | 853      |
| nupdates           | 1900700  |
| policy_entropy     | 2.05     |
| total_timesteps    | 9503500  |
| value_loss         | 5.65e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.117    |
| fps                | 853      |
| nupdates           | 1900800  |
| policy_entropy     | 2.04     |
| total_timesteps    | 9504000  |
| value_loss         | 0.000485 |
---------------------------------
---------------------------------
| explained_variance | 0.528    |
| fps                | 853      |
| nupdates           | 1900900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9504500  |
| value_loss         | 2.14e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.841    |
| fps                | 853      |
| nupdates           | 1901000  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.983    |
| fps                | 854      |
| nupdates           | 1903800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9519000  |
| value_loss         | 2.05e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.989    |
| fps                | 854      |
| nupdates           | 1903900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9519500  |
| value_loss         | 0.00182  |
---------------------------------
---------------------------------
| explained_variance | 0.974    |
| fps                | 854      |
| nupdates           | 1904000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9520000  |
| value_loss         | 1.62e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.969    |
| fps                | 854      |
| nupdates           | 1904100  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.598    |
| fps                | 854      |
| nupdates           | 1906800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9534000  |
| value_loss         | 2.16e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.863    |
| fps                | 854      |
| nupdates           | 1906900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9534500  |
| value_loss         | 0.000176 |
---------------------------------
---------------------------------
| explained_variance | 0.946    |
| fps                | 854      |
| nupdates           | 1907000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9535000  |
| value_loss         | 2.2e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.754    |
| fps                | 854      |
| nupdates           | 1907100  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.829    |
| fps                | 854      |
| nupdates           | 1909900  |
| policy_entropy     | 2.03     |
| total_timesteps    | 9549500  |
| value_loss         | 9.75e-05 |
---------------------------------
Eval num_timesteps=9550000, episode_reward=-4.90 +/- 0.30
Episode length: 644.80 +/- 114.24
---------------------------------
| explained_variance | 0.827    |
| fps                | 853      |
| nupdates           | 1910000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9550000  |
| value_loss         | 1.18e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.255    |
| fps                | 853      |
| nupdates           | 1910100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9550500  |
| value_loss         | 0.000261 |
---------------------------------
---------------------------------
| explained_variance | 0.0421   |
| fps                | 8

---------------------------------
| explained_variance | 0.79     |
| fps                | 854      |
| nupdates           | 1912900  |
| policy_entropy     | 2.01     |
| total_timesteps    | 9564500  |
| value_loss         | 1.95e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.406    |
| fps                | 854      |
| nupdates           | 1913000  |
| policy_entropy     | 2.01     |
| total_timesteps    | 9565000  |
| value_loss         | 0.000193 |
---------------------------------
----------------------------------
| explained_variance | -6.65e+03 |
| fps                | 854       |
| nupdates           | 1913100   |
| policy_entropy     | 1.99      |
| total_timesteps    | 9565500   |
| value_loss         | 0.112     |
----------------------------------
---------------------------------
| explained_variance | 0.86     |
| fps                | 854      |
| nupdates           | 1913200  |
| policy_entropy     | 2.05     |
| tota

---------------------------------
| explained_variance | 0.718    |
| fps                | 854      |
| nupdates           | 1915900  |
| policy_entropy     | 0.757    |
| total_timesteps    | 9579500  |
| value_loss         | 0.000763 |
---------------------------------
---------------------------------
| explained_variance | 0.962    |
| fps                | 854      |
| nupdates           | 1916000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9580000  |
| value_loss         | 1.15e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.138    |
| fps                | 854      |
| nupdates           | 1916100  |
| policy_entropy     | 2.08     |
| total_timesteps    | 9580500  |
| value_loss         | 0.000192 |
---------------------------------
---------------------------------
| explained_variance | 0.237    |
| fps                | 854      |
| nupdates           | 1916200  |
| policy_entropy     | 2.01     |
| total_timest

---------------------------------
| explained_variance | 0.967    |
| fps                | 854      |
| nupdates           | 1919000  |
| policy_entropy     | 1.92     |
| total_timesteps    | 9595000  |
| value_loss         | 3.23e-05 |
---------------------------------
---------------------------------
| explained_variance | -323     |
| fps                | 854      |
| nupdates           | 1919100  |
| policy_entropy     | 2.04     |
| total_timesteps    | 9595500  |
| value_loss         | 0.0267   |
---------------------------------
---------------------------------
| explained_variance | 0.568    |
| fps                | 854      |
| nupdates           | 1919200  |
| policy_entropy     | 2.04     |
| total_timesteps    | 9596000  |
| value_loss         | 0.000378 |
---------------------------------
---------------------------------
| explained_variance | -1.27    |
| fps                | 854      |
| nupdates           | 1919300  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -1.32    |
| fps                | 854      |
| nupdates           | 1922000  |
| policy_entropy     | 1.99     |
| total_timesteps    | 9610000  |
| value_loss         | 0.0122   |
---------------------------------
---------------------------------
| explained_variance | 0.205    |
| fps                | 854      |
| nupdates           | 1922100  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9610500  |
| value_loss         | 1.19e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.124   |
| fps                | 854      |
| nupdates           | 1922200  |
| policy_entropy     | 2.08     |
| total_timesteps    | 9611000  |
| value_loss         | 0.000121 |
---------------------------------
---------------------------------
| explained_variance | -215     |
| fps                | 854      |
| nupdates           | 1922300  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.978    |
| fps                | 854      |
| nupdates           | 1925100  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9625500  |
| value_loss         | 5.39e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.547    |
| fps                | 854      |
| nupdates           | 1925200  |
| policy_entropy     | 2.05     |
| total_timesteps    | 9626000  |
| value_loss         | 0.000297 |
---------------------------------
---------------------------------
| explained_variance | 0.329    |
| fps                | 854      |
| nupdates           | 1925300  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9626500  |
| value_loss         | 8.56e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.94     |
| fps                | 854      |
| nupdates           | 1925400  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.549    |
| fps                | 854      |
| nupdates           | 1928200  |
| policy_entropy     | 2.03     |
| total_timesteps    | 9641000  |
| value_loss         | 6.38e-05 |
---------------------------------
---------------------------------
| explained_variance | -7.38    |
| fps                | 854      |
| nupdates           | 1928300  |
| policy_entropy     | 2.04     |
| total_timesteps    | 9641500  |
| value_loss         | 0.00254  |
---------------------------------
---------------------------------
| explained_variance | -3.24    |
| fps                | 854      |
| nupdates           | 1928400  |
| policy_entropy     | 2.05     |
| total_timesteps    | 9642000  |
| value_loss         | 0.000444 |
---------------------------------
---------------------------------
| explained_variance | 0.593    |
| fps                | 854      |
| nupdates           | 1928500  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.566    |
| fps                | 854      |
| nupdates           | 1931200  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9656000  |
| value_loss         | 0.000205 |
---------------------------------
---------------------------------
| explained_variance | -47.4    |
| fps                | 854      |
| nupdates           | 1931300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9656500  |
| value_loss         | 0.00484  |
---------------------------------
---------------------------------
| explained_variance | 0.164    |
| fps                | 854      |
| nupdates           | 1931400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9657000  |
| value_loss         | 0.000118 |
---------------------------------
---------------------------------
| explained_variance | 0.423    |
| fps                | 854      |
| nupdates           | 1931500  |
| policy_entropy     | 2.02     |
| total_timest

---------------------------------
| explained_variance | 0.916    |
| fps                | 854      |
| nupdates           | 1934300  |
| policy_entropy     | 1.96     |
| total_timesteps    | 9671500  |
| value_loss         | 0.0001   |
---------------------------------
---------------------------------
| explained_variance | -0.905   |
| fps                | 854      |
| nupdates           | 1934400  |
| policy_entropy     | 2.05     |
| total_timesteps    | 9672000  |
| value_loss         | 0.000144 |
---------------------------------
---------------------------------
| explained_variance | 0.168    |
| fps                | 854      |
| nupdates           | 1934500  |
| policy_entropy     | 2.08     |
| total_timesteps    | 9672500  |
| value_loss         | 4.04e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.375    |
| fps                | 854      |
| nupdates           | 1934600  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.715    |
| fps                | 854      |
| nupdates           | 1937300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9686500  |
| value_loss         | 0.000218 |
---------------------------------
---------------------------------
| explained_variance | 0.98     |
| fps                | 854      |
| nupdates           | 1937400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9687000  |
| value_loss         | 3.27e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.0669   |
| fps                | 854      |
| nupdates           | 1937500  |
| policy_entropy     | 2.08     |
| total_timesteps    | 9687500  |
| value_loss         | 0.000287 |
---------------------------------
---------------------------------
| explained_variance | 0.965    |
| fps                | 854      |
| nupdates           | 1937600  |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | -9.3     |
| fps                | 854      |
| nupdates           | 1940300  |
| policy_entropy     | 2.03     |
| total_timesteps    | 9701500  |
| value_loss         | 0.000292 |
---------------------------------
---------------------------------
| explained_variance | -4.06    |
| fps                | 854      |
| nupdates           | 1940400  |
| policy_entropy     | 2.05     |
| total_timesteps    | 9702000  |
| value_loss         | 6.4e-05  |
---------------------------------
---------------------------------
| explained_variance | -3.56    |
| fps                | 854      |
| nupdates           | 1940500  |
| policy_entropy     | 2.04     |
| total_timesteps    | 9702500  |
| value_loss         | 0.000545 |
---------------------------------
---------------------------------
| explained_variance | -0.0618  |
| fps                | 854      |
| nupdates           | 1940600  |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | 0.578    |
| fps                | 854      |
| nupdates           | 1943400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9717000  |
| value_loss         | 0.000125 |
---------------------------------
---------------------------------
| explained_variance | -47.4    |
| fps                | 854      |
| nupdates           | 1943500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9717500  |
| value_loss         | 0.0283   |
---------------------------------
---------------------------------
| explained_variance | 0.824    |
| fps                | 854      |
| nupdates           | 1943600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9718000  |
| value_loss         | 5.75e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.0943   |
| fps                | 854      |
| nupdates           | 1943700  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.484   |
| fps                | 854      |
| nupdates           | 1946400  |
| policy_entropy     | 2.04     |
| total_timesteps    | 9732000  |
| value_loss         | 0.00089  |
---------------------------------
---------------------------------
| explained_variance | -0.315   |
| fps                | 854      |
| nupdates           | 1946500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9732500  |
| value_loss         | 0.000353 |
---------------------------------
---------------------------------
| explained_variance | 0.652    |
| fps                | 854      |
| nupdates           | 1946600  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9733000  |
| value_loss         | 0.000163 |
---------------------------------
---------------------------------
| explained_variance | -0.112   |
| fps                | 854      |
| nupdates           | 1946700  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -1.48    |
| fps                | 854      |
| nupdates           | 1949500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9747500  |
| value_loss         | 0.000186 |
---------------------------------
---------------------------------
| explained_variance | 0.722    |
| fps                | 854      |
| nupdates           | 1949600  |
| policy_entropy     | 1.99     |
| total_timesteps    | 9748000  |
| value_loss         | 9.35e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.584    |
| fps                | 854      |
| nupdates           | 1949700  |
| policy_entropy     | 2.05     |
| total_timesteps    | 9748500  |
| value_loss         | 0.00012  |
---------------------------------
---------------------------------
| explained_variance | 0.976    |
| fps                | 854      |
| nupdates           | 1949800  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -1.04    |
| fps                | 854      |
| nupdates           | 1952500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9762500  |
| value_loss         | 0.000141 |
---------------------------------
---------------------------------
| explained_variance | 0.0813   |
| fps                | 854      |
| nupdates           | 1952600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9763000  |
| value_loss         | 0.000242 |
---------------------------------
---------------------------------
| explained_variance | 0.384    |
| fps                | 854      |
| nupdates           | 1952700  |
| policy_entropy     | 1.98     |
| total_timesteps    | 9763500  |
| value_loss         | 0.000296 |
---------------------------------
---------------------------------
| explained_variance | 0.873    |
| fps                | 854      |
| nupdates           | 1952800  |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | 0.625    |
| fps                | 853      |
| nupdates           | 1955500  |
| policy_entropy     | 2.04     |
| total_timesteps    | 9777500  |
| value_loss         | 0.000168 |
---------------------------------
---------------------------------
| explained_variance | 0.446    |
| fps                | 853      |
| nupdates           | 1955600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9778000  |
| value_loss         | 2.28e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.246    |
| fps                | 853      |
| nupdates           | 1955700  |
| policy_entropy     | 1.99     |
| total_timesteps    | 9778500  |
| value_loss         | 0.000219 |
---------------------------------
----------------------------------
| explained_variance | -7.55e+03 |
| fps                | 853       |
| nupdates           | 1955800   |
| policy_entropy     | 2         |
| total_t

---------------------------------
| explained_variance | 0.727    |
| fps                | 853      |
| nupdates           | 1958600  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9793000  |
| value_loss         | 0.000239 |
---------------------------------
---------------------------------
| explained_variance | 0.752    |
| fps                | 853      |
| nupdates           | 1958700  |
| policy_entropy     | 2.05     |
| total_timesteps    | 9793500  |
| value_loss         | 0.000307 |
---------------------------------
---------------------------------
| explained_variance | 0.886    |
| fps                | 853      |
| nupdates           | 1958800  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9794000  |
| value_loss         | 9.5e-06  |
---------------------------------
---------------------------------
| explained_variance | 0.222    |
| fps                | 853      |
| nupdates           | 1958900  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.65     |
| fps                | 853      |
| nupdates           | 1961600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9808000  |
| value_loss         | 0.000153 |
---------------------------------
---------------------------------
| explained_variance | 0.859    |
| fps                | 853      |
| nupdates           | 1961700  |
| policy_entropy     | 2.05     |
| total_timesteps    | 9808500  |
| value_loss         | 2.71e-05 |
---------------------------------
---------------------------------
| explained_variance | -22.7    |
| fps                | 853      |
| nupdates           | 1961800  |
| policy_entropy     | 1.94     |
| total_timesteps    | 9809000  |
| value_loss         | 0.0164   |
---------------------------------
---------------------------------
| explained_variance | 0.417    |
| fps                | 853      |
| nupdates           | 1961900  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.827    |
| fps                | 853      |
| nupdates           | 1964700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9823500  |
| value_loss         | 4.43e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.999    |
| fps                | 853      |
| nupdates           | 1964800  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9824000  |
| value_loss         | 3.12e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.381    |
| fps                | 853      |
| nupdates           | 1964900  |
| policy_entropy     | 2.05     |
| total_timesteps    | 9824500  |
| value_loss         | 7.46e-05 |
---------------------------------
Eval num_timesteps=9825000, episode_reward=-4.90 +/- 0.30
Episode length: 808.00 +/- 202.74
---------------------------------
| explained_variance | -7.81    |
| fps                | 8

---------------------------------
| explained_variance | 0.218    |
| fps                | 853      |
| nupdates           | 1967700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9838500  |
| value_loss         | 0.000153 |
---------------------------------
---------------------------------
| explained_variance | 0.189    |
| fps                | 853      |
| nupdates           | 1967800  |
| policy_entropy     | 2.08     |
| total_timesteps    | 9839000  |
| value_loss         | 0.000103 |
---------------------------------
---------------------------------
| explained_variance | 0.999    |
| fps                | 853      |
| nupdates           | 1967900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9839500  |
| value_loss         | 5.99e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.853    |
| fps                | 853      |
| nupdates           | 1968000  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.858    |
| fps                | 853      |
| nupdates           | 1970700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9853500  |
| value_loss         | 2.25e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.353    |
| fps                | 853      |
| nupdates           | 1970800  |
| policy_entropy     | 1.98     |
| total_timesteps    | 9854000  |
| value_loss         | 0.103    |
---------------------------------
---------------------------------
| explained_variance | 0.952    |
| fps                | 853      |
| nupdates           | 1970900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9854500  |
| value_loss         | 6.81e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.96     |
| fps                | 853      |
| nupdates           | 1971000  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -3.04    |
| fps                | 854      |
| nupdates           | 1973800  |
| policy_entropy     | 2.03     |
| total_timesteps    | 9869000  |
| value_loss         | 4.94e-05 |
---------------------------------
---------------------------------
| explained_variance | -20.3    |
| fps                | 854      |
| nupdates           | 1973900  |
| policy_entropy     | 2.03     |
| total_timesteps    | 9869500  |
| value_loss         | 0.0022   |
---------------------------------
---------------------------------
| explained_variance | 0.864    |
| fps                | 854      |
| nupdates           | 1974000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9870000  |
| value_loss         | 7.62e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.588    |
| fps                | 854      |
| nupdates           | 1974100  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.0396   |
| fps                | 854      |
| nupdates           | 1976800  |
| policy_entropy     | 2.04     |
| total_timesteps    | 9884000  |
| value_loss         | 0.00023  |
---------------------------------
---------------------------------
| explained_variance | -0.355   |
| fps                | 854      |
| nupdates           | 1976900  |
| policy_entropy     | 2.05     |
| total_timesteps    | 9884500  |
| value_loss         | 0.000165 |
---------------------------------
---------------------------------
| explained_variance | -73.2    |
| fps                | 854      |
| nupdates           | 1977000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9885000  |
| value_loss         | 0.00399  |
---------------------------------
---------------------------------
| explained_variance | 0.971    |
| fps                | 854      |
| nupdates           | 1977100  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.243   |
| fps                | 854      |
| nupdates           | 1979900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9899500  |
| value_loss         | 0.000176 |
---------------------------------
Eval num_timesteps=9900000, episode_reward=-4.90 +/- 0.30
Episode length: 607.90 +/- 79.04
---------------------------------
| explained_variance | 0.9      |
| fps                | 854      |
| nupdates           | 1980000  |
| policy_entropy     | 2.04     |
| total_timesteps    | 9900000  |
| value_loss         | 0.000336 |
---------------------------------
---------------------------------
| explained_variance | 0.866    |
| fps                | 854      |
| nupdates           | 1980100  |
| policy_entropy     | 2.04     |
| total_timesteps    | 9900500  |
| value_loss         | 1.12e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.617    |
| fps                | 85

---------------------------------
| explained_variance | -0.287   |
| fps                | 854      |
| nupdates           | 1982900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9914500  |
| value_loss         | 0.000341 |
---------------------------------
---------------------------------
| explained_variance | 0.994    |
| fps                | 854      |
| nupdates           | 1983000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9915000  |
| value_loss         | 1.83e-06 |
---------------------------------
---------------------------------
| explained_variance | -14.5    |
| fps                | 854      |
| nupdates           | 1983100  |
| policy_entropy     | 2.05     |
| total_timesteps    | 9915500  |
| value_loss         | 0.00675  |
---------------------------------
---------------------------------
| explained_variance | 0.972    |
| fps                | 854      |
| nupdates           | 1983200  |
| policy_entropy     | 1.95     |
| total_timest

---------------------------------
| explained_variance | 0.987    |
| fps                | 854      |
| nupdates           | 1985900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9929500  |
| value_loss         | 0.00123  |
---------------------------------
---------------------------------
| explained_variance | 0.464    |
| fps                | 854      |
| nupdates           | 1986000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9930000  |
| value_loss         | 0.000194 |
---------------------------------
---------------------------------
| explained_variance | 0.79     |
| fps                | 854      |
| nupdates           | 1986100  |
| policy_entropy     | 1.85     |
| total_timesteps    | 9930500  |
| value_loss         | 0.000642 |
---------------------------------
---------------------------------
| explained_variance | 0.984    |
| fps                | 854      |
| nupdates           | 1986200  |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | 0.131    |
| fps                | 854      |
| nupdates           | 1989000  |
| policy_entropy     | 2.03     |
| total_timesteps    | 9945000  |
| value_loss         | 0.000105 |
---------------------------------
---------------------------------
| explained_variance | 0.879    |
| fps                | 854      |
| nupdates           | 1989100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9945500  |
| value_loss         | 0.000115 |
---------------------------------
---------------------------------
| explained_variance | 0.84     |
| fps                | 854      |
| nupdates           | 1989200  |
| policy_entropy     | 2.05     |
| total_timesteps    | 9946000  |
| value_loss         | 7.52e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.933    |
| fps                | 854      |
| nupdates           | 1989300  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.793    |
| fps                | 854      |
| nupdates           | 1992000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9960000  |
| value_loss         | 0.000118 |
---------------------------------
---------------------------------
| explained_variance | 0.138    |
| fps                | 854      |
| nupdates           | 1992100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9960500  |
| value_loss         | 0.000114 |
---------------------------------
---------------------------------
| explained_variance | 0.986    |
| fps                | 854      |
| nupdates           | 1992200  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9961000  |
| value_loss         | 2.12e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.613    |
| fps                | 854      |
| nupdates           | 1992300  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.363    |
| fps                | 854      |
| nupdates           | 1995100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 9975500  |
| value_loss         | 0.15     |
---------------------------------
---------------------------------
| explained_variance | 0.892    |
| fps                | 854      |
| nupdates           | 1995200  |
| policy_entropy     | 2.06     |
| total_timesteps    | 9976000  |
| value_loss         | 4.15e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.166   |
| fps                | 854      |
| nupdates           | 1995300  |
| policy_entropy     | 2.05     |
| total_timesteps    | 9976500  |
| value_loss         | 0.00106  |
---------------------------------
---------------------------------
| explained_variance | 0.832    |
| fps                | 854      |
| nupdates           | 1995400  |
| policy_entropy     | 2.02     |
| total_timest

---------------------------------
| explained_variance | 0.325    |
| fps                | 854      |
| nupdates           | 1998200  |
| policy_entropy     | 1.96     |
| total_timesteps    | 9991000  |
| value_loss         | 0.000141 |
---------------------------------
---------------------------------
| explained_variance | 0.975    |
| fps                | 854      |
| nupdates           | 1998300  |
| policy_entropy     | 2.02     |
| total_timesteps    | 9991500  |
| value_loss         | 0.00192  |
---------------------------------
---------------------------------
| explained_variance | 0.347    |
| fps                | 854      |
| nupdates           | 1998400  |
| policy_entropy     | 2.02     |
| total_timesteps    | 9992000  |
| value_loss         | 7.63e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.66    |
| fps                | 854      |
| nupdates           | 1998500  |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | 0.936    |
| fps                | 854      |
| nupdates           | 2001200  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10006000 |
| value_loss         | 5.06e-06 |
---------------------------------
---------------------------------
| explained_variance | -1.51    |
| fps                | 854      |
| nupdates           | 2001300  |
| policy_entropy     | 2.03     |
| total_timesteps    | 10006500 |
| value_loss         | 0.000265 |
---------------------------------
---------------------------------
| explained_variance | 0.775    |
| fps                | 854      |
| nupdates           | 2001400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10007000 |
| value_loss         | 6.09e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.955    |
| fps                | 854      |
| nupdates           | 2001500  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -0.713   |
| fps                | 854      |
| nupdates           | 2004300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10021500 |
| value_loss         | 0.000169 |
---------------------------------
---------------------------------
| explained_variance | 0.132    |
| fps                | 854      |
| nupdates           | 2004400  |
| policy_entropy     | 2.04     |
| total_timesteps    | 10022000 |
| value_loss         | 8.98e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.843    |
| fps                | 855      |
| nupdates           | 2004500  |
| policy_entropy     | 2.04     |
| total_timesteps    | 10022500 |
| value_loss         | 0.000128 |
---------------------------------
---------------------------------
| explained_variance | 0.983    |
| fps                | 855      |
| nupdates           | 2004600  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.868    |
| fps                | 855      |
| nupdates           | 2007300  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10036500 |
| value_loss         | 7.56e-06 |
---------------------------------
---------------------------------
| explained_variance | -0.108   |
| fps                | 855      |
| nupdates           | 2007400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10037000 |
| value_loss         | 3e-05    |
---------------------------------
---------------------------------
| explained_variance | -0.82    |
| fps                | 855      |
| nupdates           | 2007500  |
| policy_entropy     | 2.08     |
| total_timesteps    | 10037500 |
| value_loss         | 0.000349 |
---------------------------------
---------------------------------
| explained_variance | -639     |
| fps                | 855      |
| nupdates           | 2007600  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.407    |
| fps                | 855      |
| nupdates           | 2010300  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10051500 |
| value_loss         | 0.00016  |
---------------------------------
---------------------------------
| explained_variance | -6.2     |
| fps                | 855      |
| nupdates           | 2010400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10052000 |
| value_loss         | 0.00258  |
---------------------------------
----------------------------------
| explained_variance | -1.47e+03 |
| fps                | 855       |
| nupdates           | 2010500   |
| policy_entropy     | 2.04      |
| total_timesteps    | 10052500  |
| value_loss         | 0.0917    |
----------------------------------
---------------------------------
| explained_variance | 0.903    |
| fps                | 855      |
| nupdates           | 2010600  |
| policy_entropy     | 2.06     |
| tota

---------------------------------
| explained_variance | 0.833    |
| fps                | 855      |
| nupdates           | 2013400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10067000 |
| value_loss         | 1.71e-05 |
---------------------------------
---------------------------------
| explained_variance | -4.58    |
| fps                | 855      |
| nupdates           | 2013500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10067500 |
| value_loss         | 0.00201  |
---------------------------------
---------------------------------
| explained_variance | 0.208    |
| fps                | 855      |
| nupdates           | 2013600  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10068000 |
| value_loss         | 4.83e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.963    |
| fps                | 855      |
| nupdates           | 2013700  |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | 0.942    |
| fps                | 855      |
| nupdates           | 2016400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10082000 |
| value_loss         | 1.43e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.21     |
| fps                | 855      |
| nupdates           | 2016500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10082500 |
| value_loss         | 0.000428 |
---------------------------------
---------------------------------
| explained_variance | -1.1     |
| fps                | 855      |
| nupdates           | 2016600  |
| policy_entropy     | 2.02     |
| total_timesteps    | 10083000 |
| value_loss         | 0.000256 |
---------------------------------
---------------------------------
| explained_variance | 0.0838   |
| fps                | 855      |
| nupdates           | 2016700  |
| policy_entropy     | 1.99     |
| total_timest

---------------------------------
| explained_variance | 0.897    |
| fps                | 855      |
| nupdates           | 2019500  |
| policy_entropy     | 1.97     |
| total_timesteps    | 10097500 |
| value_loss         | 4.7e-05  |
---------------------------------
---------------------------------
| explained_variance | -9.8     |
| fps                | 855      |
| nupdates           | 2019600  |
| policy_entropy     | 2.05     |
| total_timesteps    | 10098000 |
| value_loss         | 0.000927 |
---------------------------------
---------------------------------
| explained_variance | 0.887    |
| fps                | 855      |
| nupdates           | 2019700  |
| policy_entropy     | 2.08     |
| total_timesteps    | 10098500 |
| value_loss         | 2.27e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.972    |
| fps                | 855      |
| nupdates           | 2019800  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -1.25    |
| fps                | 855      |
| nupdates           | 2022500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10112500 |
| value_loss         | 0.000101 |
---------------------------------
---------------------------------
| explained_variance | 0.797    |
| fps                | 855      |
| nupdates           | 2022600  |
| policy_entropy     | 2.05     |
| total_timesteps    | 10113000 |
| value_loss         | 6.32e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.858    |
| fps                | 855      |
| nupdates           | 2022700  |
| policy_entropy     | 2.05     |
| total_timesteps    | 10113500 |
| value_loss         | 5.44e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.972    |
| fps                | 855      |
| nupdates           | 2022800  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.438    |
| fps                | 855      |
| nupdates           | 2025500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10127500 |
| value_loss         | 1.64e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.296    |
| fps                | 855      |
| nupdates           | 2025600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10128000 |
| value_loss         | 0.000263 |
---------------------------------
---------------------------------
| explained_variance | 0.938    |
| fps                | 855      |
| nupdates           | 2025700  |
| policy_entropy     | 2.08     |
| total_timesteps    | 10128500 |
| value_loss         | 2.7e-05  |
---------------------------------
----------------------------------
| explained_variance | -1.84e+04 |
| fps                | 855       |
| nupdates           | 2025800   |
| policy_entropy     | 2.07      |
| total_t

---------------------------------
| explained_variance | 0.937    |
| fps                | 855      |
| nupdates           | 2028600  |
| policy_entropy     | 2.08     |
| total_timesteps    | 10143000 |
| value_loss         | 0.000144 |
---------------------------------
---------------------------------
| explained_variance | 0.0173   |
| fps                | 855      |
| nupdates           | 2028700  |
| policy_entropy     | 2.05     |
| total_timesteps    | 10143500 |
| value_loss         | 0.159    |
---------------------------------
---------------------------------
| explained_variance | 0.968    |
| fps                | 855      |
| nupdates           | 2028800  |
| policy_entropy     | 2.04     |
| total_timesteps    | 10144000 |
| value_loss         | 1.97e-05 |
---------------------------------
---------------------------------
| explained_variance | -7       |
| fps                | 855      |
| nupdates           | 2028900  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.68     |
| fps                | 855      |
| nupdates           | 2031600  |
| policy_entropy     | 2.01     |
| total_timesteps    | 10158000 |
| value_loss         | 0.000123 |
---------------------------------
---------------------------------
| explained_variance | 0.984    |
| fps                | 855      |
| nupdates           | 2031700  |
| policy_entropy     | 2.04     |
| total_timesteps    | 10158500 |
| value_loss         | 9.18e-06 |
---------------------------------
---------------------------------
| explained_variance | -0.0482  |
| fps                | 855      |
| nupdates           | 2031800  |
| policy_entropy     | 0.762    |
| total_timesteps    | 10159000 |
| value_loss         | 0.9      |
---------------------------------
---------------------------------
| explained_variance | 0.886    |
| fps                | 855      |
| nupdates           | 2031900  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.0135  |
| fps                | 856      |
| nupdates           | 2034700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10173500 |
| value_loss         | 0.000143 |
---------------------------------
---------------------------------
| explained_variance | -14      |
| fps                | 856      |
| nupdates           | 2034800  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10174000 |
| value_loss         | 0.00199  |
---------------------------------
---------------------------------
| explained_variance | 0.987    |
| fps                | 856      |
| nupdates           | 2034900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10174500 |
| value_loss         | 2.44e-06 |
---------------------------------
Eval num_timesteps=10175000, episode_reward=-5.00 +/- 0.00
Episode length: 602.40 +/- 104.29
---------------------------------
| explained_variance | 0.0633   |
| fps                | 

---------------------------------
| explained_variance | -0.287   |
| fps                | 856      |
| nupdates           | 2037700  |
| policy_entropy     | 2.03     |
| total_timesteps    | 10188500 |
| value_loss         | 3.46e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.838    |
| fps                | 856      |
| nupdates           | 2037800  |
| policy_entropy     | 2.04     |
| total_timesteps    | 10189000 |
| value_loss         | 2.06e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.991    |
| fps                | 856      |
| nupdates           | 2037900  |
| policy_entropy     | 2.03     |
| total_timesteps    | 10189500 |
| value_loss         | 3.47e-06 |
---------------------------------
---------------------------------
| explained_variance | -0.56    |
| fps                | 856      |
| nupdates           | 2038000  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.702   |
| fps                | 856      |
| nupdates           | 2040700  |
| policy_entropy     | 2.05     |
| total_timesteps    | 10203500 |
| value_loss         | 0.000354 |
---------------------------------
---------------------------------
| explained_variance | 0.293    |
| fps                | 856      |
| nupdates           | 2040800  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10204000 |
| value_loss         | 5.74e-05 |
---------------------------------
---------------------------------
| explained_variance | -44.6    |
| fps                | 856      |
| nupdates           | 2040900  |
| policy_entropy     | 2        |
| total_timesteps    | 10204500 |
| value_loss         | 0.0022   |
---------------------------------
---------------------------------
| explained_variance | 0.0891   |
| fps                | 856      |
| nupdates           | 2041000  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.013   |
| fps                | 856      |
| nupdates           | 2043800  |
| policy_entropy     | 2.04     |
| total_timesteps    | 10219000 |
| value_loss         | 0.000116 |
---------------------------------
---------------------------------
| explained_variance | 0.901    |
| fps                | 856      |
| nupdates           | 2043900  |
| policy_entropy     | 2.05     |
| total_timesteps    | 10219500 |
| value_loss         | 6.69e-05 |
---------------------------------
----------------------------------
| explained_variance | -0.000174 |
| fps                | 856       |
| nupdates           | 2044000   |
| policy_entropy     | 2.05      |
| total_timesteps    | 10220000  |
| value_loss         | 0.157     |
----------------------------------
---------------------------------
| explained_variance | 0.344    |
| fps                | 856      |
| nupdates           | 2044100  |
| policy_entropy     | 1.98     |
| tota

---------------------------------
| explained_variance | 0.925    |
| fps                | 856      |
| nupdates           | 2046800  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10234000 |
| value_loss         | 0.000133 |
---------------------------------
---------------------------------
| explained_variance | 0.176    |
| fps                | 856      |
| nupdates           | 2046900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10234500 |
| value_loss         | 1.86e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.326    |
| fps                | 856      |
| nupdates           | 2047000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10235000 |
| value_loss         | 7.68e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.07    |
| fps                | 856      |
| nupdates           | 2047100  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.418    |
| fps                | 856      |
| nupdates           | 2049900  |
| policy_entropy     | 2.05     |
| total_timesteps    | 10249500 |
| value_loss         | 5.8e-05  |
---------------------------------
Eval num_timesteps=10250000, episode_reward=-4.90 +/- 0.30
Episode length: 576.40 +/- 92.67
---------------------------------
| explained_variance | -1.19    |
| fps                | 856      |
| nupdates           | 2050000  |
| policy_entropy     | 2.02     |
| total_timesteps    | 10250000 |
| value_loss         | 0.000125 |
---------------------------------
---------------------------------
| explained_variance | 0.818    |
| fps                | 856      |
| nupdates           | 2050100  |
| policy_entropy     | 2.04     |
| total_timesteps    | 10250500 |
| value_loss         | 5.07e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.314   |
| fps                | 8

---------------------------------
| explained_variance | 0.987    |
| fps                | 856      |
| nupdates           | 2052900  |
| policy_entropy     | 2.05     |
| total_timesteps    | 10264500 |
| value_loss         | 1.47e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.556    |
| fps                | 856      |
| nupdates           | 2053000  |
| policy_entropy     | 1.99     |
| total_timesteps    | 10265000 |
| value_loss         | 7.62e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.674    |
| fps                | 856      |
| nupdates           | 2053100  |
| policy_entropy     | 2.04     |
| total_timesteps    | 10265500 |
| value_loss         | 0.0001   |
---------------------------------
---------------------------------
| explained_variance | 0.241    |
| fps                | 856      |
| nupdates           | 2053200  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.86     |
| fps                | 856      |
| nupdates           | 2055900  |
| policy_entropy     | 2.01     |
| total_timesteps    | 10279500 |
| value_loss         | 0.000513 |
---------------------------------
---------------------------------
| explained_variance | 0.73     |
| fps                | 856      |
| nupdates           | 2056000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10280000 |
| value_loss         | 2.59e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.17    |
| fps                | 856      |
| nupdates           | 2056100  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10280500 |
| value_loss         | 0.000382 |
---------------------------------
---------------------------------
| explained_variance | -3.45    |
| fps                | 856      |
| nupdates           | 2056200  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.634    |
| fps                | 856      |
| nupdates           | 2059000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10295000 |
| value_loss         | 6.77e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.994    |
| fps                | 856      |
| nupdates           | 2059100  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10295500 |
| value_loss         | 1.77e-06 |
---------------------------------
---------------------------------
| explained_variance | -1.05    |
| fps                | 856      |
| nupdates           | 2059200  |
| policy_entropy     | 2.02     |
| total_timesteps    | 10296000 |
| value_loss         | 0.000621 |
---------------------------------
---------------------------------
| explained_variance | -0.994   |
| fps                | 856      |
| nupdates           | 2059300  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.39    |
| fps                | 856      |
| nupdates           | 2062000  |
| policy_entropy     | 2.04     |
| total_timesteps    | 10310000 |
| value_loss         | 0.000164 |
---------------------------------
---------------------------------
| explained_variance | 0.62     |
| fps                | 856      |
| nupdates           | 2062100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10310500 |
| value_loss         | 0.00038  |
---------------------------------
---------------------------------
| explained_variance | 0.846    |
| fps                | 856      |
| nupdates           | 2062200  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10311000 |
| value_loss         | 0.000155 |
---------------------------------
---------------------------------
| explained_variance | 0.991    |
| fps                | 856      |
| nupdates           | 2062300  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.827    |
| fps                | 856      |
| nupdates           | 2065100  |
| policy_entropy     | 2.05     |
| total_timesteps    | 10325500 |
| value_loss         | 0.000224 |
---------------------------------
---------------------------------
| explained_variance | 0.981    |
| fps                | 856      |
| nupdates           | 2065200  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10326000 |
| value_loss         | 2.14e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.862    |
| fps                | 856      |
| nupdates           | 2065300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10326500 |
| value_loss         | 0.000225 |
---------------------------------
---------------------------------
| explained_variance | 0.777    |
| fps                | 856      |
| nupdates           | 2065400  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.988    |
| fps                | 856      |
| nupdates           | 2068200  |
| policy_entropy     | 2.08     |
| total_timesteps    | 10341000 |
| value_loss         | 5.24e-07 |
---------------------------------
---------------------------------
| explained_variance | 0.842    |
| fps                | 856      |
| nupdates           | 2068300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10341500 |
| value_loss         | 3.62e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.846    |
| fps                | 856      |
| nupdates           | 2068400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10342000 |
| value_loss         | 9.87e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.248    |
| fps                | 857      |
| nupdates           | 2068500  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.965    |
| fps                | 857      |
| nupdates           | 2071200  |
| policy_entropy     | 2.08     |
| total_timesteps    | 10356000 |
| value_loss         | 0.000193 |
---------------------------------
---------------------------------
| explained_variance | 0.913    |
| fps                | 857      |
| nupdates           | 2071300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10356500 |
| value_loss         | 2.13e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.125    |
| fps                | 857      |
| nupdates           | 2071400  |
| policy_entropy     | 2.04     |
| total_timesteps    | 10357000 |
| value_loss         | 7.7e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.735    |
| fps                | 857      |
| nupdates           | 2071500  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.984    |
| fps                | 857      |
| nupdates           | 2074300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10371500 |
| value_loss         | 0.00259  |
---------------------------------
---------------------------------
| explained_variance | 0.951    |
| fps                | 857      |
| nupdates           | 2074400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10372000 |
| value_loss         | 6.93e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.89    |
| fps                | 857      |
| nupdates           | 2074500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10372500 |
| value_loss         | 0.00249  |
---------------------------------
---------------------------------
| explained_variance | -5.31    |
| fps                | 857      |
| nupdates           | 2074600  |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | 0.398    |
| fps                | 857      |
| nupdates           | 2077300  |
| policy_entropy     | 2.04     |
| total_timesteps    | 10386500 |
| value_loss         | 0.000604 |
---------------------------------
---------------------------------
| explained_variance | -2.58    |
| fps                | 857      |
| nupdates           | 2077400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10387000 |
| value_loss         | 3.38e-05 |
---------------------------------
---------------------------------
| explained_variance | -3.53    |
| fps                | 857      |
| nupdates           | 2077500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10387500 |
| value_loss         | 0.000102 |
---------------------------------
---------------------------------
| explained_variance | 0.829    |
| fps                | 857      |
| nupdates           | 2077600  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.996    |
| fps                | 857      |
| nupdates           | 2080300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10401500 |
| value_loss         | 5.08e-06 |
---------------------------------
---------------------------------
| explained_variance | -0.418   |
| fps                | 857      |
| nupdates           | 2080400  |
| policy_entropy     | 2.08     |
| total_timesteps    | 10402000 |
| value_loss         | 0.000131 |
---------------------------------
---------------------------------
| explained_variance | 0.65     |
| fps                | 857      |
| nupdates           | 2080500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10402500 |
| value_loss         | 8.84e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.845    |
| fps                | 857      |
| nupdates           | 2080600  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.676   |
| fps                | 857      |
| nupdates           | 2083400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10417000 |
| value_loss         | 0.00109  |
---------------------------------
---------------------------------
| explained_variance | 0.888    |
| fps                | 857      |
| nupdates           | 2083500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10417500 |
| value_loss         | 1.68e-05 |
---------------------------------
---------------------------------
| explained_variance | -5.63    |
| fps                | 857      |
| nupdates           | 2083600  |
| policy_entropy     | 2.05     |
| total_timesteps    | 10418000 |
| value_loss         | 0.000395 |
---------------------------------
---------------------------------
| explained_variance | 0.322    |
| fps                | 857      |
| nupdates           | 2083700  |
| policy_entropy     | 1.9      |
| total_timest

---------------------------------
| explained_variance | 0.866    |
| fps                | 857      |
| nupdates           | 2086400  |
| policy_entropy     | 2.05     |
| total_timesteps    | 10432000 |
| value_loss         | 2.69e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.392    |
| fps                | 857      |
| nupdates           | 2086500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10432500 |
| value_loss         | 0.000742 |
---------------------------------
---------------------------------
| explained_variance | -0.00824 |
| fps                | 857      |
| nupdates           | 2086600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10433000 |
| value_loss         | 0.000873 |
---------------------------------
---------------------------------
| explained_variance | 0.554    |
| fps                | 857      |
| nupdates           | 2086700  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.978    |
| fps                | 857      |
| nupdates           | 2089500  |
| policy_entropy     | 2.05     |
| total_timesteps    | 10447500 |
| value_loss         | 2.85e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.579    |
| fps                | 857      |
| nupdates           | 2089600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10448000 |
| value_loss         | 6.01e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.71     |
| fps                | 857      |
| nupdates           | 2089700  |
| policy_entropy     | 2.05     |
| total_timesteps    | 10448500 |
| value_loss         | 7.65e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.921    |
| fps                | 857      |
| nupdates           | 2089800  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.629    |
| fps                | 857      |
| nupdates           | 2092500  |
| policy_entropy     | 2.08     |
| total_timesteps    | 10462500 |
| value_loss         | 0.000604 |
---------------------------------
---------------------------------
| explained_variance | 0.941    |
| fps                | 857      |
| nupdates           | 2092600  |
| policy_entropy     | 2.08     |
| total_timesteps    | 10463000 |
| value_loss         | 3.66e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.757    |
| fps                | 857      |
| nupdates           | 2092700  |
| policy_entropy     | 2.05     |
| total_timesteps    | 10463500 |
| value_loss         | 0.000129 |
---------------------------------
---------------------------------
| explained_variance | 0.926    |
| fps                | 857      |
| nupdates           | 2092800  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -0.153   |
| fps                | 857      |
| nupdates           | 2095500  |
| policy_entropy     | 2.05     |
| total_timesteps    | 10477500 |
| value_loss         | 0.0012   |
---------------------------------
---------------------------------
| explained_variance | 0.287    |
| fps                | 857      |
| nupdates           | 2095600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10478000 |
| value_loss         | 0.000208 |
---------------------------------
---------------------------------
| explained_variance | -0.831   |
| fps                | 857      |
| nupdates           | 2095700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10478500 |
| value_loss         | 0.000476 |
---------------------------------
---------------------------------
| explained_variance | 0.985    |
| fps                | 857      |
| nupdates           | 2095800  |
| policy_entropy     | 2.02     |
| total_timest

---------------------------------
| explained_variance | -28.7    |
| fps                | 857      |
| nupdates           | 2098600  |
| policy_entropy     | 2.03     |
| total_timesteps    | 10493000 |
| value_loss         | 0.000659 |
---------------------------------
---------------------------------
| explained_variance | -1.32    |
| fps                | 857      |
| nupdates           | 2098700  |
| policy_entropy     | 2.08     |
| total_timesteps    | 10493500 |
| value_loss         | 7.11e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.903    |
| fps                | 857      |
| nupdates           | 2098800  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10494000 |
| value_loss         | 1.43e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.145   |
| fps                | 857      |
| nupdates           | 2098900  |
| policy_entropy     | 1.67     |
| total_timest

---------------------------------
| explained_variance | -12.5    |
| fps                | 857      |
| nupdates           | 2101600  |
| policy_entropy     | 2.04     |
| total_timesteps    | 10508000 |
| value_loss         | 0.00308  |
---------------------------------
---------------------------------
| explained_variance | 0.941    |
| fps                | 857      |
| nupdates           | 2101700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10508500 |
| value_loss         | 5.32e-06 |
---------------------------------
---------------------------------
| explained_variance | -1.03    |
| fps                | 857      |
| nupdates           | 2101800  |
| policy_entropy     | 2.08     |
| total_timesteps    | 10509000 |
| value_loss         | 2.13e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.56     |
| fps                | 857      |
| nupdates           | 2101900  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.0387   |
| fps                | 857      |
| nupdates           | 2104700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10523500 |
| value_loss         | 2.57e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.788    |
| fps                | 857      |
| nupdates           | 2104800  |
| policy_entropy     | 2.04     |
| total_timesteps    | 10524000 |
| value_loss         | 0.000339 |
---------------------------------
---------------------------------
| explained_variance | 0.886    |
| fps                | 857      |
| nupdates           | 2104900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10524500 |
| value_loss         | 0.000105 |
---------------------------------
Eval num_timesteps=10525000, episode_reward=-5.00 +/- 0.00
Episode length: 643.10 +/- 139.19
---------------------------------
| explained_variance | 0.235    |
| fps                | 

---------------------------------
| explained_variance | 0.967    |
| fps                | 857      |
| nupdates           | 2107700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10538500 |
| value_loss         | 3.16e-06 |
---------------------------------
---------------------------------
| explained_variance | -5.37    |
| fps                | 857      |
| nupdates           | 2107800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10539000 |
| value_loss         | 0.00138  |
---------------------------------
---------------------------------
| explained_variance | 0.87     |
| fps                | 857      |
| nupdates           | 2107900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10539500 |
| value_loss         | 3.28e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.984    |
| fps                | 857      |
| nupdates           | 2108000  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.376    |
| fps                | 857      |
| nupdates           | 2110700  |
| policy_entropy     | 1.93     |
| total_timesteps    | 10553500 |
| value_loss         | 0.0011   |
---------------------------------
---------------------------------
| explained_variance | 0.901    |
| fps                | 857      |
| nupdates           | 2110800  |
| policy_entropy     | 1.97     |
| total_timesteps    | 10554000 |
| value_loss         | 4.42e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.962    |
| fps                | 857      |
| nupdates           | 2110900  |
| policy_entropy     | 2.01     |
| total_timesteps    | 10554500 |
| value_loss         | 1.45e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.62    |
| fps                | 857      |
| nupdates           | 2111000  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -1.32    |
| fps                | 857      |
| nupdates           | 2113800  |
| policy_entropy     | 2.05     |
| total_timesteps    | 10569000 |
| value_loss         | 0.000967 |
---------------------------------
---------------------------------
| explained_variance | 0.994    |
| fps                | 857      |
| nupdates           | 2113900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10569500 |
| value_loss         | 1.1e-06  |
---------------------------------
---------------------------------
| explained_variance | 0.678    |
| fps                | 857      |
| nupdates           | 2114000  |
| policy_entropy     | 2.05     |
| total_timesteps    | 10570000 |
| value_loss         | 4.68e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.34    |
| fps                | 857      |
| nupdates           | 2114100  |
| policy_entropy     | 2.01     |
| total_timest

---------------------------------
| explained_variance | 0.944    |
| fps                | 857      |
| nupdates           | 2116800  |
| policy_entropy     | 2.05     |
| total_timesteps    | 10584000 |
| value_loss         | 1.95e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.951    |
| fps                | 857      |
| nupdates           | 2116900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10584500 |
| value_loss         | 2.72e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.688    |
| fps                | 857      |
| nupdates           | 2117000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10585000 |
| value_loss         | 3.46e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.986    |
| fps                | 857      |
| nupdates           | 2117100  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.772    |
| fps                | 857      |
| nupdates           | 2119900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10599500 |
| value_loss         | 0.000264 |
---------------------------------
Eval num_timesteps=10600000, episode_reward=-4.80 +/- 0.40
Episode length: 551.50 +/- 96.61
---------------------------------
| explained_variance | 0.992    |
| fps                | 857      |
| nupdates           | 2120000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10600000 |
| value_loss         | 1.23e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.739    |
| fps                | 857      |
| nupdates           | 2120100  |
| policy_entropy     | 2.04     |
| total_timesteps    | 10600500 |
| value_loss         | 2.41e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.43     |
| fps                | 8

---------------------------------
| explained_variance | -14      |
| fps                | 857      |
| nupdates           | 2122900  |
| policy_entropy     | 2.03     |
| total_timesteps    | 10614500 |
| value_loss         | 0.00444  |
---------------------------------
---------------------------------
| explained_variance | 0.969    |
| fps                | 857      |
| nupdates           | 2123000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10615000 |
| value_loss         | 4.81e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.846    |
| fps                | 857      |
| nupdates           | 2123100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10615500 |
| value_loss         | 1.59e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.7     |
| fps                | 857      |
| nupdates           | 2123200  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.99     |
| fps                | 857      |
| nupdates           | 2125900  |
| policy_entropy     | 2.05     |
| total_timesteps    | 10629500 |
| value_loss         | 5.13e-07 |
---------------------------------
---------------------------------
| explained_variance | -99.7    |
| fps                | 857      |
| nupdates           | 2126000  |
| policy_entropy     | 2.04     |
| total_timesteps    | 10630000 |
| value_loss         | 0.00819  |
---------------------------------
---------------------------------
| explained_variance | 0.933    |
| fps                | 857      |
| nupdates           | 2126100  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10630500 |
| value_loss         | 1.38e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.995    |
| fps                | 857      |
| nupdates           | 2126200  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -1.25    |
| fps                | 857      |
| nupdates           | 2129000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10645000 |
| value_loss         | 0.000559 |
---------------------------------
---------------------------------
| explained_variance | 0.659    |
| fps                | 857      |
| nupdates           | 2129100  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10645500 |
| value_loss         | 0.000276 |
---------------------------------
---------------------------------
| explained_variance | -84.4    |
| fps                | 857      |
| nupdates           | 2129200  |
| policy_entropy     | 2.05     |
| total_timesteps    | 10646000 |
| value_loss         | 0.0146   |
---------------------------------
---------------------------------
| explained_variance | -1.85    |
| fps                | 857      |
| nupdates           | 2129300  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.117    |
| fps                | 857      |
| nupdates           | 2132000  |
| policy_entropy     | 1.98     |
| total_timesteps    | 10660000 |
| value_loss         | 0.000262 |
---------------------------------
---------------------------------
| explained_variance | -0.701   |
| fps                | 857      |
| nupdates           | 2132100  |
| policy_entropy     | 2.04     |
| total_timesteps    | 10660500 |
| value_loss         | 0.00285  |
---------------------------------
---------------------------------
| explained_variance | 0.542    |
| fps                | 857      |
| nupdates           | 2132200  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10661000 |
| value_loss         | 0.000279 |
---------------------------------
---------------------------------
| explained_variance | 0.594    |
| fps                | 857      |
| nupdates           | 2132300  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.889    |
| fps                | 857      |
| nupdates           | 2135100  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10675500 |
| value_loss         | 2e-05    |
---------------------------------
---------------------------------
| explained_variance | -1.04    |
| fps                | 857      |
| nupdates           | 2135200  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10676000 |
| value_loss         | 3.04e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.565    |
| fps                | 857      |
| nupdates           | 2135300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10676500 |
| value_loss         | 0.000149 |
---------------------------------
---------------------------------
| explained_variance | 0.203    |
| fps                | 857      |
| nupdates           | 2135400  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.632    |
| fps                | 857      |
| nupdates           | 2138200  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10691000 |
| value_loss         | 1.12e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.961    |
| fps                | 857      |
| nupdates           | 2138300  |
| policy_entropy     | 2.08     |
| total_timesteps    | 10691500 |
| value_loss         | 1.04e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.153    |
| fps                | 857      |
| nupdates           | 2138400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10692000 |
| value_loss         | 0.000225 |
---------------------------------
---------------------------------
| explained_variance | 0.811    |
| fps                | 857      |
| nupdates           | 2138500  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.0632  |
| fps                | 857      |
| nupdates           | 2141200  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10706000 |
| value_loss         | 0.000367 |
---------------------------------
---------------------------------
| explained_variance | 0.972    |
| fps                | 857      |
| nupdates           | 2141300  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10706500 |
| value_loss         | 2.63e-05 |
---------------------------------
---------------------------------
| explained_variance | -40.5    |
| fps                | 857      |
| nupdates           | 2141400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10707000 |
| value_loss         | 0.00247  |
---------------------------------
---------------------------------
| explained_variance | -6       |
| fps                | 857      |
| nupdates           | 2141500  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.781    |
| fps                | 857      |
| nupdates           | 2144300  |
| policy_entropy     | 2.08     |
| total_timesteps    | 10721500 |
| value_loss         | 7.86e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.914    |
| fps                | 857      |
| nupdates           | 2144400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10722000 |
| value_loss         | 0.00046  |
---------------------------------
---------------------------------
| explained_variance | -150     |
| fps                | 857      |
| nupdates           | 2144500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10722500 |
| value_loss         | 0.043    |
---------------------------------
---------------------------------
| explained_variance | -34.3    |
| fps                | 857      |
| nupdates           | 2144600  |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | 0.944    |
| fps                | 857      |
| nupdates           | 2147300  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10736500 |
| value_loss         | 3.67e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.32    |
| fps                | 857      |
| nupdates           | 2147400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10737000 |
| value_loss         | 0.000671 |
---------------------------------
---------------------------------
| explained_variance | 0.444    |
| fps                | 857      |
| nupdates           | 2147500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10737500 |
| value_loss         | 4.85e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.313    |
| fps                | 857      |
| nupdates           | 2147600  |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | 0.882    |
| fps                | 857      |
| nupdates           | 2150300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10751500 |
| value_loss         | 0.000105 |
---------------------------------
---------------------------------
| explained_variance | -1.41    |
| fps                | 857      |
| nupdates           | 2150400  |
| policy_entropy     | 2.08     |
| total_timesteps    | 10752000 |
| value_loss         | 0.000492 |
---------------------------------
---------------------------------
| explained_variance | 0.109    |
| fps                | 857      |
| nupdates           | 2150500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10752500 |
| value_loss         | 8.74e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.977    |
| fps                | 857      |
| nupdates           | 2150600  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.957    |
| fps                | 857      |
| nupdates           | 2153400  |
| policy_entropy     | 2.05     |
| total_timesteps    | 10767000 |
| value_loss         | 1.33e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.08    |
| fps                | 857      |
| nupdates           | 2153500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10767500 |
| value_loss         | 0.00273  |
---------------------------------
---------------------------------
| explained_variance | 0.869    |
| fps                | 857      |
| nupdates           | 2153600  |
| policy_entropy     | 2        |
| total_timesteps    | 10768000 |
| value_loss         | 7.55e-05 |
---------------------------------
---------------------------------
| explained_variance | -10.7    |
| fps                | 857      |
| nupdates           | 2153700  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.366    |
| fps                | 857      |
| nupdates           | 2156400  |
| policy_entropy     | 2.08     |
| total_timesteps    | 10782000 |
| value_loss         | 0.00035  |
---------------------------------
---------------------------------
| explained_variance | 0.868    |
| fps                | 857      |
| nupdates           | 2156500  |
| policy_entropy     | 2.08     |
| total_timesteps    | 10782500 |
| value_loss         | 2.44e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.192    |
| fps                | 857      |
| nupdates           | 2156600  |
| policy_entropy     | 1.93     |
| total_timesteps    | 10783000 |
| value_loss         | 0.000182 |
---------------------------------
---------------------------------
| explained_variance | 0.242    |
| fps                | 857      |
| nupdates           | 2156700  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.901    |
| fps                | 858      |
| nupdates           | 2159500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10797500 |
| value_loss         | 4.88e-06 |
---------------------------------
---------------------------------
| explained_variance | -0.245   |
| fps                | 858      |
| nupdates           | 2159600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10798000 |
| value_loss         | 1.14e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.929    |
| fps                | 858      |
| nupdates           | 2159700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10798500 |
| value_loss         | 6.1e-06  |
---------------------------------
---------------------------------
| explained_variance | -36.4    |
| fps                | 858      |
| nupdates           | 2159800  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.781    |
| fps                | 858      |
| nupdates           | 2162500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10812500 |
| value_loss         | 4.2e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.808    |
| fps                | 858      |
| nupdates           | 2162600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10813000 |
| value_loss         | 9.71e-06 |
---------------------------------
---------------------------------
| explained_variance | -1.06    |
| fps                | 858      |
| nupdates           | 2162700  |
| policy_entropy     | 2.08     |
| total_timesteps    | 10813500 |
| value_loss         | 0.000125 |
---------------------------------
---------------------------------
| explained_variance | 0.981    |
| fps                | 858      |
| nupdates           | 2162800  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.902    |
| fps                | 858      |
| nupdates           | 2165500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10827500 |
| value_loss         | 1.48e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.756    |
| fps                | 858      |
| nupdates           | 2165600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10828000 |
| value_loss         | 0.000142 |
---------------------------------
---------------------------------
| explained_variance | -0.0661  |
| fps                | 858      |
| nupdates           | 2165700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10828500 |
| value_loss         | 0.000249 |
---------------------------------
---------------------------------
| explained_variance | -0.762   |
| fps                | 858      |
| nupdates           | 2165800  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.212   |
| fps                | 858      |
| nupdates           | 2168600  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10843000 |
| value_loss         | 6.45e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.472    |
| fps                | 858      |
| nupdates           | 2168700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10843500 |
| value_loss         | 0.00116  |
---------------------------------
---------------------------------
| explained_variance | -0.223   |
| fps                | 858      |
| nupdates           | 2168800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10844000 |
| value_loss         | 0.000295 |
---------------------------------
---------------------------------
| explained_variance | 0.929    |
| fps                | 858      |
| nupdates           | 2168900  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -3.77    |
| fps                | 858      |
| nupdates           | 2171600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10858000 |
| value_loss         | 0.00236  |
---------------------------------
---------------------------------
| explained_variance | -0.257   |
| fps                | 858      |
| nupdates           | 2171700  |
| policy_entropy     | 2.08     |
| total_timesteps    | 10858500 |
| value_loss         | 0.000128 |
---------------------------------
---------------------------------
| explained_variance | 0.186    |
| fps                | 858      |
| nupdates           | 2171800  |
| policy_entropy     | 2.08     |
| total_timesteps    | 10859000 |
| value_loss         | 0.000135 |
---------------------------------
---------------------------------
| explained_variance | 0.926    |
| fps                | 858      |
| nupdates           | 2171900  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -0.09    |
| fps                | 858      |
| nupdates           | 2174700  |
| policy_entropy     | 2.08     |
| total_timesteps    | 10873500 |
| value_loss         | 0.000248 |
---------------------------------
---------------------------------
| explained_variance | 0.979    |
| fps                | 858      |
| nupdates           | 2174800  |
| policy_entropy     | 2.08     |
| total_timesteps    | 10874000 |
| value_loss         | 6.72e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.923    |
| fps                | 858      |
| nupdates           | 2174900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10874500 |
| value_loss         | 3.84e-05 |
---------------------------------
Eval num_timesteps=10875000, episode_reward=-4.90 +/- 0.30
Episode length: 612.10 +/- 113.04
---------------------------------
| explained_variance | -0.18    |
| fps                | 

---------------------------------
| explained_variance | 0.484    |
| fps                | 858      |
| nupdates           | 2177700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10888500 |
| value_loss         | 0.000394 |
---------------------------------
---------------------------------
| explained_variance | 0.812    |
| fps                | 858      |
| nupdates           | 2177800  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10889000 |
| value_loss         | 0.000426 |
---------------------------------
---------------------------------
| explained_variance | -0.155   |
| fps                | 858      |
| nupdates           | 2177900  |
| policy_entropy     | 2.05     |
| total_timesteps    | 10889500 |
| value_loss         | 0.000103 |
---------------------------------
---------------------------------
| explained_variance | -0.816   |
| fps                | 859      |
| nupdates           | 2178000  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.639    |
| fps                | 858      |
| nupdates           | 2180700  |
| policy_entropy     | 2.05     |
| total_timesteps    | 10903500 |
| value_loss         | 0.00031  |
---------------------------------
---------------------------------
| explained_variance | 0.66     |
| fps                | 859      |
| nupdates           | 2180800  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10904000 |
| value_loss         | 2.83e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.346   |
| fps                | 859      |
| nupdates           | 2180900  |
| policy_entropy     | 1.79     |
| total_timesteps    | 10904500 |
| value_loss         | 0.00399  |
---------------------------------
---------------------------------
| explained_variance | 0.695    |
| fps                | 859      |
| nupdates           | 2181000  |
| policy_entropy     | 2.02     |
| total_timest

---------------------------------
| explained_variance | 0.956    |
| fps                | 859      |
| nupdates           | 2183800  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10919000 |
| value_loss         | 9.21e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.751    |
| fps                | 859      |
| nupdates           | 2183900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10919500 |
| value_loss         | 1.54e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.897    |
| fps                | 859      |
| nupdates           | 2184000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10920000 |
| value_loss         | 2.82e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.992    |
| fps                | 859      |
| nupdates           | 2184100  |
| policy_entropy     | 1.76     |
| total_timest

---------------------------------
| explained_variance | 0.992    |
| fps                | 859      |
| nupdates           | 2186800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10934000 |
| value_loss         | 9.52e-07 |
---------------------------------
---------------------------------
| explained_variance | 0.996    |
| fps                | 859      |
| nupdates           | 2186900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10934500 |
| value_loss         | 6.28e-07 |
---------------------------------
---------------------------------
| explained_variance | 0.93     |
| fps                | 859      |
| nupdates           | 2187000  |
| policy_entropy     | 2.05     |
| total_timesteps    | 10935000 |
| value_loss         | 1.11e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.606   |
| fps                | 859      |
| nupdates           | 2187100  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.943    |
| fps                | 859      |
| nupdates           | 2189900  |
| policy_entropy     | 2        |
| total_timesteps    | 10949500 |
| value_loss         | 1.18e-05 |
---------------------------------
Eval num_timesteps=10950000, episode_reward=-4.80 +/- 0.40
Episode length: 545.50 +/- 62.70
---------------------------------
| explained_variance | -0.979   |
| fps                | 859      |
| nupdates           | 2190000  |
| policy_entropy     | 2.01     |
| total_timesteps    | 10950000 |
| value_loss         | 0.000334 |
---------------------------------
---------------------------------
| explained_variance | -1.76    |
| fps                | 859      |
| nupdates           | 2190100  |
| policy_entropy     | 1.98     |
| total_timesteps    | 10950500 |
| value_loss         | 0.000275 |
---------------------------------
---------------------------------
| explained_variance | 0.937    |
| fps                | 8

---------------------------------
| explained_variance | 0.861    |
| fps                | 859      |
| nupdates           | 2192900  |
| policy_entropy     | 2.04     |
| total_timesteps    | 10964500 |
| value_loss         | 7.41e-05 |
---------------------------------
---------------------------------
| explained_variance | -3.02    |
| fps                | 859      |
| nupdates           | 2193000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10965000 |
| value_loss         | 0.000155 |
---------------------------------
---------------------------------
| explained_variance | -126     |
| fps                | 859      |
| nupdates           | 2193100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10965500 |
| value_loss         | 0.0251   |
---------------------------------
---------------------------------
| explained_variance | -7.21    |
| fps                | 859      |
| nupdates           | 2193200  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -50      |
| fps                | 859      |
| nupdates           | 2195900  |
| policy_entropy     | 2.05     |
| total_timesteps    | 10979500 |
| value_loss         | 0.011    |
---------------------------------
---------------------------------
| explained_variance | 0.721    |
| fps                | 859      |
| nupdates           | 2196000  |
| policy_entropy     | 2.08     |
| total_timesteps    | 10980000 |
| value_loss         | 3.14e-05 |
---------------------------------
---------------------------------
| explained_variance | -3.03    |
| fps                | 859      |
| nupdates           | 2196100  |
| policy_entropy     | 2.04     |
| total_timesteps    | 10980500 |
| value_loss         | 0.00185  |
---------------------------------
---------------------------------
| explained_variance | 0.663    |
| fps                | 859      |
| nupdates           | 2196200  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.953    |
| fps                | 859      |
| nupdates           | 2199000  |
| policy_entropy     | 2.08     |
| total_timesteps    | 10995000 |
| value_loss         | 3.79e-06 |
---------------------------------
---------------------------------
| explained_variance | -1.16    |
| fps                | 859      |
| nupdates           | 2199100  |
| policy_entropy     | 2.06     |
| total_timesteps    | 10995500 |
| value_loss         | 0.000449 |
---------------------------------
---------------------------------
| explained_variance | 0.781    |
| fps                | 859      |
| nupdates           | 2199200  |
| policy_entropy     | 2.07     |
| total_timesteps    | 10996000 |
| value_loss         | 2.99e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.24    |
| fps                | 859      |
| nupdates           | 2199300  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -1.27    |
| fps                | 859      |
| nupdates           | 2202000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 11010000 |
| value_loss         | 7.12e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.998    |
| fps                | 859      |
| nupdates           | 2202100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 11010500 |
| value_loss         | 8.62e-07 |
---------------------------------
---------------------------------
| explained_variance | -2.02    |
| fps                | 859      |
| nupdates           | 2202200  |
| policy_entropy     | 2        |
| total_timesteps    | 11011000 |
| value_loss         | 0.00659  |
---------------------------------
---------------------------------
| explained_variance | 0.99     |
| fps                | 859      |
| nupdates           | 2202300  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.984    |
| fps                | 859      |
| nupdates           | 2205100  |
| policy_entropy     | 2.03     |
| total_timesteps    | 11025500 |
| value_loss         | 9.5e-06  |
---------------------------------
----------------------------------
| explained_variance | -5.16e+03 |
| fps                | 859       |
| nupdates           | 2205200   |
| policy_entropy     | 2         |
| total_timesteps    | 11026000  |
| value_loss         | 0.275     |
----------------------------------
---------------------------------
| explained_variance | -91      |
| fps                | 859      |
| nupdates           | 2205300  |
| policy_entropy     | 2.06     |
| total_timesteps    | 11026500 |
| value_loss         | 0.0115   |
---------------------------------
---------------------------------
| explained_variance | 0.632    |
| fps                | 859      |
| nupdates           | 2205400  |
| policy_entropy     | 1.97     |
| tota

---------------------------------
| explained_variance | 0.887    |
| fps                | 859      |
| nupdates           | 2208200  |
| policy_entropy     | 2.06     |
| total_timesteps    | 11041000 |
| value_loss         | 2.02e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.0431   |
| fps                | 859      |
| nupdates           | 2208300  |
| policy_entropy     | 2.08     |
| total_timesteps    | 11041500 |
| value_loss         | 0.000176 |
---------------------------------
---------------------------------
| explained_variance | 0.855    |
| fps                | 859      |
| nupdates           | 2208400  |
| policy_entropy     | 2.08     |
| total_timesteps    | 11042000 |
| value_loss         | 0.000167 |
---------------------------------
---------------------------------
| explained_variance | -1.56    |
| fps                | 859      |
| nupdates           | 2208500  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.963    |
| fps                | 859      |
| nupdates           | 2211200  |
| policy_entropy     | 2.06     |
| total_timesteps    | 11056000 |
| value_loss         | 5.07e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.65     |
| fps                | 859      |
| nupdates           | 2211300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 11056500 |
| value_loss         | 0.000125 |
---------------------------------
---------------------------------
| explained_variance | -154     |
| fps                | 859      |
| nupdates           | 2211400  |
| policy_entropy     | 2.05     |
| total_timesteps    | 11057000 |
| value_loss         | 0.0196   |
---------------------------------
---------------------------------
| explained_variance | -0.476   |
| fps                | 859      |
| nupdates           | 2211500  |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | -10.2    |
| fps                | 860      |
| nupdates           | 2214300  |
| policy_entropy     | 2.06     |
| total_timesteps    | 11071500 |
| value_loss         | 0.000203 |
---------------------------------
---------------------------------
| explained_variance | 0.865    |
| fps                | 860      |
| nupdates           | 2214400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 11072000 |
| value_loss         | 4.61e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.339    |
| fps                | 860      |
| nupdates           | 2214500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 11072500 |
| value_loss         | 6.28e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.2     |
| fps                | 860      |
| nupdates           | 2214600  |
| policy_entropy     | 1.86     |
| total_timest

In [21]:
# Record the trained A2C agent playing SlimeVolley and embed the clip below.
video_filename = 'a2c.mp4'

# Keep a handle on the environment so it can be closed afterwards; creating it
# inline in the call left the env (and anything its renderer opened) dangling
# in the kernel after every run of this cell.
a2c_eval_env = gym.make("SlimeVolley-v0")
try:
    record_game(
        model=trained_model['a2c'],
        env=a2c_eval_env,
        num_episodes=5,
        video_filename=video_filename
    )
finally:
    # Release the env even if recording fails part-way through.
    a2c_eval_env.close()

# Last expression of the cell: returns the HTML video tag so it renders inline.
embed_mp4(video_filename)



score: -5
score: -5
score: -5
score: -5
score: -5


In [None]:
# Run the experiment for the 'acer' entry of the `algo` registry (ACER).
# NOTE(review): `experiment` is defined in an earlier cell not visible here;
# presumably it trains the model and stores it in `trained_model` — confirm.
experiment('acer')