# Iterating over Stable-Baselines algorithms on SlimeVolley

Algorithms (known restrictions in parentheses):
* A2C (no replay memory)
* ACER (no multibinary)
* ACKTR
* DDPG (continuous only)
* DQN (discrete action space only)
* HER (method wrapper for off-policy methods)
* GAIL (no multibinary)
* PPO
* SAC (continuous only)
* TD3 (continuous only)
* TRPO

In [1]:
import base64
import IPython
import imageio

def embed_mp4(filename):
    """Return an inline HTML5 video player for an mp4 file.

    The whole file is read into memory, base64-encoded and embedded as a
    ``data:`` URI inside a ``<video>`` tag.

    Args:
        filename: Path of the mp4 file to embed.

    Returns:
        The object produced by ``IPython.display.HTML`` for the video tag.
    """
    # Read through a context manager so the handle is closed right away
    # instead of being left for the garbage collector.
    with open(filename, 'rb') as video_file:
        video = video_file.read()
    b64 = base64.b64encode(video)
    tag = '''
    <video width="640" height="480" controls>
    <source src="data:video/mp4;base64,{0}" type="video/mp4">
    Your browser does not support the video tag.
    </video>'''.format(b64.decode())

    return IPython.display.HTML(tag)

def record_game(model, env, num_episodes=5, video_filename='video.mp4'):
    """Play episodes with ``model`` in ``env`` and write the frames to a video.

    One frame is captured right after each reset and one after every step,
    all appended to a single 60 fps video file. The summed reward of each
    episode is printed when that episode ends.

    Args:
        model: Object whose ``predict(obs)`` returns an ``(action, state)`` pair.
        env: Environment providing ``reset()``, ``step(action)`` and
            ``render('rgb_array')``.
        num_episodes: Number of episodes to play.
        video_filename: Path of the video file to write.
    """
    with imageio.get_writer(video_filename, fps=60) as writer:

        def capture_frame():
            # Render the current state as an RGB array and append it to the video.
            writer.append_data(env.render('rgb_array'))

        for _episode in range(num_episodes):
            observation = env.reset()
            total_reward = 0
            capture_frame()

            # An episode always takes at least one step; stop once the
            # environment reports that it is done.
            while True:
                action, _state = model.predict(observation)
                observation, step_reward, finished, _info = env.step(action)
                total_reward += step_reward
                capture_frame()
                if finished:
                    break

            print("score:", total_reward)

In [2]:
import os
import gym
import slimevolleygym
from slimevolleygym import SurvivalRewardEnv

from stable_baselines.common.policies import MlpPolicy
from stable_baselines import logger
from stable_baselines.common.callbacks import EvalCallback

from stable_baselines.ppo1 import PPO1
from stable_baselines import A2C, ACER, ACKTR, DQN, HER, GAIL, TRPO

# Registry mapping the short name accepted by experiment() to the
# stable-baselines algorithm class it should instantiate.
# NOTE(review): experiment() builds every entry as cls(MlpPolicy, env, ...);
# DQN, HER and GAIL may need different constructor arguments — confirm
# before running them through experiment().
algo = {
    'a2c': A2C,
    'acer': ACER,
    'acktr': ACKTR,
    'dqn': DQN,
    'her': HER,
    'gail': GAIL,
    'ppo': PPO1,  # PPO1 is imported above but was missing from the registry
    'trpo': TRPO,
}
# Models created by experiment(), keyed by algorithm name; kept at module
# level so later cells can reach them.
trained_model = {}

The TensorFlow contrib module will not be included in TensorFlow 2.0.
For more information, please see:
  * https://github.com/tensorflow/community/blob/master/rfcs/20180907-contrib-sunset.md
  * https://github.com/tensorflow/addons
  * https://github.com/tensorflow/io (for I/O related ops)
If you depend on functionality not listed there, please file an issue.



In [8]:
def experiment(model_str, timesteps=15_000_000):
    """Train one registered algorithm on SlimeVolley-v0 with periodic evaluation.

    Logs go to the folder ``"sb-" + model_str``. The model is stored in the
    module-level ``trained_model`` dict as soon as it is created, evaluated
    every ``EVAL_FREQ`` callback steps on a separate evaluation environment,
    and saved as ``final_model`` in the log folder once training completes.

    Args:
        model_str: Key into the module-level ``algo`` registry (e.g. ``'a2c'``).
        timesteps: Total number of training timesteps; converted with ``int()``.

    Raises:
        KeyError: If ``model_str`` is not a key of ``algo``.
    """
    NUM_TIMESTEPS = int(timesteps)
    SEED = 721
    EVAL_FREQ = 25000
    EVAL_EPISODES = 10  # was 1000
    LOGDIR = "sb-" + model_str

    # Reject unknown names before creating the log folder or any environment.
    if model_str not in algo:
        raise KeyError(
            f"unknown algorithm {model_str!r}; expected one of {sorted(algo)}"
        )

    logger.configure(folder=LOGDIR)
    env = gym.make("SlimeVolley-v0")
    eval_env = None
    try:
        env.seed(SEED)

        # Evaluate on a dedicated environment: running evaluation episodes on
        # the training env would reset and step it in the middle of a rollout.
        eval_env = gym.make("SlimeVolley-v0")
        eval_env.seed(SEED)

        # Seed the model as well as the env so SEED covers the learner too.
        model = algo[model_str](MlpPolicy, env, verbose=2, seed=SEED)
        trained_model[model_str] = model
        eval_callback = EvalCallback(
            eval_env,
            best_model_save_path=LOGDIR,
            log_path=LOGDIR,
            eval_freq=EVAL_FREQ,
            n_eval_episodes=EVAL_EPISODES,
        )
        model.learn(total_timesteps=NUM_TIMESTEPS, callback=eval_callback)
        model.save(os.path.join(LOGDIR, "final_model")) # probably never get to this point.
    finally:
        # Release both environments even when training fails or is interrupted.
        if eval_env is not None:
            eval_env.close()
        env.close()

In [9]:
# Train A2C with experiment()'s default budget of 15,000,000 timesteps.
experiment('a2c')

Logging to sb-a2c
Wrapping the env in a DummyVecEnv.
----------------------------------
| explained_variance | -5.23e+03 |
| fps                | 33        |
| nupdates           | 1         |
| policy_entropy     | 2.08      |
| total_timesteps    | 5         |
| value_loss         | 0.107     |
----------------------------------
---------------------------------
| explained_variance | -246     |
| fps                | 767      |
| nupdates           | 100      |
| policy_entropy     | 2.08     |
| total_timesteps    | 500      |
| value_loss         | 0.000801 |
---------------------------------
---------------------------------
| explained_variance | -4.9e+03 |
| fps                | 881      |
| nupdates           | 200      |
| policy_entropy     | 2.08     |
| total_timesteps    | 1000     |
| value_loss         | 0.0119   |
---------------------------------
---------------------------------
| explained_variance | -5.79    |
| fps                | 930      |
| nupdates           

---------------------------------
| explained_variance | -12      |
| fps                | 1013     |
| nupdates           | 3000     |
| policy_entropy     | 2.01     |
| total_timesteps    | 15000    |
| value_loss         | 0.000368 |
---------------------------------
---------------------------------
| explained_variance | 0.487    |
| fps                | 1013     |
| nupdates           | 3100     |
| policy_entropy     | 2.05     |
| total_timesteps    | 15500    |
| value_loss         | 0.00196  |
---------------------------------
---------------------------------
| explained_variance | -5.68    |
| fps                | 1012     |
| nupdates           | 3200     |
| policy_entropy     | 2.02     |
| total_timesteps    | 16000    |
| value_loss         | 0.000413 |
---------------------------------
---------------------------------
| explained_variance | -910     |
| fps                | 1012     |
| nupdates           | 3300     |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -3.96    |
| fps                | 919      |
| nupdates           | 6000     |
| policy_entropy     | 2.06     |
| total_timesteps    | 30000    |
| value_loss         | 0.000334 |
---------------------------------
---------------------------------
| explained_variance | 0.977    |
| fps                | 920      |
| nupdates           | 6100     |
| policy_entropy     | 2        |
| total_timesteps    | 30500    |
| value_loss         | 8.73e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.744    |
| fps                | 922      |
| nupdates           | 6200     |
| policy_entropy     | 2.07     |
| total_timesteps    | 31000    |
| value_loss         | 2.59e-05 |
---------------------------------
---------------------------------
| explained_variance | -77.4    |
| fps                | 924      |
| nupdates           | 6300     |
| policy_entropy     | 2.02     |
| total_timest

---------------------------------
| explained_variance | -1.38    |
| fps                | 959      |
| nupdates           | 9100     |
| policy_entropy     | 2.07     |
| total_timesteps    | 45500    |
| value_loss         | 0.00128  |
---------------------------------
---------------------------------
| explained_variance | -3.57    |
| fps                | 960      |
| nupdates           | 9200     |
| policy_entropy     | 2.07     |
| total_timesteps    | 46000    |
| value_loss         | 0.0013   |
---------------------------------
---------------------------------
| explained_variance | -19.5    |
| fps                | 960      |
| nupdates           | 9300     |
| policy_entropy     | 2.05     |
| total_timesteps    | 46500    |
| value_loss         | 0.000282 |
---------------------------------
---------------------------------
| explained_variance | -24.8    |
| fps                | 959      |
| nupdates           | 9400     |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -0.16    |
| fps                | 926      |
| nupdates           | 12100    |
| policy_entropy     | 2.07     |
| total_timesteps    | 60500    |
| value_loss         | 0.00135  |
---------------------------------
---------------------------------
| explained_variance | -24.6    |
| fps                | 927      |
| nupdates           | 12200    |
| policy_entropy     | 2.05     |
| total_timesteps    | 61000    |
| value_loss         | 0.00143  |
---------------------------------
---------------------------------
| explained_variance | -371     |
| fps                | 928      |
| nupdates           | 12300    |
| policy_entropy     | 2.07     |
| total_timesteps    | 61500    |
| value_loss         | 0.0631   |
---------------------------------
---------------------------------
| explained_variance | -0.183   |
| fps                | 929      |
| nupdates           | 12400    |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -2.6     |
| fps                | 906      |
| nupdates           | 15100    |
| policy_entropy     | 2.05     |
| total_timesteps    | 75500    |
| value_loss         | 0.000275 |
---------------------------------
---------------------------------
| explained_variance | -14.6    |
| fps                | 907      |
| nupdates           | 15200    |
| policy_entropy     | 2.07     |
| total_timesteps    | 76000    |
| value_loss         | 0.00079  |
---------------------------------
---------------------------------
| explained_variance | -2.16    |
| fps                | 908      |
| nupdates           | 15300    |
| policy_entropy     | 2.06     |
| total_timesteps    | 76500    |
| value_loss         | 0.00339  |
---------------------------------
---------------------------------
| explained_variance | 0.597    |
| fps                | 909      |
| nupdates           | 15400    |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -2.1     |
| fps                | 930      |
| nupdates           | 18200    |
| policy_entropy     | 2.06     |
| total_timesteps    | 91000    |
| value_loss         | 9.14e-05 |
---------------------------------
----------------------------------
| explained_variance | -2.79e+03 |
| fps                | 930       |
| nupdates           | 18300     |
| policy_entropy     | 2.05      |
| total_timesteps    | 91500     |
| value_loss         | 0.15      |
----------------------------------
---------------------------------
| explained_variance | 0.842    |
| fps                | 931      |
| nupdates           | 18400    |
| policy_entropy     | 2.04     |
| total_timesteps    | 92000    |
| value_loss         | 0.000227 |
---------------------------------
---------------------------------
| explained_variance | 0.708    |
| fps                | 932      |
| nupdates           | 18500    |
| policy_entropy     | 2.06     |
| tota

---------------------------------
| explained_variance | -102     |
| fps                | 917      |
| nupdates           | 21200    |
| policy_entropy     | 2.05     |
| total_timesteps    | 106000   |
| value_loss         | 0.0238   |
---------------------------------
---------------------------------
| explained_variance | -2.23    |
| fps                | 917      |
| nupdates           | 21300    |
| policy_entropy     | 2.08     |
| total_timesteps    | 106500   |
| value_loss         | 0.00012  |
---------------------------------
---------------------------------
| explained_variance | -2.99    |
| fps                | 918      |
| nupdates           | 21400    |
| policy_entropy     | 2.06     |
| total_timesteps    | 107000   |
| value_loss         | 0.000162 |
---------------------------------
---------------------------------
| explained_variance | 0.0693   |
| fps                | 919      |
| nupdates           | 21500    |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -11.8    |
| fps                | 932      |
| nupdates           | 24300    |
| policy_entropy     | 2.05     |
| total_timesteps    | 121500   |
| value_loss         | 0.000675 |
---------------------------------
---------------------------------
| explained_variance | -1.41    |
| fps                | 933      |
| nupdates           | 24400    |
| policy_entropy     | 2.08     |
| total_timesteps    | 122000   |
| value_loss         | 0.00102  |
---------------------------------
---------------------------------
| explained_variance | -2.21    |
| fps                | 933      |
| nupdates           | 24500    |
| policy_entropy     | 2.06     |
| total_timesteps    | 122500   |
| value_loss         | 0.00017  |
---------------------------------
---------------------------------
| explained_variance | -2.72    |
| fps                | 933      |
| nupdates           | 24600    |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.365    |
| fps                | 925      |
| nupdates           | 27300    |
| policy_entropy     | 2.01     |
| total_timesteps    | 136500   |
| value_loss         | 0.0994   |
---------------------------------
---------------------------------
| explained_variance | -1.67    |
| fps                | 925      |
| nupdates           | 27400    |
| policy_entropy     | 2.07     |
| total_timesteps    | 137000   |
| value_loss         | 0.000825 |
---------------------------------
---------------------------------
| explained_variance | 0.919    |
| fps                | 925      |
| nupdates           | 27500    |
| policy_entropy     | 2.06     |
| total_timesteps    | 137500   |
| value_loss         | 5.87e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.613    |
| fps                | 926      |
| nupdates           | 27600    |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -1.74    |
| fps                | 919      |
| nupdates           | 30300    |
| policy_entropy     | 2.07     |
| total_timesteps    | 151500   |
| value_loss         | 0.00117  |
---------------------------------
---------------------------------
| explained_variance | -0.127   |
| fps                | 919      |
| nupdates           | 30400    |
| policy_entropy     | 2.05     |
| total_timesteps    | 152000   |
| value_loss         | 0.00037  |
---------------------------------
---------------------------------
| explained_variance | 0.427    |
| fps                | 920      |
| nupdates           | 30500    |
| policy_entropy     | 2.06     |
| total_timesteps    | 152500   |
| value_loss         | 0.137    |
---------------------------------
---------------------------------
| explained_variance | 0.806    |
| fps                | 920      |
| nupdates           | 30600    |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.213    |
| fps                | 931      |
| nupdates           | 33400    |
| policy_entropy     | 2.03     |
| total_timesteps    | 167000   |
| value_loss         | 0.000471 |
---------------------------------
---------------------------------
| explained_variance | -44.4    |
| fps                | 931      |
| nupdates           | 33500    |
| policy_entropy     | 2.03     |
| total_timesteps    | 167500   |
| value_loss         | 0.000398 |
---------------------------------
---------------------------------
| explained_variance | 0.895    |
| fps                | 932      |
| nupdates           | 33600    |
| policy_entropy     | 2.05     |
| total_timesteps    | 168000   |
| value_loss         | 0.000106 |
---------------------------------
---------------------------------
| explained_variance | -27.9    |
| fps                | 932      |
| nupdates           | 33700    |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.454    |
| fps                | 924      |
| nupdates           | 36400    |
| policy_entropy     | 2.05     |
| total_timesteps    | 182000   |
| value_loss         | 0.000376 |
---------------------------------
---------------------------------
| explained_variance | -2.81    |
| fps                | 924      |
| nupdates           | 36500    |
| policy_entropy     | 2.07     |
| total_timesteps    | 182500   |
| value_loss         | 0.000693 |
---------------------------------
---------------------------------
| explained_variance | 0.581    |
| fps                | 925      |
| nupdates           | 36600    |
| policy_entropy     | 2.05     |
| total_timesteps    | 183000   |
| value_loss         | 4.67e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.08    |
| fps                | 925      |
| nupdates           | 36700    |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -1.6     |
| fps                | 932      |
| nupdates           | 39500    |
| policy_entropy     | 2.04     |
| total_timesteps    | 197500   |
| value_loss         | 0.000267 |
---------------------------------
---------------------------------
| explained_variance | 0.592    |
| fps                | 933      |
| nupdates           | 39600    |
| policy_entropy     | 2.06     |
| total_timesteps    | 198000   |
| value_loss         | 0.000262 |
---------------------------------
---------------------------------
| explained_variance | 0.777    |
| fps                | 933      |
| nupdates           | 39700    |
| policy_entropy     | 2.01     |
| total_timesteps    | 198500   |
| value_loss         | 3.13e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.702    |
| fps                | 933      |
| nupdates           | 39800    |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -0.504   |
| fps                | 925      |
| nupdates           | 42500    |
| policy_entropy     | 2.06     |
| total_timesteps    | 212500   |
| value_loss         | 0.000888 |
---------------------------------
---------------------------------
| explained_variance | -4.35    |
| fps                | 925      |
| nupdates           | 42600    |
| policy_entropy     | 2.06     |
| total_timesteps    | 213000   |
| value_loss         | 0.002    |
---------------------------------
---------------------------------
| explained_variance | 0.379    |
| fps                | 925      |
| nupdates           | 42700    |
| policy_entropy     | 2.06     |
| total_timesteps    | 213500   |
| value_loss         | 0.000107 |
---------------------------------
---------------------------------
| explained_variance | -1.27    |
| fps                | 925      |
| nupdates           | 42800    |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -2.57    |
| fps                | 920      |
| nupdates           | 45500    |
| policy_entropy     | 2.07     |
| total_timesteps    | 227500   |
| value_loss         | 0.000511 |
---------------------------------
---------------------------------
| explained_variance | -11.5    |
| fps                | 920      |
| nupdates           | 45600    |
| policy_entropy     | 2.06     |
| total_timesteps    | 228000   |
| value_loss         | 0.000448 |
---------------------------------
---------------------------------
| explained_variance | -0.524   |
| fps                | 920      |
| nupdates           | 45700    |
| policy_entropy     | 2.06     |
| total_timesteps    | 228500   |
| value_loss         | 0.000425 |
---------------------------------
---------------------------------
| explained_variance | -0.467   |
| fps                | 920      |
| nupdates           | 45800    |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -2.48    |
| fps                | 927      |
| nupdates           | 48600    |
| policy_entropy     | 2.05     |
| total_timesteps    | 243000   |
| value_loss         | 0.000225 |
---------------------------------
---------------------------------
| explained_variance | 0.131    |
| fps                | 928      |
| nupdates           | 48700    |
| policy_entropy     | 2.06     |
| total_timesteps    | 243500   |
| value_loss         | 0.000393 |
---------------------------------
---------------------------------
| explained_variance | 0.201    |
| fps                | 928      |
| nupdates           | 48800    |
| policy_entropy     | 2.06     |
| total_timesteps    | 244000   |
| value_loss         | 0.000777 |
---------------------------------
---------------------------------
| explained_variance | -0.838   |
| fps                | 928      |
| nupdates           | 48900    |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.0581   |
| fps                | 924      |
| nupdates           | 51600    |
| policy_entropy     | 2.01     |
| total_timesteps    | 258000   |
| value_loss         | 0.000165 |
---------------------------------
---------------------------------
| explained_variance | 0.774    |
| fps                | 924      |
| nupdates           | 51700    |
| policy_entropy     | 2.04     |
| total_timesteps    | 258500   |
| value_loss         | 0.000242 |
---------------------------------
---------------------------------
| explained_variance | -0.326   |
| fps                | 924      |
| nupdates           | 51800    |
| policy_entropy     | 2.07     |
| total_timesteps    | 259000   |
| value_loss         | 0.000393 |
---------------------------------
---------------------------------
| explained_variance | -0.835   |
| fps                | 924      |
| nupdates           | 51900    |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.464    |
| fps                | 930      |
| nupdates           | 54700    |
| policy_entropy     | 2.06     |
| total_timesteps    | 273500   |
| value_loss         | 0.000244 |
---------------------------------
----------------------------------
| explained_variance | -1.28e+04 |
| fps                | 930       |
| nupdates           | 54800     |
| policy_entropy     | 2.07      |
| total_timesteps    | 274000    |
| value_loss         | 0.146     |
----------------------------------
---------------------------------
| explained_variance | 0.997    |
| fps                | 930      |
| nupdates           | 54900    |
| policy_entropy     | 2.06     |
| total_timesteps    | 274500   |
| value_loss         | 0.000122 |
---------------------------------
Eval num_timesteps=275000, episode_reward=-4.70 +/- 0.46
Episode length: 564.20 +/- 80.02
---------------------------------
| explained_variance | -16.8    |
| fps             

---------------------------------
| explained_variance | 0.849    |
| fps                | 925      |
| nupdates           | 57700    |
| policy_entropy     | 2.02     |
| total_timesteps    | 288500   |
| value_loss         | 0.000467 |
---------------------------------
---------------------------------
| explained_variance | 0.077    |
| fps                | 925      |
| nupdates           | 57800    |
| policy_entropy     | 2        |
| total_timesteps    | 289000   |
| value_loss         | 0.000703 |
---------------------------------
---------------------------------
| explained_variance | -3.25    |
| fps                | 925      |
| nupdates           | 57900    |
| policy_entropy     | 2.07     |
| total_timesteps    | 289500   |
| value_loss         | 8.88e-05 |
---------------------------------
---------------------------------
| explained_variance | -84.9    |
| fps                | 925      |
| nupdates           | 58000    |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.683    |
| fps                | 921      |
| nupdates           | 60700    |
| policy_entropy     | 2.06     |
| total_timesteps    | 303500   |
| value_loss         | 2.7e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.0626   |
| fps                | 921      |
| nupdates           | 60800    |
| policy_entropy     | 2.06     |
| total_timesteps    | 304000   |
| value_loss         | 4.64e-05 |
---------------------------------
---------------------------------
| explained_variance | -3.04    |
| fps                | 922      |
| nupdates           | 60900    |
| policy_entropy     | 2.05     |
| total_timesteps    | 304500   |
| value_loss         | 0.000892 |
---------------------------------
---------------------------------
| explained_variance | -12      |
| fps                | 922      |
| nupdates           | 61000    |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.0609   |
| fps                | 927      |
| nupdates           | 63800    |
| policy_entropy     | 2.07     |
| total_timesteps    | 319000   |
| value_loss         | 0.000254 |
---------------------------------
---------------------------------
| explained_variance | -1.98    |
| fps                | 927      |
| nupdates           | 63900    |
| policy_entropy     | 2.07     |
| total_timesteps    | 319500   |
| value_loss         | 0.000549 |
---------------------------------
---------------------------------
| explained_variance | -0.457   |
| fps                | 927      |
| nupdates           | 64000    |
| policy_entropy     | 2.06     |
| total_timesteps    | 320000   |
| value_loss         | 0.000401 |
---------------------------------
---------------------------------
| explained_variance | 0.85     |
| fps                | 927      |
| nupdates           | 64100    |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -3.93    |
| fps                | 923      |
| nupdates           | 66800    |
| policy_entropy     | 2.07     |
| total_timesteps    | 334000   |
| value_loss         | 0.000107 |
---------------------------------
---------------------------------
| explained_variance | -4.17    |
| fps                | 923      |
| nupdates           | 66900    |
| policy_entropy     | 2.07     |
| total_timesteps    | 334500   |
| value_loss         | 0.000976 |
---------------------------------
---------------------------------
| explained_variance | -4.2     |
| fps                | 923      |
| nupdates           | 67000    |
| policy_entropy     | 2.06     |
| total_timesteps    | 335000   |
| value_loss         | 0.000426 |
---------------------------------
---------------------------------
| explained_variance | 0.903    |
| fps                | 923      |
| nupdates           | 67100    |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.685    |
| fps                | 929      |
| nupdates           | 69900    |
| policy_entropy     | 2.05     |
| total_timesteps    | 349500   |
| value_loss         | 0.942    |
---------------------------------
Eval num_timesteps=350000, episode_reward=-4.90 +/- 0.30
Episode length: 553.30 +/- 133.57
---------------------------------
| explained_variance | -7.39    |
| fps                | 921      |
| nupdates           | 70000    |
| policy_entropy     | 2.05     |
| total_timesteps    | 350000   |
| value_loss         | 0.000524 |
---------------------------------
---------------------------------
| explained_variance | 0.746    |
| fps                | 921      |
| nupdates           | 70100    |
| policy_entropy     | 2.06     |
| total_timesteps    | 350500   |
| value_loss         | 6.13e-06 |
---------------------------------
---------------------------------
| explained_variance | -724     |
| fps                | 92

---------------------------------
| explained_variance | -13.1    |
| fps                | 926      |
| nupdates           | 72900    |
| policy_entropy     | 2.04     |
| total_timesteps    | 364500   |
| value_loss         | 0.00059  |
---------------------------------
---------------------------------
| explained_variance | -1.2     |
| fps                | 926      |
| nupdates           | 73000    |
| policy_entropy     | 2.03     |
| total_timesteps    | 365000   |
| value_loss         | 0.00183  |
---------------------------------
---------------------------------
| explained_variance | -15      |
| fps                | 926      |
| nupdates           | 73100    |
| policy_entropy     | 2.07     |
| total_timesteps    | 365500   |
| value_loss         | 0.000623 |
---------------------------------
---------------------------------
| explained_variance | 0.757    |
| fps                | 926      |
| nupdates           | 73200    |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.165    |
| fps                | 921      |
| nupdates           | 75900    |
| policy_entropy     | 2.07     |
| total_timesteps    | 379500   |
| value_loss         | 6.16e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.23    |
| fps                | 921      |
| nupdates           | 76000    |
| policy_entropy     | 2.04     |
| total_timesteps    | 380000   |
| value_loss         | 0.000495 |
---------------------------------
---------------------------------
| explained_variance | 0.355    |
| fps                | 922      |
| nupdates           | 76100    |
| policy_entropy     | 2.01     |
| total_timesteps    | 380500   |
| value_loss         | 0.1      |
---------------------------------
---------------------------------
| explained_variance | -0.608   |
| fps                | 922      |
| nupdates           | 76200    |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.0188  |
| fps                | 925      |
| nupdates           | 79000    |
| policy_entropy     | 2.06     |
| total_timesteps    | 395000   |
| value_loss         | 0.201    |
---------------------------------
---------------------------------
| explained_variance | 0.85     |
| fps                | 926      |
| nupdates           | 79100    |
| policy_entropy     | 2.06     |
| total_timesteps    | 395500   |
| value_loss         | 3.21e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.855    |
| fps                | 926      |
| nupdates           | 79200    |
| policy_entropy     | 2.07     |
| total_timesteps    | 396000   |
| value_loss         | 8.08e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.759    |
| fps                | 926      |
| nupdates           | 79300    |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.783    |
| fps                | 924      |
| nupdates           | 82000    |
| policy_entropy     | 2.07     |
| total_timesteps    | 410000   |
| value_loss         | 9.34e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.586    |
| fps                | 924      |
| nupdates           | 82100    |
| policy_entropy     | 2.06     |
| total_timesteps    | 410500   |
| value_loss         | 7.69e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.987   |
| fps                | 924      |
| nupdates           | 82200    |
| policy_entropy     | 2.07     |
| total_timesteps    | 411000   |
| value_loss         | 0.000174 |
---------------------------------
---------------------------------
| explained_variance | -0.644   |
| fps                | 924      |
| nupdates           | 82300    |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.36     |
| fps                | 922      |
| nupdates           | 85100    |
| policy_entropy     | 2.07     |
| total_timesteps    | 425500   |
| value_loss         | 8.99e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.09    |
| fps                | 922      |
| nupdates           | 85200    |
| policy_entropy     | 2.07     |
| total_timesteps    | 426000   |
| value_loss         | 0.000987 |
---------------------------------
---------------------------------
| explained_variance | 0.994    |
| fps                | 922      |
| nupdates           | 85300    |
| policy_entropy     | 2.07     |
| total_timesteps    | 426500   |
| value_loss         | 0.000855 |
---------------------------------
---------------------------------
| explained_variance | -4.65    |
| fps                | 922      |
| nupdates           | 85400    |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.801    |
| fps                | 926      |
| nupdates           | 88200    |
| policy_entropy     | 2.07     |
| total_timesteps    | 441000   |
| value_loss         | 0.00097  |
---------------------------------
---------------------------------
| explained_variance | -0.766   |
| fps                | 926      |
| nupdates           | 88300    |
| policy_entropy     | 2.06     |
| total_timesteps    | 441500   |
| value_loss         | 0.000331 |
---------------------------------
---------------------------------
| explained_variance | 0.746    |
| fps                | 926      |
| nupdates           | 88400    |
| policy_entropy     | 2.06     |
| total_timesteps    | 442000   |
| value_loss         | 0.000154 |
---------------------------------
---------------------------------
| explained_variance | 0.66     |
| fps                | 926      |
| nupdates           | 88500    |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.495    |
| fps                | 923      |
| nupdates           | 91200    |
| policy_entropy     | 2.06     |
| total_timesteps    | 456000   |
| value_loss         | 5.25e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.9     |
| fps                | 923      |
| nupdates           | 91300    |
| policy_entropy     | 2.06     |
| total_timesteps    | 456500   |
| value_loss         | 0.00145  |
---------------------------------
---------------------------------
| explained_variance | 0.386    |
| fps                | 923      |
| nupdates           | 91400    |
| policy_entropy     | 2.07     |
| total_timesteps    | 457000   |
| value_loss         | 0.146    |
---------------------------------
---------------------------------
| explained_variance | 0.897    |
| fps                | 924      |
| nupdates           | 91500    |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.674    |
| fps                | 928      |
| nupdates           | 94300    |
| policy_entropy     | 2.07     |
| total_timesteps    | 471500   |
| value_loss         | 4.8e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.998    |
| fps                | 928      |
| nupdates           | 94400    |
| policy_entropy     | 2.07     |
| total_timesteps    | 472000   |
| value_loss         | 0.00328  |
---------------------------------
---------------------------------
| explained_variance | 0.529    |
| fps                | 928      |
| nupdates           | 94500    |
| policy_entropy     | 2.06     |
| total_timesteps    | 472500   |
| value_loss         | 0.000105 |
---------------------------------
---------------------------------
| explained_variance | 0.709    |
| fps                | 928      |
| nupdates           | 94600    |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -0.542   |
| fps                | 927      |
| nupdates           | 97300    |
| policy_entropy     | 2.06     |
| total_timesteps    | 486500   |
| value_loss         | 0.00061  |
---------------------------------
---------------------------------
| explained_variance | -0.908   |
| fps                | 927      |
| nupdates           | 97400    |
| policy_entropy     | 2.03     |
| total_timesteps    | 487000   |
| value_loss         | 0.00126  |
---------------------------------
---------------------------------
| explained_variance | -10.5    |
| fps                | 927      |
| nupdates           | 97500    |
| policy_entropy     | 2.08     |
| total_timesteps    | 487500   |
| value_loss         | 0.000101 |
---------------------------------
---------------------------------
| explained_variance | 0.783    |
| fps                | 927      |
| nupdates           | 97600    |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -4.02    |
| fps                | 924      |
| nupdates           | 100300   |
| policy_entropy     | 2.08     |
| total_timesteps    | 501500   |
| value_loss         | 0.000113 |
---------------------------------
---------------------------------
| explained_variance | -3.05    |
| fps                | 925      |
| nupdates           | 100400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 502000   |
| value_loss         | 0.00105  |
---------------------------------
---------------------------------
| explained_variance | -4.82    |
| fps                | 925      |
| nupdates           | 100500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 502500   |
| value_loss         | 0.000367 |
---------------------------------
---------------------------------
| explained_variance | 0.00749  |
| fps                | 925      |
| nupdates           | 100600   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -0.799   |
| fps                | 929      |
| nupdates           | 103400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 517000   |
| value_loss         | 5.28e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.307   |
| fps                | 929      |
| nupdates           | 103500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 517500   |
| value_loss         | 0.000357 |
---------------------------------
---------------------------------
| explained_variance | 0.355    |
| fps                | 929      |
| nupdates           | 103600   |
| policy_entropy     | 2.08     |
| total_timesteps    | 518000   |
| value_loss         | 0.000154 |
---------------------------------
---------------------------------
| explained_variance | 0.512    |
| fps                | 929      |
| nupdates           | 103700   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -50.9    |
| fps                | 927      |
| nupdates           | 106400   |
| policy_entropy     | 2.08     |
| total_timesteps    | 532000   |
| value_loss         | 0.00585  |
---------------------------------
---------------------------------
| explained_variance | -1.8     |
| fps                | 927      |
| nupdates           | 106500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 532500   |
| value_loss         | 0.000106 |
---------------------------------
---------------------------------
| explained_variance | 0.328    |
| fps                | 927      |
| nupdates           | 106600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 533000   |
| value_loss         | 0.195    |
---------------------------------
---------------------------------
| explained_variance | 0.297    |
| fps                | 928      |
| nupdates           | 106700   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.0981   |
| fps                | 931      |
| nupdates           | 109500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 547500   |
| value_loss         | 0.000131 |
---------------------------------
---------------------------------
| explained_variance | 0.652    |
| fps                | 931      |
| nupdates           | 109600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 548000   |
| value_loss         | 0.000221 |
---------------------------------
---------------------------------
| explained_variance | 0.92     |
| fps                | 931      |
| nupdates           | 109700   |
| policy_entropy     | 2.08     |
| total_timesteps    | 548500   |
| value_loss         | 0.00017  |
---------------------------------
---------------------------------
| explained_variance | -2.69    |
| fps                | 931      |
| nupdates           | 109800   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.603    |
| fps                | 930      |
| nupdates           | 112500   |
| policy_entropy     | 2.08     |
| total_timesteps    | 562500   |
| value_loss         | 9.56e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.23     |
| fps                | 930      |
| nupdates           | 112600   |
| policy_entropy     | 2.08     |
| total_timesteps    | 563000   |
| value_loss         | 0.000321 |
---------------------------------
---------------------------------
| explained_variance | 0.433    |
| fps                | 930      |
| nupdates           | 112700   |
| policy_entropy     | 2.08     |
| total_timesteps    | 563500   |
| value_loss         | 7.08e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.657    |
| fps                | 930      |
| nupdates           | 112800   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.851    |
| fps                | 928      |
| nupdates           | 115500   |
| policy_entropy     | 2.08     |
| total_timesteps    | 577500   |
| value_loss         | 1.3e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.0894   |
| fps                | 928      |
| nupdates           | 115600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 578000   |
| value_loss         | 0.000365 |
---------------------------------
---------------------------------
| explained_variance | 0.846    |
| fps                | 928      |
| nupdates           | 115700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 578500   |
| value_loss         | 5.2e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.644    |
| fps                | 928      |
| nupdates           | 115800   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.889    |
| fps                | 931      |
| nupdates           | 118600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 593000   |
| value_loss         | 8.15e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.6      |
| fps                | 931      |
| nupdates           | 118700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 593500   |
| value_loss         | 0.00017  |
---------------------------------
---------------------------------
| explained_variance | -4.66    |
| fps                | 931      |
| nupdates           | 118800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 594000   |
| value_loss         | 8.19e-05 |
---------------------------------
---------------------------------
| explained_variance | -3.07    |
| fps                | 931      |
| nupdates           | 118900   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.756   |
| fps                | 929      |
| nupdates           | 121600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 608000   |
| value_loss         | 0.000774 |
---------------------------------
---------------------------------
| explained_variance | -2.53    |
| fps                | 929      |
| nupdates           | 121700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 608500   |
| value_loss         | 4.64e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.822   |
| fps                | 929      |
| nupdates           | 121800   |
| policy_entropy     | 2.08     |
| total_timesteps    | 609000   |
| value_loss         | 0.00107  |
---------------------------------
---------------------------------
| explained_variance | 0.606    |
| fps                | 929      |
| nupdates           | 121900   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.992    |
| fps                | 933      |
| nupdates           | 124700   |
| policy_entropy     | 2.08     |
| total_timesteps    | 623500   |
| value_loss         | 1.76e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.592    |
| fps                | 933      |
| nupdates           | 124800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 624000   |
| value_loss         | 3.27e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.216    |
| fps                | 933      |
| nupdates           | 124900   |
| policy_entropy     | 2.08     |
| total_timesteps    | 624500   |
| value_loss         | 0.000246 |
---------------------------------
Eval num_timesteps=625000, episode_reward=-4.90 +/- 0.30
Episode length: 629.70 +/- 85.29
---------------------------------
| explained_variance | 0.554    |
| fps                | 928

---------------------------------
| explained_variance | -9.32    |
| fps                | 931      |
| nupdates           | 127700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 638500   |
| value_loss         | 0.000209 |
---------------------------------
---------------------------------
| explained_variance | 0.0542   |
| fps                | 931      |
| nupdates           | 127800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 639000   |
| value_loss         | 0.000349 |
---------------------------------
---------------------------------
| explained_variance | -0.319   |
| fps                | 931      |
| nupdates           | 127900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 639500   |
| value_loss         | 0.000509 |
---------------------------------
---------------------------------
| explained_variance | 0.0419   |
| fps                | 931      |
| nupdates           | 128000   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -3.19    |
| fps                | 929      |
| nupdates           | 130700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 653500   |
| value_loss         | 0.000305 |
---------------------------------
---------------------------------
| explained_variance | 0.89     |
| fps                | 929      |
| nupdates           | 130800   |
| policy_entropy     | 2.05     |
| total_timesteps    | 654000   |
| value_loss         | 3.47e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.571    |
| fps                | 929      |
| nupdates           | 130900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 654500   |
| value_loss         | 0.000152 |
---------------------------------
---------------------------------
| explained_variance | -2.35    |
| fps                | 929      |
| nupdates           | 131000   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -31      |
| fps                | 932      |
| nupdates           | 133800   |
| policy_entropy     | 2.04     |
| total_timesteps    | 669000   |
| value_loss         | 0.00197  |
---------------------------------
---------------------------------
| explained_variance | 0.95     |
| fps                | 932      |
| nupdates           | 133900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 669500   |
| value_loss         | 1.01e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.948    |
| fps                | 932      |
| nupdates           | 134000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 670000   |
| value_loss         | 5.22e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.987    |
| fps                | 932      |
| nupdates           | 134100   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -1.91    |
| fps                | 930      |
| nupdates           | 136800   |
| policy_entropy     | 2.05     |
| total_timesteps    | 684000   |
| value_loss         | 0.000186 |
---------------------------------
---------------------------------
| explained_variance | 0.771    |
| fps                | 930      |
| nupdates           | 136900   |
| policy_entropy     | 2.02     |
| total_timesteps    | 684500   |
| value_loss         | 0.00193  |
---------------------------------
---------------------------------
| explained_variance | 0.949    |
| fps                | 931      |
| nupdates           | 137000   |
| policy_entropy     | 1.99     |
| total_timesteps    | 685000   |
| value_loss         | 2.08e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.333   |
| fps                | 931      |
| nupdates           | 137100   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -0.766   |
| fps                | 933      |
| nupdates           | 139900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 699500   |
| value_loss         | 0.00018  |
---------------------------------
Eval num_timesteps=700000, episode_reward=-4.90 +/- 0.30
Episode length: 598.00 +/- 111.90
---------------------------------
| explained_variance | 0.201    |
| fps                | 929      |
| nupdates           | 140000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 700000   |
| value_loss         | 0.000495 |
---------------------------------
---------------------------------
| explained_variance | -0.147   |
| fps                | 929      |
| nupdates           | 140100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 700500   |
| value_loss         | 0.000215 |
---------------------------------
---------------------------------
| explained_variance | 0.917    |
| fps                | 92

---------------------------------
| explained_variance | -5.24    |
| fps                | 932      |
| nupdates           | 142900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 714500   |
| value_loss         | 0.0012   |
---------------------------------
---------------------------------
| explained_variance | 0.477    |
| fps                | 932      |
| nupdates           | 143000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 715000   |
| value_loss         | 9.27e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.0367   |
| fps                | 932      |
| nupdates           | 143100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 715500   |
| value_loss         | 0.000181 |
---------------------------------
---------------------------------
| explained_variance | -1.22    |
| fps                | 932      |
| nupdates           | 143200   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -11.4    |
| fps                | 931      |
| nupdates           | 145900   |
| policy_entropy     | 2.04     |
| total_timesteps    | 729500   |
| value_loss         | 0.00115  |
---------------------------------
---------------------------------
| explained_variance | -1.93    |
| fps                | 931      |
| nupdates           | 146000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 730000   |
| value_loss         | 1.36e-05 |
---------------------------------
---------------------------------
| explained_variance | -14.6    |
| fps                | 932      |
| nupdates           | 146100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 730500   |
| value_loss         | 0.000198 |
---------------------------------
---------------------------------
| explained_variance | 0.0294   |
| fps                | 932      |
| nupdates           | 146200   |
| policy_entropy     | 1.98     |
| total_timest

---------------------------------
| explained_variance | -7.02    |
| fps                | 934      |
| nupdates           | 149000   |
| policy_entropy     | 2.08     |
| total_timesteps    | 745000   |
| value_loss         | 0.00117  |
---------------------------------
---------------------------------
| explained_variance | -1.52    |
| fps                | 934      |
| nupdates           | 149100   |
| policy_entropy     | 2.05     |
| total_timesteps    | 745500   |
| value_loss         | 0.00181  |
---------------------------------
---------------------------------
| explained_variance | 0.0541   |
| fps                | 934      |
| nupdates           | 149200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 746000   |
| value_loss         | 0.000116 |
---------------------------------
---------------------------------
| explained_variance | 0.437    |
| fps                | 934      |
| nupdates           | 149300   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.623    |
| fps                | 932      |
| nupdates           | 152000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 760000   |
| value_loss         | 9.88e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.0183  |
| fps                | 933      |
| nupdates           | 152100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 760500   |
| value_loss         | 0.0001   |
---------------------------------
---------------------------------
| explained_variance | 0.437    |
| fps                | 933      |
| nupdates           | 152200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 761000   |
| value_loss         | 0.000137 |
---------------------------------
---------------------------------
| explained_variance | 0.889    |
| fps                | 933      |
| nupdates           | 152300   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.613    |
| fps                | 931      |
| nupdates           | 155100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 775500   |
| value_loss         | 1e-05    |
---------------------------------
---------------------------------
| explained_variance | -2.41    |
| fps                | 932      |
| nupdates           | 155200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 776000   |
| value_loss         | 0.000113 |
---------------------------------
---------------------------------
| explained_variance | 0.24     |
| fps                | 932      |
| nupdates           | 155300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 776500   |
| value_loss         | 5.74e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.993    |
| fps                | 932      |
| nupdates           | 155400   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.678    |
| fps                | 934      |
| nupdates           | 158200   |
| policy_entropy     | 2.08     |
| total_timesteps    | 791000   |
| value_loss         | 0.000864 |
---------------------------------
---------------------------------
| explained_variance | -11      |
| fps                | 934      |
| nupdates           | 158300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 791500   |
| value_loss         | 0.000432 |
---------------------------------
---------------------------------
| explained_variance | 0.845    |
| fps                | 934      |
| nupdates           | 158400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 792000   |
| value_loss         | 3.02e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.29    |
| fps                | 934      |
| nupdates           | 158500   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.921    |
| fps                | 933      |
| nupdates           | 161200   |
| policy_entropy     | 1.73     |
| total_timesteps    | 806000   |
| value_loss         | 0.955    |
---------------------------------
---------------------------------
| explained_variance | -1.56    |
| fps                | 933      |
| nupdates           | 161300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 806500   |
| value_loss         | 9.01e-05 |
---------------------------------
---------------------------------
| explained_variance | -6.23    |
| fps                | 934      |
| nupdates           | 161400   |
| policy_entropy     | 2.03     |
| total_timesteps    | 807000   |
| value_loss         | 0.0158   |
---------------------------------
---------------------------------
| explained_variance | 0.822    |
| fps                | 934      |
| nupdates           | 161500   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.698    |
| fps                | 936      |
| nupdates           | 164300   |
| policy_entropy     | 2.03     |
| total_timesteps    | 821500   |
| value_loss         | 0.000154 |
---------------------------------
----------------------------------
| explained_variance | -2.59e+03 |
| fps                | 936       |
| nupdates           | 164400    |
| policy_entropy     | 2.06      |
| total_timesteps    | 822000    |
| value_loss         | 0.0843    |
----------------------------------
---------------------------------
| explained_variance | 0.35     |
| fps                | 936      |
| nupdates           | 164500   |
| policy_entropy     | 2.08     |
| total_timesteps    | 822500   |
| value_loss         | 0.000285 |
---------------------------------
---------------------------------
| explained_variance | -0.867   |
| fps                | 936      |
| nupdates           | 164600   |
| policy_entropy     | 2.07     |
| tota

---------------------------------
| explained_variance | -0.104   |
| fps                | 934      |
| nupdates           | 167300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 836500   |
| value_loss         | 0.000349 |
---------------------------------
---------------------------------
| explained_variance | 0.793    |
| fps                | 934      |
| nupdates           | 167400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 837000   |
| value_loss         | 7.56e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.289   |
| fps                | 934      |
| nupdates           | 167500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 837500   |
| value_loss         | 0.000172 |
---------------------------------
---------------------------------
| explained_variance | 0.142    |
| fps                | 934      |
| nupdates           | 167600   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -1.35    |
| fps                | 933      |
| nupdates           | 170300   |
| policy_entropy     | 2.04     |
| total_timesteps    | 851500   |
| value_loss         | 0.00151  |
---------------------------------
---------------------------------
| explained_variance | -2.48    |
| fps                | 933      |
| nupdates           | 170400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 852000   |
| value_loss         | 0.000118 |
---------------------------------
---------------------------------
| explained_variance | 0.0887   |
| fps                | 933      |
| nupdates           | 170500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 852500   |
| value_loss         | 0.000282 |
---------------------------------
---------------------------------
| explained_variance | -0.169   |
| fps                | 933      |
| nupdates           | 170600   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -0.523   |
| fps                | 935      |
| nupdates           | 173400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 867000   |
| value_loss         | 4.34e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.37    |
| fps                | 935      |
| nupdates           | 173500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 867500   |
| value_loss         | 0.00184  |
---------------------------------
---------------------------------
| explained_variance | -2.14    |
| fps                | 935      |
| nupdates           | 173600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 868000   |
| value_loss         | 0.000771 |
---------------------------------
---------------------------------
| explained_variance | 0.163    |
| fps                | 935      |
| nupdates           | 173700   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -6.36    |
| fps                | 933      |
| nupdates           | 176400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 882000   |
| value_loss         | 0.00108  |
---------------------------------
---------------------------------
| explained_variance | 0.939    |
| fps                | 933      |
| nupdates           | 176500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 882500   |
| value_loss         | 2.46e-05 |
---------------------------------
---------------------------------
| explained_variance | -34.2    |
| fps                | 934      |
| nupdates           | 176600   |
| policy_entropy     | 2.05     |
| total_timesteps    | 883000   |
| value_loss         | 0.00155  |
---------------------------------
---------------------------------
| explained_variance | -0.0322  |
| fps                | 934      |
| nupdates           | 176700   |
| policy_entropy     | 2.02     |
| total_timest

---------------------------------
| explained_variance | -6.48    |
| fps                | 936      |
| nupdates           | 179500   |
| policy_entropy     | 2.04     |
| total_timesteps    | 897500   |
| value_loss         | 8.4e-05  |
---------------------------------
---------------------------------
| explained_variance | -11.8    |
| fps                | 936      |
| nupdates           | 179600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 898000   |
| value_loss         | 0.000193 |
---------------------------------
---------------------------------
| explained_variance | 0.392    |
| fps                | 936      |
| nupdates           | 179700   |
| policy_entropy     | 1.98     |
| total_timesteps    | 898500   |
| value_loss         | 0.157    |
---------------------------------
---------------------------------
| explained_variance | 0.592    |
| fps                | 936      |
| nupdates           | 179800   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.606    |
| fps                | 935      |
| nupdates           | 182500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 912500   |
| value_loss         | 7.7e-05  |
---------------------------------
---------------------------------
| explained_variance | -1.46    |
| fps                | 935      |
| nupdates           | 182600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 913000   |
| value_loss         | 0.000197 |
---------------------------------
---------------------------------
| explained_variance | -2.23    |
| fps                | 935      |
| nupdates           | 182700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 913500   |
| value_loss         | 0.000165 |
---------------------------------
---------------------------------
| explained_variance | 0.354    |
| fps                | 935      |
| nupdates           | 182800   |
| policy_entropy     | 1.98     |
| total_timest

---------------------------------
| explained_variance | 0.786    |
| fps                | 934      |
| nupdates           | 185500   |
| policy_entropy     | 2.05     |
| total_timesteps    | 927500   |
| value_loss         | 0.000101 |
---------------------------------
---------------------------------
| explained_variance | -0.0837  |
| fps                | 934      |
| nupdates           | 185600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 928000   |
| value_loss         | 0.000448 |
---------------------------------
---------------------------------
| explained_variance | 0.44     |
| fps                | 934      |
| nupdates           | 185700   |
| policy_entropy     | 2.05     |
| total_timesteps    | 928500   |
| value_loss         | 0.00055  |
---------------------------------
---------------------------------
| explained_variance | -2.62    |
| fps                | 934      |
| nupdates           | 185800   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.819    |
| fps                | 936      |
| nupdates           | 188600   |
| policy_entropy     | 2        |
| total_timesteps    | 943000   |
| value_loss         | 6.79e-05 |
---------------------------------
---------------------------------
| explained_variance | -1e+03   |
| fps                | 936      |
| nupdates           | 188700   |
| policy_entropy     | 2.05     |
| total_timesteps    | 943500   |
| value_loss         | 0.0754   |
---------------------------------
---------------------------------
| explained_variance | 0.748    |
| fps                | 936      |
| nupdates           | 188800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 944000   |
| value_loss         | 0.000683 |
---------------------------------
---------------------------------
| explained_variance | -0.406   |
| fps                | 936      |
| nupdates           | 188900   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -1.18    |
| fps                | 935      |
| nupdates           | 191600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 958000   |
| value_loss         | 0.000568 |
---------------------------------
---------------------------------
| explained_variance | 0.326    |
| fps                | 935      |
| nupdates           | 191700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 958500   |
| value_loss         | 7.46e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.02    |
| fps                | 935      |
| nupdates           | 191800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 959000   |
| value_loss         | 7.48e-05 |
---------------------------------
---------------------------------
| explained_variance | -969     |
| fps                | 935      |
| nupdates           | 191900   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.696    |
| fps                | 937      |
| nupdates           | 194700   |
| policy_entropy     | 2.08     |
| total_timesteps    | 973500   |
| value_loss         | 7.55e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.313    |
| fps                | 937      |
| nupdates           | 194800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 974000   |
| value_loss         | 2.36e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.196    |
| fps                | 937      |
| nupdates           | 194900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 974500   |
| value_loss         | 0.000476 |
---------------------------------
Eval num_timesteps=975000, episode_reward=-4.70 +/- 0.46
Episode length: 607.30 +/- 154.23
---------------------------------
| explained_variance | 0.605    |
| fps                | 93

---------------------------------
| explained_variance | -0.156   |
| fps                | 936      |
| nupdates           | 197700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 988500   |
| value_loss         | 0.000267 |
---------------------------------
---------------------------------
| explained_variance | -2.58    |
| fps                | 936      |
| nupdates           | 197800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 989000   |
| value_loss         | 0.000616 |
---------------------------------
---------------------------------
| explained_variance | -1.13    |
| fps                | 936      |
| nupdates           | 197900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 989500   |
| value_loss         | 0.000134 |
---------------------------------
---------------------------------
| explained_variance | -0.436   |
| fps                | 937      |
| nupdates           | 198000   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -32.8    |
| fps                | 936      |
| nupdates           | 200700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1003500  |
| value_loss         | 0.00131  |
---------------------------------
---------------------------------
| explained_variance | 0.66     |
| fps                | 936      |
| nupdates           | 200800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1004000  |
| value_loss         | 8e-05    |
---------------------------------
---------------------------------
| explained_variance | 0.907    |
| fps                | 936      |
| nupdates           | 200900   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1004500  |
| value_loss         | 1.42e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.339    |
| fps                | 936      |
| nupdates           | 201000   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -0.156   |
| fps                | 938      |
| nupdates           | 203800   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1019000  |
| value_loss         | 8.07e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.278    |
| fps                | 938      |
| nupdates           | 203900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1019500  |
| value_loss         | 6.34e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.55    |
| fps                | 938      |
| nupdates           | 204000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1020000  |
| value_loss         | 0.000319 |
---------------------------------
---------------------------------
| explained_variance | 0.737    |
| fps                | 938      |
| nupdates           | 204100   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -4.09    |
| fps                | 937      |
| nupdates           | 206800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1034000  |
| value_loss         | 0.00222  |
---------------------------------
---------------------------------
| explained_variance | -0.842   |
| fps                | 937      |
| nupdates           | 206900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1034500  |
| value_loss         | 0.000264 |
---------------------------------
---------------------------------
| explained_variance | 0.586    |
| fps                | 937      |
| nupdates           | 207000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1035000  |
| value_loss         | 3.47e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.345    |
| fps                | 937      |
| nupdates           | 207100   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.159    |
| fps                | 939      |
| nupdates           | 209900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1049500  |
| value_loss         | 0.000762 |
---------------------------------
Eval num_timesteps=1050000, episode_reward=-4.60 +/- 0.66
Episode length: 612.20 +/- 67.48
---------------------------------
| explained_variance | 0.799    |
| fps                | 936      |
| nupdates           | 210000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1050000  |
| value_loss         | 3.39e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.774    |
| fps                | 936      |
| nupdates           | 210100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1050500  |
| value_loss         | 0.000111 |
---------------------------------
---------------------------------
| explained_variance | -20.9    |
| fps                | 93

---------------------------------
| explained_variance | 0.982    |
| fps                | 937      |
| nupdates           | 212900   |
| policy_entropy     | 2        |
| total_timesteps    | 1064500  |
| value_loss         | 3.49e-05 |
---------------------------------
---------------------------------
| explained_variance | -208     |
| fps                | 937      |
| nupdates           | 213000   |
| policy_entropy     | 2.03     |
| total_timesteps    | 1065000  |
| value_loss         | 0.0442   |
---------------------------------
---------------------------------
| explained_variance | -1.33    |
| fps                | 937      |
| nupdates           | 213100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1065500  |
| value_loss         | 4.12e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.274    |
| fps                | 937      |
| nupdates           | 213200   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -3.19    |
| fps                | 934      |
| nupdates           | 215900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1079500  |
| value_loss         | 0.00156  |
---------------------------------
---------------------------------
| explained_variance | -19      |
| fps                | 934      |
| nupdates           | 216000   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1080000  |
| value_loss         | 0.00106  |
---------------------------------
---------------------------------
| explained_variance | -0.247   |
| fps                | 934      |
| nupdates           | 216100   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1080500  |
| value_loss         | 0.000374 |
---------------------------------
---------------------------------
| explained_variance | 0.766    |
| fps                | 934      |
| nupdates           | 216200   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -196     |
| fps                | 935      |
| nupdates           | 219000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1095000  |
| value_loss         | 0.00499  |
---------------------------------
---------------------------------
| explained_variance | -2.79    |
| fps                | 935      |
| nupdates           | 219100   |
| policy_entropy     | 2.02     |
| total_timesteps    | 1095500  |
| value_loss         | 0.00189  |
---------------------------------
---------------------------------
| explained_variance | -10.7    |
| fps                | 935      |
| nupdates           | 219200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1096000  |
| value_loss         | 0.00025  |
---------------------------------
---------------------------------
| explained_variance | 0.988    |
| fps                | 935      |
| nupdates           | 219300   |
| policy_entropy     | 2.02     |
| total_timest

---------------------------------
| explained_variance | -3.91    |
| fps                | 932      |
| nupdates           | 222000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1110000  |
| value_loss         | 7.25e-05 |
---------------------------------
---------------------------------
| explained_variance | -7.46    |
| fps                | 932      |
| nupdates           | 222100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1110500  |
| value_loss         | 0.000765 |
---------------------------------
---------------------------------
| explained_variance | 0.653    |
| fps                | 932      |
| nupdates           | 222200   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1111000  |
| value_loss         | 0.000221 |
---------------------------------
---------------------------------
| explained_variance | 0.653    |
| fps                | 932      |
| nupdates           | 222300   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -3.66    |
| fps                | 930      |
| nupdates           | 225100   |
| policy_entropy     | 2.02     |
| total_timesteps    | 1125500  |
| value_loss         | 0.00127  |
---------------------------------
---------------------------------
| explained_variance | -7.26    |
| fps                | 931      |
| nupdates           | 225200   |
| policy_entropy     | 1.99     |
| total_timesteps    | 1126000  |
| value_loss         | 0.00296  |
---------------------------------
---------------------------------
| explained_variance | 0.168    |
| fps                | 931      |
| nupdates           | 225300   |
| policy_entropy     | 2.02     |
| total_timesteps    | 1126500  |
| value_loss         | 0.000412 |
---------------------------------
---------------------------------
| explained_variance | -5.08    |
| fps                | 931      |
| nupdates           | 225400   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.984    |
| fps                | 932      |
| nupdates           | 228200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1141000  |
| value_loss         | 1.56e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.99    |
| fps                | 932      |
| nupdates           | 228300   |
| policy_entropy     | 2.03     |
| total_timesteps    | 1141500  |
| value_loss         | 0.000123 |
---------------------------------
---------------------------------
| explained_variance | 0.735    |
| fps                | 932      |
| nupdates           | 228400   |
| policy_entropy     | 1.88     |
| total_timesteps    | 1142000  |
| value_loss         | 0.000288 |
---------------------------------
---------------------------------
| explained_variance | 0.264    |
| fps                | 932      |
| nupdates           | 228500   |
| policy_entropy     | 1.95     |
| total_timest

---------------------------------
| explained_variance | 0.691    |
| fps                | 929      |
| nupdates           | 231200   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1156000  |
| value_loss         | 4.72e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.67    |
| fps                | 930      |
| nupdates           | 231300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1156500  |
| value_loss         | 0.000137 |
---------------------------------
---------------------------------
| explained_variance | -2.65    |
| fps                | 930      |
| nupdates           | 231400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1157000  |
| value_loss         | 0.000332 |
---------------------------------
---------------------------------
| explained_variance | -2.67    |
| fps                | 930      |
| nupdates           | 231500   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.567    |
| fps                | 930      |
| nupdates           | 234300   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1171500  |
| value_loss         | 2.77e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.773   |
| fps                | 930      |
| nupdates           | 234400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1172000  |
| value_loss         | 6.05e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.417    |
| fps                | 930      |
| nupdates           | 234500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1172500  |
| value_loss         | 2.38e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.58    |
| fps                | 930      |
| nupdates           | 234600   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.505    |
| fps                | 928      |
| nupdates           | 237300   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1186500  |
| value_loss         | 0.000105 |
---------------------------------
---------------------------------
| explained_variance | 0.849    |
| fps                | 928      |
| nupdates           | 237400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1187000  |
| value_loss         | 0.000522 |
---------------------------------
---------------------------------
| explained_variance | 0.274    |
| fps                | 928      |
| nupdates           | 237500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1187500  |
| value_loss         | 0.000108 |
---------------------------------
---------------------------------
| explained_variance | 0.536    |
| fps                | 928      |
| nupdates           | 237600   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.0312  |
| fps                | 926      |
| nupdates           | 240300   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1201500  |
| value_loss         | 0.000536 |
---------------------------------
---------------------------------
| explained_variance | -2.17    |
| fps                | 926      |
| nupdates           | 240400   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1202000  |
| value_loss         | 5.47e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.39    |
| fps                | 926      |
| nupdates           | 240500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1202500  |
| value_loss         | 0.000667 |
---------------------------------
---------------------------------
| explained_variance | 0.742    |
| fps                | 926      |
| nupdates           | 240600   |
| policy_entropy     | 1.99     |
| total_timest

---------------------------------
| explained_variance | -2.61    |
| fps                | 927      |
| nupdates           | 243400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1217000  |
| value_loss         | 0.000616 |
---------------------------------
---------------------------------
| explained_variance | 0.809    |
| fps                | 927      |
| nupdates           | 243500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1217500  |
| value_loss         | 0.000193 |
---------------------------------
---------------------------------
| explained_variance | -1.47    |
| fps                | 927      |
| nupdates           | 243600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1218000  |
| value_loss         | 0.000158 |
---------------------------------
---------------------------------
| explained_variance | -0.0178  |
| fps                | 927      |
| nupdates           | 243700   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -1.52    |
| fps                | 926      |
| nupdates           | 246400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1232000  |
| value_loss         | 0.000901 |
---------------------------------
---------------------------------
| explained_variance | -0.649   |
| fps                | 926      |
| nupdates           | 246500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1232500  |
| value_loss         | 0.000112 |
---------------------------------
---------------------------------
| explained_variance | 0.159    |
| fps                | 926      |
| nupdates           | 246600   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1233000  |
| value_loss         | 0.00121  |
---------------------------------
---------------------------------
| explained_variance | 0.527    |
| fps                | 926      |
| nupdates           | 246700   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -5.06    |
| fps                | 927      |
| nupdates           | 249500   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1247500  |
| value_loss         | 0.00112  |
---------------------------------
---------------------------------
| explained_variance | 0.336    |
| fps                | 927      |
| nupdates           | 249600   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1248000  |
| value_loss         | 0.104    |
---------------------------------
---------------------------------
| explained_variance | 0.913    |
| fps                | 927      |
| nupdates           | 249700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1248500  |
| value_loss         | 5.83e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.0762   |
| fps                | 927      |
| nupdates           | 249800   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.305   |
| fps                | 926      |
| nupdates           | 252500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1262500  |
| value_loss         | 7.48e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.388    |
| fps                | 927      |
| nupdates           | 252600   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1263000  |
| value_loss         | 0.000118 |
---------------------------------
---------------------------------
| explained_variance | -0.595   |
| fps                | 927      |
| nupdates           | 252700   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1263500  |
| value_loss         | 9.75e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.898    |
| fps                | 927      |
| nupdates           | 252800   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.426    |
| fps                | 925      |
| nupdates           | 255500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1277500  |
| value_loss         | 0.000729 |
---------------------------------
---------------------------------
| explained_variance | 0.0752   |
| fps                | 925      |
| nupdates           | 255600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1278000  |
| value_loss         | 0.000285 |
---------------------------------
---------------------------------
| explained_variance | 0.98     |
| fps                | 925      |
| nupdates           | 255700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1278500  |
| value_loss         | 0.000167 |
---------------------------------
---------------------------------
| explained_variance | 0.428    |
| fps                | 925      |
| nupdates           | 255800   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.0388   |
| fps                | 926      |
| nupdates           | 258600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1293000  |
| value_loss         | 3.55e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.919    |
| fps                | 926      |
| nupdates           | 258700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1293500  |
| value_loss         | 5.44e-05 |
---------------------------------
---------------------------------
| explained_variance | -20.1    |
| fps                | 926      |
| nupdates           | 258800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1294000  |
| value_loss         | 0.000113 |
---------------------------------
---------------------------------
| explained_variance | -24.4    |
| fps                | 926      |
| nupdates           | 258900   |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | 0.462    |
| fps                | 925      |
| nupdates           | 261600   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1308000  |
| value_loss         | 0.000323 |
---------------------------------
---------------------------------
| explained_variance | -0.803   |
| fps                | 925      |
| nupdates           | 261700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1308500  |
| value_loss         | 0.000372 |
---------------------------------
---------------------------------
| explained_variance | 0.546    |
| fps                | 925      |
| nupdates           | 261800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1309000  |
| value_loss         | 6.67e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.72    |
| fps                | 925      |
| nupdates           | 261900   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.92     |
| fps                | 925      |
| nupdates           | 264700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1323500  |
| value_loss         | 0.000174 |
---------------------------------
---------------------------------
| explained_variance | -0.0631  |
| fps                | 925      |
| nupdates           | 264800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1324000  |
| value_loss         | 2.56e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.41    |
| fps                | 925      |
| nupdates           | 264900   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1324500  |
| value_loss         | 6.39e-05 |
---------------------------------
Eval num_timesteps=1325000, episode_reward=-5.00 +/- 0.00
Episode length: 536.50 +/- 80.40
---------------------------------
| explained_variance | 0.967    |
| fps                | 92

---------------------------------
| explained_variance | 0.657    |
| fps                | 924      |
| nupdates           | 267700   |
| policy_entropy     | 2.03     |
| total_timesteps    | 1338500  |
| value_loss         | 0.000941 |
---------------------------------
---------------------------------
| explained_variance | -0.194   |
| fps                | 924      |
| nupdates           | 267800   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1339000  |
| value_loss         | 0.000258 |
---------------------------------
---------------------------------
| explained_variance | -4.09    |
| fps                | 924      |
| nupdates           | 267900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1339500  |
| value_loss         | 0.000147 |
---------------------------------
---------------------------------
| explained_variance | -0.743   |
| fps                | 924      |
| nupdates           | 268000   |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | 0.909    |
| fps                | 923      |
| nupdates           | 270700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1353500  |
| value_loss         | 2.38e-06 |
---------------------------------
---------------------------------
| explained_variance | -10.4    |
| fps                | 923      |
| nupdates           | 270800   |
| policy_entropy     | 2.01     |
| total_timesteps    | 1354000  |
| value_loss         | 0.00084  |
---------------------------------
---------------------------------
| explained_variance | 0.803    |
| fps                | 923      |
| nupdates           | 270900   |
| policy_entropy     | 2.02     |
| total_timesteps    | 1354500  |
| value_loss         | 0.000455 |
---------------------------------
---------------------------------
| explained_variance | 0.189    |
| fps                | 923      |
| nupdates           | 271000   |
| policy_entropy     | 2.02     |
| total_timest

---------------------------------
| explained_variance | 0.895    |
| fps                | 924      |
| nupdates           | 273800   |
| policy_entropy     | 2.03     |
| total_timesteps    | 1369000  |
| value_loss         | 0.000532 |
---------------------------------
---------------------------------
| explained_variance | 0.989    |
| fps                | 924      |
| nupdates           | 273900   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1369500  |
| value_loss         | 5.75e-05 |
---------------------------------
---------------------------------
| explained_variance | -4.65    |
| fps                | 924      |
| nupdates           | 274000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1370000  |
| value_loss         | 0.00162  |
---------------------------------
---------------------------------
| explained_variance | 0.353    |
| fps                | 924      |
| nupdates           | 274100   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -3.94    |
| fps                | 924      |
| nupdates           | 276800   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1384000  |
| value_loss         | 3e-05    |
---------------------------------
---------------------------------
| explained_variance | 0.439    |
| fps                | 924      |
| nupdates           | 276900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1384500  |
| value_loss         | 0.000136 |
---------------------------------
---------------------------------
| explained_variance | -0.406   |
| fps                | 924      |
| nupdates           | 277000   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1385000  |
| value_loss         | 0.000195 |
---------------------------------
---------------------------------
| explained_variance | -3.38    |
| fps                | 924      |
| nupdates           | 277100   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -0.414   |
| fps                | 925      |
| nupdates           | 279900   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1399500  |
| value_loss         | 0.000433 |
---------------------------------
Eval num_timesteps=1400000, episode_reward=-4.90 +/- 0.30
Episode length: 555.80 +/- 88.60
---------------------------------
| explained_variance | -1.09    |
| fps                | 923      |
| nupdates           | 280000   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1400000  |
| value_loss         | 0.000682 |
---------------------------------
---------------------------------
| explained_variance | 0.964    |
| fps                | 923      |
| nupdates           | 280100   |
| policy_entropy     | 2.02     |
| total_timesteps    | 1400500  |
| value_loss         | 8.36e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.702    |
| fps                | 92

---------------------------------
| explained_variance | -5.06    |
| fps                | 924      |
| nupdates           | 282900   |
| policy_entropy     | 1.82     |
| total_timesteps    | 1414500  |
| value_loss         | 0.00243  |
---------------------------------
---------------------------------
| explained_variance | 0.239    |
| fps                | 924      |
| nupdates           | 283000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1415000  |
| value_loss         | 0.145    |
---------------------------------
---------------------------------
| explained_variance | -0.391   |
| fps                | 924      |
| nupdates           | 283100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1415500  |
| value_loss         | 0.000599 |
---------------------------------
---------------------------------
| explained_variance | 0.997    |
| fps                | 924      |
| nupdates           | 283200   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.975    |
| fps                | 923      |
| nupdates           | 285900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1429500  |
| value_loss         | 1.98e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.887    |
| fps                | 923      |
| nupdates           | 286000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1430000  |
| value_loss         | 0.000111 |
---------------------------------
---------------------------------
| explained_variance | 0.661    |
| fps                | 923      |
| nupdates           | 286100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1430500  |
| value_loss         | 0.000183 |
---------------------------------
---------------------------------
| explained_variance | 0.618    |
| fps                | 923      |
| nupdates           | 286200   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -1.9e+04 |
| fps                | 924      |
| nupdates           | 289000   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1445000  |
| value_loss         | 0.179    |
---------------------------------
---------------------------------
| explained_variance | 0.974    |
| fps                | 924      |
| nupdates           | 289100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1445500  |
| value_loss         | 9.76e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.23    |
| fps                | 924      |
| nupdates           | 289200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1446000  |
| value_loss         | 0.0142   |
---------------------------------
---------------------------------
| explained_variance | 0.359    |
| fps                | 924      |
| nupdates           | 289300   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.0956   |
| fps                | 922      |
| nupdates           | 292000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1460000  |
| value_loss         | 0.000973 |
---------------------------------
---------------------------------
| explained_variance | 0.161    |
| fps                | 922      |
| nupdates           | 292100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1460500  |
| value_loss         | 7.37e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.0343   |
| fps                | 922      |
| nupdates           | 292200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1461000  |
| value_loss         | 3.15e-05 |
---------------------------------
---------------------------------
| explained_variance | -7.98    |
| fps                | 922      |
| nupdates           | 292300   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.39     |
| fps                | 920      |
| nupdates           | 295100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1475500  |
| value_loss         | 8.57e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.752    |
| fps                | 920      |
| nupdates           | 295200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1476000  |
| value_loss         | 5.39e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.915    |
| fps                | 920      |
| nupdates           | 295300   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1476500  |
| value_loss         | 5.56e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.34     |
| fps                | 920      |
| nupdates           | 295400   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.945    |
| fps                | 920      |
| nupdates           | 298200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1491000  |
| value_loss         | 0.000112 |
---------------------------------
---------------------------------
| explained_variance | 0.669    |
| fps                | 920      |
| nupdates           | 298300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1491500  |
| value_loss         | 0.000887 |
---------------------------------
---------------------------------
| explained_variance | 0.519    |
| fps                | 920      |
| nupdates           | 298400   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1492000  |
| value_loss         | 0.000179 |
---------------------------------
---------------------------------
| explained_variance | 0.37     |
| fps                | 920      |
| nupdates           | 298500   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -1.26    |
| fps                | 918      |
| nupdates           | 301200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1506000  |
| value_loss         | 0.000267 |
---------------------------------
---------------------------------
| explained_variance | -3.07    |
| fps                | 918      |
| nupdates           | 301300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1506500  |
| value_loss         | 8.14e-05 |
---------------------------------
---------------------------------
| explained_variance | -9.89    |
| fps                | 918      |
| nupdates           | 301400   |
| policy_entropy     | 2.03     |
| total_timesteps    | 1507000  |
| value_loss         | 0.00106  |
---------------------------------
---------------------------------
| explained_variance | 0.952    |
| fps                | 918      |
| nupdates           | 301500   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.0291  |
| fps                | 917      |
| nupdates           | 304300   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1521500  |
| value_loss         | 4.58e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.334    |
| fps                | 917      |
| nupdates           | 304400   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1522000  |
| value_loss         | 1.69e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.5      |
| fps                | 917      |
| nupdates           | 304500   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1522500  |
| value_loss         | 4.01e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.619    |
| fps                | 917      |
| nupdates           | 304600   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.174    |
| fps                | 916      |
| nupdates           | 307300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1536500  |
| value_loss         | 2.23e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.794    |
| fps                | 916      |
| nupdates           | 307400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1537000  |
| value_loss         | 3.57e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.65    |
| fps                | 916      |
| nupdates           | 307500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1537500  |
| value_loss         | 7.53e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.455    |
| fps                | 916      |
| nupdates           | 307600   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.442   |
| fps                | 915      |
| nupdates           | 310300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1551500  |
| value_loss         | 0.000281 |
---------------------------------
---------------------------------
| explained_variance | 0.28     |
| fps                | 915      |
| nupdates           | 310400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1552000  |
| value_loss         | 8.89e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.986    |
| fps                | 915      |
| nupdates           | 310500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1552500  |
| value_loss         | 1.51e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.995    |
| fps                | 915      |
| nupdates           | 310600   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.367    |
| fps                | 916      |
| nupdates           | 313400   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1567000  |
| value_loss         | 7.02e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.43     |
| fps                | 916      |
| nupdates           | 313500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1567500  |
| value_loss         | 1.9e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.828    |
| fps                | 916      |
| nupdates           | 313600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1568000  |
| value_loss         | 5.18e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.75    |
| fps                | 916      |
| nupdates           | 313700   |
| policy_entropy     | 1.93     |
| total_timest

---------------------------------
| explained_variance | -5.42    |
| fps                | 915      |
| nupdates           | 316400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1582000  |
| value_loss         | 0.00107  |
---------------------------------
---------------------------------
| explained_variance | -17.2    |
| fps                | 915      |
| nupdates           | 316500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1582500  |
| value_loss         | 0.000887 |
---------------------------------
---------------------------------
| explained_variance | 0.508    |
| fps                | 915      |
| nupdates           | 316600   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1583000  |
| value_loss         | 3.94e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.986    |
| fps                | 915      |
| nupdates           | 316700   |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | -0.504   |
| fps                | 916      |
| nupdates           | 319500   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1597500  |
| value_loss         | 0.000482 |
---------------------------------
---------------------------------
| explained_variance | 0.474    |
| fps                | 917      |
| nupdates           | 319600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1598000  |
| value_loss         | 0.000187 |
---------------------------------
---------------------------------
| explained_variance | 0.435    |
| fps                | 917      |
| nupdates           | 319700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1598500  |
| value_loss         | 0.000412 |
---------------------------------
---------------------------------
| explained_variance | -0.324   |
| fps                | 917      |
| nupdates           | 319800   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.89     |
| fps                | 915      |
| nupdates           | 322500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1612500  |
| value_loss         | 6.12e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.502   |
| fps                | 915      |
| nupdates           | 322600   |
| policy_entropy     | 1.98     |
| total_timesteps    | 1613000  |
| value_loss         | 0.000289 |
---------------------------------
---------------------------------
| explained_variance | 0.0471   |
| fps                | 915      |
| nupdates           | 322700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1613500  |
| value_loss         | 2.64e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.09    |
| fps                | 915      |
| nupdates           | 322800   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.759    |
| fps                | 914      |
| nupdates           | 325500   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1627500  |
| value_loss         | 0.000158 |
---------------------------------
---------------------------------
| explained_variance | -2.38    |
| fps                | 914      |
| nupdates           | 325600   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1628000  |
| value_loss         | 0.000339 |
---------------------------------
---------------------------------
| explained_variance | 0.123    |
| fps                | 914      |
| nupdates           | 325700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1628500  |
| value_loss         | 0.000105 |
---------------------------------
---------------------------------
| explained_variance | 0.997    |
| fps                | 914      |
| nupdates           | 325800   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.592    |
| fps                | 915      |
| nupdates           | 328600   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1643000  |
| value_loss         | 0.000143 |
---------------------------------
---------------------------------
| explained_variance | -0.148   |
| fps                | 915      |
| nupdates           | 328700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1643500  |
| value_loss         | 0.00115  |
---------------------------------
---------------------------------
| explained_variance | -0.22    |
| fps                | 915      |
| nupdates           | 328800   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1644000  |
| value_loss         | 1.64e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.317    |
| fps                | 915      |
| nupdates           | 328900   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.924    |
| fps                | 914      |
| nupdates           | 331600   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1658000  |
| value_loss         | 0.000187 |
---------------------------------
---------------------------------
| explained_variance | 0.887    |
| fps                | 914      |
| nupdates           | 331700   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1658500  |
| value_loss         | 4.11e-05 |
---------------------------------
---------------------------------
| explained_variance | -81.1    |
| fps                | 914      |
| nupdates           | 331800   |
| policy_entropy     | 2.01     |
| total_timesteps    | 1659000  |
| value_loss         | 0.00424  |
---------------------------------
---------------------------------
| explained_variance | -1.27    |
| fps                | 914      |
| nupdates           | 331900   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -0.137   |
| fps                | 915      |
| nupdates           | 334700   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1673500  |
| value_loss         | 0.000316 |
---------------------------------
---------------------------------
| explained_variance | -56.7    |
| fps                | 915      |
| nupdates           | 334800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1674000  |
| value_loss         | 0.00102  |
---------------------------------
---------------------------------
| explained_variance | 0.0658   |
| fps                | 915      |
| nupdates           | 334900   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1674500  |
| value_loss         | 0.000297 |
---------------------------------
Eval num_timesteps=1675000, episode_reward=-4.80 +/- 0.40
Episode length: 625.80 +/- 104.17
---------------------------------
| explained_variance | 0.832    |
| fps                | 9

---------------------------------
| explained_variance | 0.204    |
| fps                | 914      |
| nupdates           | 337700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1688500  |
| value_loss         | 0.000151 |
---------------------------------
---------------------------------
| explained_variance | 0.862    |
| fps                | 914      |
| nupdates           | 337800   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1689000  |
| value_loss         | 0.000189 |
---------------------------------
---------------------------------
| explained_variance | 0.997    |
| fps                | 914      |
| nupdates           | 337900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1689500  |
| value_loss         | 9.59e-07 |
---------------------------------
---------------------------------
| explained_variance | -2.03    |
| fps                | 914      |
| nupdates           | 338000   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -1.2     |
| fps                | 913      |
| nupdates           | 340700   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1703500  |
| value_loss         | 9.43e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.177   |
| fps                | 913      |
| nupdates           | 340800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1704000  |
| value_loss         | 0.000205 |
---------------------------------
---------------------------------
| explained_variance | 0.91     |
| fps                | 913      |
| nupdates           | 340900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1704500  |
| value_loss         | 1.06e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.424    |
| fps                | 913      |
| nupdates           | 341000   |
| policy_entropy     | 1.95     |
| total_timest

---------------------------------
| explained_variance | -1.77    |
| fps                | 914      |
| nupdates           | 343800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1719000  |
| value_loss         | 0.000594 |
---------------------------------
---------------------------------
| explained_variance | -4.12    |
| fps                | 914      |
| nupdates           | 343900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1719500  |
| value_loss         | 0.00196  |
---------------------------------
---------------------------------
| explained_variance | -18.9    |
| fps                | 914      |
| nupdates           | 344000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1720000  |
| value_loss         | 0.00403  |
---------------------------------
---------------------------------
| explained_variance | -40.5    |
| fps                | 914      |
| nupdates           | 344100   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -0.151   |
| fps                | 913      |
| nupdates           | 346800   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1734000  |
| value_loss         | 4.21e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.867   |
| fps                | 913      |
| nupdates           | 346900   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1734500  |
| value_loss         | 0.00133  |
---------------------------------
---------------------------------
| explained_variance | 0.845    |
| fps                | 914      |
| nupdates           | 347000   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1735000  |
| value_loss         | 0.000105 |
---------------------------------
---------------------------------
| explained_variance | 0.706    |
| fps                | 914      |
| nupdates           | 347100   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -2.78    |
| fps                | 915      |
| nupdates           | 349900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1749500  |
| value_loss         | 0.00168  |
---------------------------------
Eval num_timesteps=1750000, episode_reward=-4.80 +/- 0.40
Episode length: 542.90 +/- 37.28
---------------------------------
| explained_variance | 0.131    |
| fps                | 913      |
| nupdates           | 350000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1750000  |
| value_loss         | 0.000171 |
---------------------------------
---------------------------------
| explained_variance | -0.103   |
| fps                | 913      |
| nupdates           | 350100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1750500  |
| value_loss         | 0.000443 |
---------------------------------
---------------------------------
| explained_variance | 0.203    |
| fps                | 91

---------------------------------
| explained_variance | -1.51    |
| fps                | 914      |
| nupdates           | 352900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1764500  |
| value_loss         | 0.000226 |
---------------------------------
---------------------------------
| explained_variance | -0.0181  |
| fps                | 914      |
| nupdates           | 353000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1765000  |
| value_loss         | 0.16     |
---------------------------------
---------------------------------
| explained_variance | 0.0372   |
| fps                | 914      |
| nupdates           | 353100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1765500  |
| value_loss         | 0.000257 |
---------------------------------
---------------------------------
| explained_variance | -58.9    |
| fps                | 914      |
| nupdates           | 353200   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.133   |
| fps                | 914      |
| nupdates           | 355900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1779500  |
| value_loss         | 1.42e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.751    |
| fps                | 914      |
| nupdates           | 356000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1780000  |
| value_loss         | 4.72e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.644    |
| fps                | 914      |
| nupdates           | 356100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1780500  |
| value_loss         | 8.18e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.583   |
| fps                | 914      |
| nupdates           | 356200   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -9.84    |
| fps                | 915      |
| nupdates           | 359000   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1795000  |
| value_loss         | 0.000116 |
---------------------------------
---------------------------------
| explained_variance | 0.666    |
| fps                | 915      |
| nupdates           | 359100   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1795500  |
| value_loss         | 5.52e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.0564   |
| fps                | 915      |
| nupdates           | 359200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1796000  |
| value_loss         | 0.000318 |
---------------------------------
---------------------------------
| explained_variance | -8.03    |
| fps                | 915      |
| nupdates           | 359300   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.318    |
| fps                | 915      |
| nupdates           | 362000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1810000  |
| value_loss         | 0.00011  |
---------------------------------
---------------------------------
| explained_variance | 0.991    |
| fps                | 915      |
| nupdates           | 362100   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1810500  |
| value_loss         | 0.000584 |
---------------------------------
---------------------------------
| explained_variance | -0.503   |
| fps                | 915      |
| nupdates           | 362200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1811000  |
| value_loss         | 0.00013  |
---------------------------------
---------------------------------
| explained_variance | 0.472    |
| fps                | 915      |
| nupdates           | 362300   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -33.4    |
| fps                | 913      |
| nupdates           | 365100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1825500  |
| value_loss         | 0.000687 |
---------------------------------
---------------------------------
| explained_variance | -1.56    |
| fps                | 913      |
| nupdates           | 365200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1826000  |
| value_loss         | 0.000147 |
---------------------------------
---------------------------------
| explained_variance | -1.69    |
| fps                | 913      |
| nupdates           | 365300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1826500  |
| value_loss         | 0.000259 |
---------------------------------
---------------------------------
| explained_variance | 0.257    |
| fps                | 914      |
| nupdates           | 365400   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.232   |
| fps                | 915      |
| nupdates           | 368200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1841000  |
| value_loss         | 3.07e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.622    |
| fps                | 915      |
| nupdates           | 368300   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1841500  |
| value_loss         | 0.000532 |
---------------------------------
---------------------------------
| explained_variance | 0.645    |
| fps                | 915      |
| nupdates           | 368400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1842000  |
| value_loss         | 0.000214 |
---------------------------------
---------------------------------
| explained_variance | 0.00337  |
| fps                | 914      |
| nupdates           | 368500   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.941    |
| fps                | 913      |
| nupdates           | 371200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1856000  |
| value_loss         | 2.56e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.307    |
| fps                | 913      |
| nupdates           | 371300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1856500  |
| value_loss         | 0.000206 |
---------------------------------
---------------------------------
| explained_variance | -1.82    |
| fps                | 913      |
| nupdates           | 371400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1857000  |
| value_loss         | 0.000769 |
---------------------------------
---------------------------------
| explained_variance | 0.883    |
| fps                | 913      |
| nupdates           | 371500   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.37     |
| fps                | 914      |
| nupdates           | 374300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1871500  |
| value_loss         | 0.147    |
---------------------------------
---------------------------------
| explained_variance | 0.937    |
| fps                | 914      |
| nupdates           | 374400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1872000  |
| value_loss         | 8.36e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.559    |
| fps                | 914      |
| nupdates           | 374500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1872500  |
| value_loss         | 0.000176 |
---------------------------------
---------------------------------
| explained_variance | 0.903    |
| fps                | 914      |
| nupdates           | 374600   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.727   |
| fps                | 913      |
| nupdates           | 377300   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1886500  |
| value_loss         | 6.18e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.928    |
| fps                | 913      |
| nupdates           | 377400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1887000  |
| value_loss         | 9.27e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.991    |
| fps                | 913      |
| nupdates           | 377500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1887500  |
| value_loss         | 2.57e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.563    |
| fps                | 913      |
| nupdates           | 377600   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.667    |
| fps                | 913      |
| nupdates           | 380300   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1901500  |
| value_loss         | 5.31e-05 |
---------------------------------
---------------------------------
| explained_variance | -4.65    |
| fps                | 913      |
| nupdates           | 380400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1902000  |
| value_loss         | 0.00269  |
---------------------------------
---------------------------------
| explained_variance | -0.317   |
| fps                | 913      |
| nupdates           | 380500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1902500  |
| value_loss         | 6.14e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.944    |
| fps                | 913      |
| nupdates           | 380600   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.64     |
| fps                | 914      |
| nupdates           | 383400   |
| policy_entropy     | 2.02     |
| total_timesteps    | 1917000  |
| value_loss         | 9.3e-05  |
---------------------------------
---------------------------------
| explained_variance | -1.28    |
| fps                | 914      |
| nupdates           | 383500   |
| policy_entropy     | 1.98     |
| total_timesteps    | 1917500  |
| value_loss         | 0.000392 |
---------------------------------
---------------------------------
| explained_variance | -1.35    |
| fps                | 914      |
| nupdates           | 383600   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1918000  |
| value_loss         | 0.000157 |
---------------------------------
---------------------------------
| explained_variance | -2.2     |
| fps                | 914      |
| nupdates           | 383700   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.838    |
| fps                | 913      |
| nupdates           | 386400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1932000  |
| value_loss         | 2.44e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.701    |
| fps                | 913      |
| nupdates           | 386500   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1932500  |
| value_loss         | 3.99e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.643    |
| fps                | 913      |
| nupdates           | 386600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1933000  |
| value_loss         | 0.000564 |
---------------------------------
---------------------------------
| explained_variance | 0.998    |
| fps                | 913      |
| nupdates           | 386700   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -7.22    |
| fps                | 914      |
| nupdates           | 389500   |
| policy_entropy     | 2.03     |
| total_timesteps    | 1947500  |
| value_loss         | 0.00329  |
---------------------------------
---------------------------------
| explained_variance | -0.214   |
| fps                | 914      |
| nupdates           | 389600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1948000  |
| value_loss         | 0.000191 |
---------------------------------
---------------------------------
| explained_variance | -1.63    |
| fps                | 914      |
| nupdates           | 389700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1948500  |
| value_loss         | 0.00337  |
---------------------------------
---------------------------------
| explained_variance | -4.39    |
| fps                | 914      |
| nupdates           | 389800   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.955    |
| fps                | 913      |
| nupdates           | 392500   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1962500  |
| value_loss         | 3.66e-05 |
---------------------------------
----------------------------------
| explained_variance | -7.49e+03 |
| fps                | 913       |
| nupdates           | 392600    |
| policy_entropy     | 2.05      |
| total_timesteps    | 1963000   |
| value_loss         | 0.136     |
----------------------------------
---------------------------------
| explained_variance | 0.951    |
| fps                | 913      |
| nupdates           | 392700   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1963500  |
| value_loss         | 0.000103 |
---------------------------------
---------------------------------
| explained_variance | -0.746   |
| fps                | 914      |
| nupdates           | 392800   |
| policy_entropy     | 2.06     |
| tota

---------------------------------
| explained_variance | 0.902    |
| fps                | 912      |
| nupdates           | 395500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1977500  |
| value_loss         | 9.96e-05 |
---------------------------------
---------------------------------
| explained_variance | -13.5    |
| fps                | 912      |
| nupdates           | 395600   |
| policy_entropy     | 1.98     |
| total_timesteps    | 1978000  |
| value_loss         | 0.00471  |
---------------------------------
---------------------------------
| explained_variance | -17.2    |
| fps                | 912      |
| nupdates           | 395700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1978500  |
| value_loss         | 0.00415  |
---------------------------------
---------------------------------
| explained_variance | 0.996    |
| fps                | 912      |
| nupdates           | 395800   |
| policy_entropy     | 1.97     |
| total_timest

---------------------------------
| explained_variance | 0.999    |
| fps                | 913      |
| nupdates           | 398600   |
| policy_entropy     | 1.97     |
| total_timesteps    | 1993000  |
| value_loss         | 3.85e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.132    |
| fps                | 913      |
| nupdates           | 398700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1993500  |
| value_loss         | 6.82e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.321   |
| fps                | 913      |
| nupdates           | 398800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1994000  |
| value_loss         | 0.000132 |
---------------------------------
---------------------------------
| explained_variance | 0.877    |
| fps                | 913      |
| nupdates           | 398900   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.912    |
| fps                | 912      |
| nupdates           | 401600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2008000  |
| value_loss         | 2.99e-06 |
---------------------------------
---------------------------------
| explained_variance | -0.611   |
| fps                | 912      |
| nupdates           | 401700   |
| policy_entropy     | 2.02     |
| total_timesteps    | 2008500  |
| value_loss         | 0.00093  |
---------------------------------
---------------------------------
| explained_variance | 0.593    |
| fps                | 912      |
| nupdates           | 401800   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2009000  |
| value_loss         | 2.96e-05 |
---------------------------------
---------------------------------
| explained_variance | -3.78    |
| fps                | 912      |
| nupdates           | 401900   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.043    |
| fps                | 913      |
| nupdates           | 404700   |
| policy_entropy     | 2.02     |
| total_timesteps    | 2023500  |
| value_loss         | 0.00152  |
---------------------------------
---------------------------------
| explained_variance | 0.0236   |
| fps                | 913      |
| nupdates           | 404800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2024000  |
| value_loss         | 1.01e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.0964   |
| fps                | 913      |
| nupdates           | 404900   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2024500  |
| value_loss         | 8.21e-05 |
---------------------------------
Eval num_timesteps=2025000, episode_reward=-4.90 +/- 0.30
Episode length: 627.10 +/- 154.50
---------------------------------
| explained_variance | -0.254   |
| fps                | 9

---------------------------------
| explained_variance | -1.09    |
| fps                | 911      |
| nupdates           | 407700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2038500  |
| value_loss         | 4.06e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.475    |
| fps                | 911      |
| nupdates           | 407800   |
| policy_entropy     | 2        |
| total_timesteps    | 2039000  |
| value_loss         | 0.000116 |
---------------------------------
---------------------------------
| explained_variance | 0.279    |
| fps                | 911      |
| nupdates           | 407900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2039500  |
| value_loss         | 0.000357 |
---------------------------------
---------------------------------
| explained_variance | -1.06    |
| fps                | 911      |
| nupdates           | 408000   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.83     |
| fps                | 909      |
| nupdates           | 410700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2053500  |
| value_loss         | 0.00023  |
---------------------------------
---------------------------------
| explained_variance | -0.715   |
| fps                | 909      |
| nupdates           | 410800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2054000  |
| value_loss         | 0.000374 |
---------------------------------
---------------------------------
| explained_variance | -6.97    |
| fps                | 909      |
| nupdates           | 410900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2054500  |
| value_loss         | 0.000625 |
---------------------------------
---------------------------------
| explained_variance | -892     |
| fps                | 909      |
| nupdates           | 411000   |
| policy_entropy     | 1.89     |
| total_timest

---------------------------------
| explained_variance | 0.236    |
| fps                | 909      |
| nupdates           | 413800   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2069000  |
| value_loss         | 8.19e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.993    |
| fps                | 909      |
| nupdates           | 413900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2069500  |
| value_loss         | 2.29e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.868    |
| fps                | 909      |
| nupdates           | 414000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2070000  |
| value_loss         | 9.19e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.0195  |
| fps                | 909      |
| nupdates           | 414100   |
| policy_entropy     | 1.93     |
| total_timest

---------------------------------
| explained_variance | -22.1    |
| fps                | 907      |
| nupdates           | 416800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2084000  |
| value_loss         | 0.000611 |
---------------------------------
---------------------------------
| explained_variance | -0.409   |
| fps                | 907      |
| nupdates           | 416900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2084500  |
| value_loss         | 0.000238 |
---------------------------------
---------------------------------
| explained_variance | 0.661    |
| fps                | 907      |
| nupdates           | 417000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2085000  |
| value_loss         | 3.6e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.862    |
| fps                | 907      |
| nupdates           | 417100   |
| policy_entropy     | 1.96     |
| total_timest

---------------------------------
| explained_variance | 0.654    |
| fps                | 907      |
| nupdates           | 419900   |
| policy_entropy     | 2.03     |
| total_timesteps    | 2099500  |
| value_loss         | 2.09e-05 |
---------------------------------
Eval num_timesteps=2100000, episode_reward=-4.80 +/- 0.40
Episode length: 629.90 +/- 98.77
---------------------------------
| explained_variance | 0.627    |
| fps                | 906      |
| nupdates           | 420000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2100000  |
| value_loss         | 3.68e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.92    |
| fps                | 906      |
| nupdates           | 420100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2100500  |
| value_loss         | 2.77e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.15    |
| fps                | 90

---------------------------------
| explained_variance | -2.42    |
| fps                | 906      |
| nupdates           | 422900   |
| policy_entropy     | 2.04     |
| total_timesteps    | 2114500  |
| value_loss         | 0.000398 |
---------------------------------
---------------------------------
| explained_variance | -3.85    |
| fps                | 906      |
| nupdates           | 423000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2115000  |
| value_loss         | 0.000779 |
---------------------------------
---------------------------------
| explained_variance | 0.452    |
| fps                | 905      |
| nupdates           | 423100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2115500  |
| value_loss         | 0.000248 |
---------------------------------
---------------------------------
| explained_variance | -0.593   |
| fps                | 905      |
| nupdates           | 423200   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.312    |
| fps                | 903      |
| nupdates           | 425900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2129500  |
| value_loss         | 0.000116 |
---------------------------------
---------------------------------
| explained_variance | 0.881    |
| fps                | 903      |
| nupdates           | 426000   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2130000  |
| value_loss         | 9.04e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.021   |
| fps                | 903      |
| nupdates           | 426100   |
| policy_entropy     | 1.8      |
| total_timesteps    | 2130500  |
| value_loss         | 0.403    |
---------------------------------
---------------------------------
| explained_variance | 0.612    |
| fps                | 903      |
| nupdates           | 426200   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.662    |
| fps                | 903      |
| nupdates           | 429000   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2145000  |
| value_loss         | 2.88e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.983    |
| fps                | 903      |
| nupdates           | 429100   |
| policy_entropy     | 2.04     |
| total_timesteps    | 2145500  |
| value_loss         | 2.25e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.377    |
| fps                | 903      |
| nupdates           | 429200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2146000  |
| value_loss         | 3.32e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.983    |
| fps                | 903      |
| nupdates           | 429300   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -6.62    |
| fps                | 902      |
| nupdates           | 432000   |
| policy_entropy     | 2.03     |
| total_timesteps    | 2160000  |
| value_loss         | 0.000327 |
---------------------------------
---------------------------------
| explained_variance | -3.41    |
| fps                | 902      |
| nupdates           | 432100   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2160500  |
| value_loss         | 0.00113  |
---------------------------------
---------------------------------
| explained_variance | -2.78    |
| fps                | 902      |
| nupdates           | 432200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2161000  |
| value_loss         | 0.00023  |
---------------------------------
---------------------------------
| explained_variance | 0.667    |
| fps                | 902      |
| nupdates           | 432300   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.736    |
| fps                | 900      |
| nupdates           | 435100   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2175500  |
| value_loss         | 6.76e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.795    |
| fps                | 900      |
| nupdates           | 435200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2176000  |
| value_loss         | 4.8e-05  |
---------------------------------
---------------------------------
| explained_variance | -0.295   |
| fps                | 900      |
| nupdates           | 435300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2176500  |
| value_loss         | 0.000432 |
---------------------------------
---------------------------------
| explained_variance | -0.00521 |
| fps                | 900      |
| nupdates           | 435400   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.706    |
| fps                | 900      |
| nupdates           | 438200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2191000  |
| value_loss         | 6.01e-06 |
---------------------------------
---------------------------------
| explained_variance | -5.61    |
| fps                | 900      |
| nupdates           | 438300   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2191500  |
| value_loss         | 0.000236 |
---------------------------------
---------------------------------
| explained_variance | 0.966    |
| fps                | 900      |
| nupdates           | 438400   |
| policy_entropy     | 2.03     |
| total_timesteps    | 2192000  |
| value_loss         | 1.09e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.95    |
| fps                | 900      |
| nupdates           | 438500   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -4.34    |
| fps                | 899      |
| nupdates           | 441200   |
| policy_entropy     | 2.04     |
| total_timesteps    | 2206000  |
| value_loss         | 0.000107 |
---------------------------------
---------------------------------
| explained_variance | 0.466    |
| fps                | 899      |
| nupdates           | 441300   |
| policy_entropy     | 2.04     |
| total_timesteps    | 2206500  |
| value_loss         | 4.95e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.239   |
| fps                | 899      |
| nupdates           | 441400   |
| policy_entropy     | 2.04     |
| total_timesteps    | 2207000  |
| value_loss         | 0.000226 |
---------------------------------
---------------------------------
| explained_variance | 0.629    |
| fps                | 899      |
| nupdates           | 441500   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.677    |
| fps                | 899      |
| nupdates           | 444300   |
| policy_entropy     | 2.02     |
| total_timesteps    | 2221500  |
| value_loss         | 6.95e-05 |
---------------------------------
---------------------------------
| explained_variance | -3.02    |
| fps                | 899      |
| nupdates           | 444400   |
| policy_entropy     | 2.03     |
| total_timesteps    | 2222000  |
| value_loss         | 0.00195  |
---------------------------------
---------------------------------
| explained_variance | 0.618    |
| fps                | 899      |
| nupdates           | 444500   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2222500  |
| value_loss         | 0.000161 |
---------------------------------
---------------------------------
| explained_variance | 0.671    |
| fps                | 899      |
| nupdates           | 444600   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.63     |
| fps                | 897      |
| nupdates           | 447300   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2236500  |
| value_loss         | 8.04e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.572    |
| fps                | 897      |
| nupdates           | 447400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2237000  |
| value_loss         | 0.000108 |
---------------------------------
---------------------------------
| explained_variance | 0.589    |
| fps                | 897      |
| nupdates           | 447500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2237500  |
| value_loss         | 0.000222 |
---------------------------------
---------------------------------
| explained_variance | -1.41    |
| fps                | 897      |
| nupdates           | 447600   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -11.3    |
| fps                | 895      |
| nupdates           | 450300   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2251500  |
| value_loss         | 0.00259  |
---------------------------------
---------------------------------
| explained_variance | 0.943    |
| fps                | 895      |
| nupdates           | 450400   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2252000  |
| value_loss         | 5.85e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.0768   |
| fps                | 895      |
| nupdates           | 450500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2252500  |
| value_loss         | 5.96e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.173   |
| fps                | 895      |
| nupdates           | 450600   |
| policy_entropy     | 1.95     |
| total_timest

---------------------------------
| explained_variance | 0.298    |
| fps                | 895      |
| nupdates           | 453400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2267000  |
| value_loss         | 1.87e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.855    |
| fps                | 895      |
| nupdates           | 453500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2267500  |
| value_loss         | 1.76e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.14    |
| fps                | 895      |
| nupdates           | 453600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2268000  |
| value_loss         | 0.000435 |
---------------------------------
---------------------------------
| explained_variance | 0.678    |
| fps                | 895      |
| nupdates           | 453700   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.807    |
| fps                | 894      |
| nupdates           | 456400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2282000  |
| value_loss         | 0.000116 |
---------------------------------
---------------------------------
| explained_variance | -1       |
| fps                | 894      |
| nupdates           | 456500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2282500  |
| value_loss         | 0.000586 |
---------------------------------
---------------------------------
| explained_variance | -0.157   |
| fps                | 894      |
| nupdates           | 456600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2283000  |
| value_loss         | 0.000199 |
---------------------------------
---------------------------------
| explained_variance | -30.7    |
| fps                | 894      |
| nupdates           | 456700   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.569    |
| fps                | 894      |
| nupdates           | 459500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2297500  |
| value_loss         | 6.43e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.898    |
| fps                | 894      |
| nupdates           | 459600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2298000  |
| value_loss         | 8.46e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.343    |
| fps                | 894      |
| nupdates           | 459700   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2298500  |
| value_loss         | 0.000168 |
---------------------------------
---------------------------------
| explained_variance | 0.269    |
| fps                | 894      |
| nupdates           | 459800   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.862    |
| fps                | 893      |
| nupdates           | 462500   |
| policy_entropy     | 2        |
| total_timesteps    | 2312500  |
| value_loss         | 3.89e-05 |
---------------------------------
---------------------------------
| explained_variance | -28.4    |
| fps                | 893      |
| nupdates           | 462600   |
| policy_entropy     | 2        |
| total_timesteps    | 2313000  |
| value_loss         | 0.00129  |
---------------------------------
---------------------------------
| explained_variance | -10.9    |
| fps                | 893      |
| nupdates           | 462700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2313500  |
| value_loss         | 0.0033   |
---------------------------------
---------------------------------
| explained_variance | 0.615    |
| fps                | 893      |
| nupdates           | 462800   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.267   |
| fps                | 892      |
| nupdates           | 465500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2327500  |
| value_loss         | 0.00012  |
---------------------------------
---------------------------------
| explained_variance | -8.96    |
| fps                | 892      |
| nupdates           | 465600   |
| policy_entropy     | 1.92     |
| total_timesteps    | 2328000  |
| value_loss         | 0.00762  |
---------------------------------
---------------------------------
| explained_variance | -7.64    |
| fps                | 892      |
| nupdates           | 465700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2328500  |
| value_loss         | 0.0042   |
---------------------------------
---------------------------------
| explained_variance | -0.28    |
| fps                | 892      |
| nupdates           | 465800   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -0.0165  |
| fps                | 892      |
| nupdates           | 468600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2343000  |
| value_loss         | 0.000153 |
---------------------------------
---------------------------------
| explained_variance | -2.3     |
| fps                | 892      |
| nupdates           | 468700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2343500  |
| value_loss         | 0.000141 |
---------------------------------
---------------------------------
| explained_variance | 0.866    |
| fps                | 892      |
| nupdates           | 468800   |
| policy_entropy     | 2.04     |
| total_timesteps    | 2344000  |
| value_loss         | 2.8e-05  |
---------------------------------
---------------------------------
| explained_variance | -3.19    |
| fps                | 892      |
| nupdates           | 468900   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.926    |
| fps                | 890      |
| nupdates           | 471600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2358000  |
| value_loss         | 6.07e-05 |
---------------------------------
---------------------------------
| explained_variance | -15.5    |
| fps                | 890      |
| nupdates           | 471700   |
| policy_entropy     | 2.02     |
| total_timesteps    | 2358500  |
| value_loss         | 0.00489  |
---------------------------------
---------------------------------
| explained_variance | -0.137   |
| fps                | 890      |
| nupdates           | 471800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2359000  |
| value_loss         | 0.000327 |
---------------------------------
---------------------------------
| explained_variance | -0.122   |
| fps                | 890      |
| nupdates           | 471900   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -7.58    |
| fps                | 890      |
| nupdates           | 474700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2373500  |
| value_loss         | 0.00191  |
---------------------------------
---------------------------------
| explained_variance | -3.63    |
| fps                | 890      |
| nupdates           | 474800   |
| policy_entropy     | 2.03     |
| total_timesteps    | 2374000  |
| value_loss         | 0.00484  |
---------------------------------
---------------------------------
| explained_variance | -2.19    |
| fps                | 890      |
| nupdates           | 474900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2374500  |
| value_loss         | 0.000453 |
---------------------------------
Eval num_timesteps=2375000, episode_reward=-4.80 +/- 0.40
Episode length: 660.70 +/- 151.90
---------------------------------
| explained_variance | -2.83    |
| fps                | 8

---------------------------------
| explained_variance | -5.4     |
| fps                | 889      |
| nupdates           | 477700   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2388500  |
| value_loss         | 0.000327 |
---------------------------------
---------------------------------
| explained_variance | 0.993    |
| fps                | 889      |
| nupdates           | 477800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2389000  |
| value_loss         | 9.97e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.609    |
| fps                | 889      |
| nupdates           | 477900   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2389500  |
| value_loss         | 2e-05    |
---------------------------------
---------------------------------
| explained_variance | 0.178    |
| fps                | 889      |
| nupdates           | 478000   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.837    |
| fps                | 888      |
| nupdates           | 480700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2403500  |
| value_loss         | 2.13e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.501    |
| fps                | 888      |
| nupdates           | 480800   |
| policy_entropy     | 2.04     |
| total_timesteps    | 2404000  |
| value_loss         | 0.00068  |
---------------------------------
---------------------------------
| explained_variance | 0.627    |
| fps                | 888      |
| nupdates           | 480900   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2404500  |
| value_loss         | 0.000129 |
---------------------------------
---------------------------------
| explained_variance | 0.499    |
| fps                | 888      |
| nupdates           | 481000   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -1.12    |
| fps                | 888      |
| nupdates           | 483800   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2419000  |
| value_loss         | 0.000541 |
---------------------------------
---------------------------------
| explained_variance | -0.837   |
| fps                | 888      |
| nupdates           | 483900   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2419500  |
| value_loss         | 0.000146 |
---------------------------------
---------------------------------
| explained_variance | 0.813    |
| fps                | 888      |
| nupdates           | 484000   |
| policy_entropy     | 2.02     |
| total_timesteps    | 2420000  |
| value_loss         | 2.12e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.53    |
| fps                | 888      |
| nupdates           | 484100   |
| policy_entropy     | 1.98     |
| total_timest

---------------------------------
| explained_variance | 0.986    |
| fps                | 887      |
| nupdates           | 486800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2434000  |
| value_loss         | 2.04e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.956    |
| fps                | 887      |
| nupdates           | 486900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2434500  |
| value_loss         | 7.7e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.356    |
| fps                | 887      |
| nupdates           | 487000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2435000  |
| value_loss         | 0.000375 |
---------------------------------
---------------------------------
| explained_variance | 0.947    |
| fps                | 887      |
| nupdates           | 487100   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.581   |
| fps                | 887      |
| nupdates           | 489900   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2449500  |
| value_loss         | 0.000291 |
---------------------------------
Eval num_timesteps=2450000, episode_reward=-4.40 +/- 1.20
Episode length: 634.00 +/- 167.89
New best mean reward!
---------------------------------
| explained_variance | 0.845    |
| fps                | 886      |
| nupdates           | 490000   |
| policy_entropy     | 2.03     |
| total_timesteps    | 2450000  |
| value_loss         | 5.93e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.809    |
| fps                | 886      |
| nupdates           | 490100   |
| policy_entropy     | 1.99     |
| total_timesteps    | 2450500  |
| value_loss         | 0.0444   |
---------------------------------
---------------------------------
| explained_variance | 0.885    |
| 

---------------------------------
| explained_variance | -8.54    |
| fps                | 885      |
| nupdates           | 492900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2464500  |
| value_loss         | 0.000459 |
---------------------------------
---------------------------------
| explained_variance | -9.5e+03 |
| fps                | 886      |
| nupdates           | 493000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2465000  |
| value_loss         | 0.303    |
---------------------------------
---------------------------------
| explained_variance | 0.84     |
| fps                | 886      |
| nupdates           | 493100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2465500  |
| value_loss         | 0.00019  |
---------------------------------
---------------------------------
| explained_variance | 0.0756   |
| fps                | 886      |
| nupdates           | 493200   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -477     |
| fps                | 884      |
| nupdates           | 495900   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2479500  |
| value_loss         | 0.0119   |
---------------------------------
---------------------------------
| explained_variance | -48.2    |
| fps                | 884      |
| nupdates           | 496000   |
| policy_entropy     | 2.03     |
| total_timesteps    | 2480000  |
| value_loss         | 0.00404  |
---------------------------------
---------------------------------
| explained_variance | -0.646   |
| fps                | 884      |
| nupdates           | 496100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2480500  |
| value_loss         | 0.000215 |
---------------------------------
---------------------------------
| explained_variance | -0.155   |
| fps                | 884      |
| nupdates           | 496200   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.77     |
| fps                | 884      |
| nupdates           | 499000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2495000  |
| value_loss         | 2.45e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.532   |
| fps                | 884      |
| nupdates           | 499100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2495500  |
| value_loss         | 7.01e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.827    |
| fps                | 884      |
| nupdates           | 499200   |
| policy_entropy     | 1.99     |
| total_timesteps    | 2496000  |
| value_loss         | 0.000253 |
---------------------------------
---------------------------------
| explained_variance | 0.291    |
| fps                | 884      |
| nupdates           | 499300   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.994    |
| fps                | 883      |
| nupdates           | 502000   |
| policy_entropy     | 2.02     |
| total_timesteps    | 2510000  |
| value_loss         | 3.55e-05 |
---------------------------------
---------------------------------
| explained_variance | -24.1    |
| fps                | 883      |
| nupdates           | 502100   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2510500  |
| value_loss         | 0.00023  |
---------------------------------
---------------------------------
| explained_variance | 0.905    |
| fps                | 883      |
| nupdates           | 502200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2511000  |
| value_loss         | 1.03e-05 |
---------------------------------
---------------------------------
| explained_variance | -3.9     |
| fps                | 883      |
| nupdates           | 502300   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.559    |
| fps                | 881      |
| nupdates           | 505100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2525500  |
| value_loss         | 0.000207 |
---------------------------------
---------------------------------
| explained_variance | -30.5    |
| fps                | 881      |
| nupdates           | 505200   |
| policy_entropy     | 2.03     |
| total_timesteps    | 2526000  |
| value_loss         | 0.00336  |
---------------------------------
---------------------------------
| explained_variance | 0.966    |
| fps                | 881      |
| nupdates           | 505300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2526500  |
| value_loss         | 7.99e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.72     |
| fps                | 881      |
| nupdates           | 505400   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -14.5    |
| fps                | 882      |
| nupdates           | 508200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2541000  |
| value_loss         | 0.00177  |
---------------------------------
---------------------------------
| explained_variance | 0.966    |
| fps                | 882      |
| nupdates           | 508300   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2541500  |
| value_loss         | 3.38e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.29    |
| fps                | 882      |
| nupdates           | 508400   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2542000  |
| value_loss         | 0.000378 |
---------------------------------
---------------------------------
| explained_variance | 0.572    |
| fps                | 882      |
| nupdates           | 508500   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -285     |
| fps                | 881      |
| nupdates           | 511200   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2556000  |
| value_loss         | 0.000192 |
---------------------------------
---------------------------------
| explained_variance | 0.98     |
| fps                | 881      |
| nupdates           | 511300   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2556500  |
| value_loss         | 9.67e-06 |
---------------------------------
---------------------------------
| explained_variance | -24.9    |
| fps                | 881      |
| nupdates           | 511400   |
| policy_entropy     | 1.98     |
| total_timesteps    | 2557000  |
| value_loss         | 0.0036   |
---------------------------------
---------------------------------
| explained_variance | -20.8    |
| fps                | 881      |
| nupdates           | 511500   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.393    |
| fps                | 881      |
| nupdates           | 514300   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2571500  |
| value_loss         | 0.000243 |
---------------------------------
---------------------------------
| explained_variance | 0.877    |
| fps                | 881      |
| nupdates           | 514400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2572000  |
| value_loss         | 2.01e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.477   |
| fps                | 881      |
| nupdates           | 514500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2572500  |
| value_loss         | 0.000165 |
---------------------------------
---------------------------------
| explained_variance | 0.68     |
| fps                | 881      |
| nupdates           | 514600   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -0.882   |
| fps                | 879      |
| nupdates           | 517300   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2586500  |
| value_loss         | 9.47e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.873    |
| fps                | 879      |
| nupdates           | 517400   |
| policy_entropy     | 1.94     |
| total_timesteps    | 2587000  |
| value_loss         | 5.54e-05 |
---------------------------------
---------------------------------
| explained_variance | -105     |
| fps                | 879      |
| nupdates           | 517500   |
| policy_entropy     | 2.03     |
| total_timesteps    | 2587500  |
| value_loss         | 0.00573  |
---------------------------------
---------------------------------
| explained_variance | 0.269    |
| fps                | 879      |
| nupdates           | 517600   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.512   |
| fps                | 878      |
| nupdates           | 520300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2601500  |
| value_loss         | 0.000196 |
---------------------------------
---------------------------------
| explained_variance | 0.81     |
| fps                | 878      |
| nupdates           | 520400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2602000  |
| value_loss         | 5.17e-06 |
---------------------------------
---------------------------------
| explained_variance | -1.57    |
| fps                | 878      |
| nupdates           | 520500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2602500  |
| value_loss         | 0.000317 |
---------------------------------
---------------------------------
| explained_variance | -31.4    |
| fps                | 878      |
| nupdates           | 520600   |
| policy_entropy     | 1.9      |
| total_timest

---------------------------------
| explained_variance | -1.34    |
| fps                | 878      |
| nupdates           | 523400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2617000  |
| value_loss         | 0.000101 |
---------------------------------
---------------------------------
| explained_variance | 0.923    |
| fps                | 878      |
| nupdates           | 523500   |
| policy_entropy     | 2.03     |
| total_timesteps    | 2617500  |
| value_loss         | 4.67e-05 |
---------------------------------
---------------------------------
| explained_variance | -13.2    |
| fps                | 878      |
| nupdates           | 523600   |
| policy_entropy     | 2.03     |
| total_timesteps    | 2618000  |
| value_loss         | 0.00418  |
---------------------------------
---------------------------------
| explained_variance | 0.56     |
| fps                | 878      |
| nupdates           | 523700   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -0.44    |
| fps                | 877      |
| nupdates           | 526400   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2632000  |
| value_loss         | 2.16e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.967    |
| fps                | 877      |
| nupdates           | 526500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2632500  |
| value_loss         | 5.31e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.52     |
| fps                | 877      |
| nupdates           | 526600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2633000  |
| value_loss         | 4.34e-05 |
---------------------------------
---------------------------------
| explained_variance | -10.5    |
| fps                | 877      |
| nupdates           | 526700   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -0.214   |
| fps                | 877      |
| nupdates           | 529500   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2647500  |
| value_loss         | 0.000103 |
---------------------------------
---------------------------------
| explained_variance | -0.175   |
| fps                | 877      |
| nupdates           | 529600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2648000  |
| value_loss         | 0.000302 |
---------------------------------
----------------------------------
| explained_variance | -4.01e+03 |
| fps                | 877       |
| nupdates           | 529700    |
| policy_entropy     | 2.07      |
| total_timesteps    | 2648500   |
| value_loss         | 0.167     |
----------------------------------
---------------------------------
| explained_variance | 0.0216   |
| fps                | 877      |
| nupdates           | 529800   |
| policy_entropy     | 2.08     |
| tota

---------------------------------
| explained_variance | 0.754    |
| fps                | 876      |
| nupdates           | 532500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2662500  |
| value_loss         | 0.000106 |
---------------------------------
---------------------------------
| explained_variance | 0.939    |
| fps                | 876      |
| nupdates           | 532600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2663000  |
| value_loss         | 3.26e-05 |
---------------------------------
----------------------------------
| explained_variance | -8.58e+03 |
| fps                | 876       |
| nupdates           | 532700    |
| policy_entropy     | 2.04      |
| total_timesteps    | 2663500   |
| value_loss         | 0.372     |
----------------------------------
---------------------------------
| explained_variance | 0.494    |
| fps                | 876      |
| nupdates           | 532800   |
| policy_entropy     | 2.07     |
| tota

---------------------------------
| explained_variance | 0.118    |
| fps                | 875      |
| nupdates           | 535500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2677500  |
| value_loss         | 0.000609 |
---------------------------------
---------------------------------
| explained_variance | -0.166   |
| fps                | 875      |
| nupdates           | 535600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2678000  |
| value_loss         | 0.000138 |
---------------------------------
---------------------------------
| explained_variance | 0.952    |
| fps                | 875      |
| nupdates           | 535700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2678500  |
| value_loss         | 5.3e-06  |
---------------------------------
---------------------------------
| explained_variance | -0.733   |
| fps                | 875      |
| nupdates           | 535800   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -0.874   |
| fps                | 875      |
| nupdates           | 538600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2693000  |
| value_loss         | 0.000226 |
---------------------------------
---------------------------------
| explained_variance | 0.051    |
| fps                | 875      |
| nupdates           | 538700   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2693500  |
| value_loss         | 6.72e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.88     |
| fps                | 875      |
| nupdates           | 538800   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2694000  |
| value_loss         | 0.000236 |
---------------------------------
---------------------------------
| explained_variance | -21      |
| fps                | 875      |
| nupdates           | 538900   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.875    |
| fps                | 874      |
| nupdates           | 541600   |
| policy_entropy     | 2.03     |
| total_timesteps    | 2708000  |
| value_loss         | 4.58e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.994    |
| fps                | 874      |
| nupdates           | 541700   |
| policy_entropy     | 2.02     |
| total_timesteps    | 2708500  |
| value_loss         | 4.36e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.995    |
| fps                | 874      |
| nupdates           | 541800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2709000  |
| value_loss         | 2.82e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.277    |
| fps                | 874      |
| nupdates           | 541900   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.888    |
| fps                | 874      |
| nupdates           | 544700   |
| policy_entropy     | 2.04     |
| total_timesteps    | 2723500  |
| value_loss         | 9.16e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.07    |
| fps                | 874      |
| nupdates           | 544800   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2724000  |
| value_loss         | 0.000524 |
---------------------------------
---------------------------------
| explained_variance | 0.797    |
| fps                | 874      |
| nupdates           | 544900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2724500  |
| value_loss         | 0.000121 |
---------------------------------
Eval num_timesteps=2725000, episode_reward=-4.90 +/- 0.30
Episode length: 589.30 +/- 106.80
---------------------------------
| explained_variance | 0.089    |
| fps                | 8

---------------------------------
| explained_variance | 0.679    |
| fps                | 873      |
| nupdates           | 547700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2738500  |
| value_loss         | 7.52e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.929    |
| fps                | 873      |
| nupdates           | 547800   |
| policy_entropy     | 2.02     |
| total_timesteps    | 2739000  |
| value_loss         | 1.19e-05 |
---------------------------------
---------------------------------
| explained_variance | -3.02    |
| fps                | 873      |
| nupdates           | 547900   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2739500  |
| value_loss         | 0.000462 |
---------------------------------
---------------------------------
| explained_variance | 0.909    |
| fps                | 873      |
| nupdates           | 548000   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.63     |
| fps                | 872      |
| nupdates           | 550700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2753500  |
| value_loss         | 0.000266 |
---------------------------------
---------------------------------
| explained_variance | 0.861    |
| fps                | 872      |
| nupdates           | 550800   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2754000  |
| value_loss         | 5.98e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.88     |
| fps                | 872      |
| nupdates           | 550900   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2754500  |
| value_loss         | 5.73e-05 |
---------------------------------
---------------------------------
| explained_variance | -285     |
| fps                | 872      |
| nupdates           | 551000   |
| policy_entropy     | 2.02     |
| total_timest

---------------------------------
| explained_variance | -1.2     |
| fps                | 872      |
| nupdates           | 553800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2769000  |
| value_loss         | 6.86e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.07    |
| fps                | 872      |
| nupdates           | 553900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2769500  |
| value_loss         | 0.000185 |
---------------------------------
---------------------------------
| explained_variance | 0.997    |
| fps                | 872      |
| nupdates           | 554000   |
| policy_entropy     | 1.87     |
| total_timesteps    | 2770000  |
| value_loss         | 0.000402 |
---------------------------------
---------------------------------
| explained_variance | 0.654    |
| fps                | 872      |
| nupdates           | 554100   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.953    |
| fps                | 870      |
| nupdates           | 556800   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2784000  |
| value_loss         | 4.89e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.798    |
| fps                | 870      |
| nupdates           | 556900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2784500  |
| value_loss         | 9.56e-05 |
---------------------------------
---------------------------------
| explained_variance | -3.24    |
| fps                | 870      |
| nupdates           | 557000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2785000  |
| value_loss         | 6.07e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.995    |
| fps                | 870      |
| nupdates           | 557100   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -1.82    |
| fps                | 870      |
| nupdates           | 559900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2799500  |
| value_loss         | 0.000402 |
---------------------------------
Eval num_timesteps=2800000, episode_reward=-4.90 +/- 0.30
Episode length: 689.20 +/- 196.55
---------------------------------
| explained_variance | -10.5    |
| fps                | 869      |
| nupdates           | 560000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2800000  |
| value_loss         | 9.1e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.875    |
| fps                | 869      |
| nupdates           | 560100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2800500  |
| value_loss         | 4.65e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.932    |
| fps                | 8

---------------------------------
| explained_variance | -0.374   |
| fps                | 869      |
| nupdates           | 562900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2814500  |
| value_loss         | 8.53e-05 |
---------------------------------
---------------------------------
| explained_variance | -3.72    |
| fps                | 868      |
| nupdates           | 563000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2815000  |
| value_loss         | 3.88e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.479    |
| fps                | 868      |
| nupdates           | 563100   |
| policy_entropy     | 2.03     |
| total_timesteps    | 2815500  |
| value_loss         | 5.61e-05 |
---------------------------------
---------------------------------
| explained_variance | -205     |
| fps                | 868      |
| nupdates           | 563200   |
| policy_entropy     | 1.94     |
| total_timest

---------------------------------
| explained_variance | 0.278    |
| fps                | 867      |
| nupdates           | 565900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2829500  |
| value_loss         | 1.61e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.218   |
| fps                | 867      |
| nupdates           | 566000   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2830000  |
| value_loss         | 0.000258 |
---------------------------------
---------------------------------
| explained_variance | 0.92     |
| fps                | 867      |
| nupdates           | 566100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2830500  |
| value_loss         | 0.000208 |
---------------------------------
---------------------------------
| explained_variance | -4.96    |
| fps                | 867      |
| nupdates           | 566200   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.827    |
| fps                | 866      |
| nupdates           | 569000   |
| policy_entropy     | 2.04     |
| total_timesteps    | 2845000  |
| value_loss         | 0.000293 |
---------------------------------
---------------------------------
| explained_variance | 0.68     |
| fps                | 866      |
| nupdates           | 569100   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2845500  |
| value_loss         | 9.53e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.805    |
| fps                | 866      |
| nupdates           | 569200   |
| policy_entropy     | 2.03     |
| total_timesteps    | 2846000  |
| value_loss         | 6.34e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.848    |
| fps                | 866      |
| nupdates           | 569300   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -4.22    |
| fps                | 865      |
| nupdates           | 572000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2860000  |
| value_loss         | 0.000225 |
---------------------------------
---------------------------------
| explained_variance | 0.977    |
| fps                | 865      |
| nupdates           | 572100   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2860500  |
| value_loss         | 0.00511  |
---------------------------------
---------------------------------
| explained_variance | -4.67    |
| fps                | 865      |
| nupdates           | 572200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2861000  |
| value_loss         | 0.000564 |
---------------------------------
---------------------------------
| explained_variance | 0.111    |
| fps                | 865      |
| nupdates           | 572300   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.505    |
| fps                | 864      |
| nupdates           | 575100   |
| policy_entropy     | 2.03     |
| total_timesteps    | 2875500  |
| value_loss         | 0.000277 |
---------------------------------
---------------------------------
| explained_variance | -0.065   |
| fps                | 864      |
| nupdates           | 575200   |
| policy_entropy     | 2.03     |
| total_timesteps    | 2876000  |
| value_loss         | 0.000376 |
---------------------------------
---------------------------------
| explained_variance | -0.979   |
| fps                | 864      |
| nupdates           | 575300   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2876500  |
| value_loss         | 0.0019   |
---------------------------------
---------------------------------
| explained_variance | 0.501    |
| fps                | 864      |
| nupdates           | 575400   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.919    |
| fps                | 864      |
| nupdates           | 578200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2891000  |
| value_loss         | 0.000122 |
---------------------------------
---------------------------------
| explained_variance | 0.937    |
| fps                | 864      |
| nupdates           | 578300   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2891500  |
| value_loss         | 7.96e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.599    |
| fps                | 864      |
| nupdates           | 578400   |
| policy_entropy     | 2.03     |
| total_timesteps    | 2892000  |
| value_loss         | 0.000183 |
---------------------------------
---------------------------------
| explained_variance | 0.161    |
| fps                | 864      |
| nupdates           | 578500   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.755    |
| fps                | 863      |
| nupdates           | 581200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2906000  |
| value_loss         | 0.000685 |
---------------------------------
---------------------------------
| explained_variance | -6.3     |
| fps                | 863      |
| nupdates           | 581300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2906500  |
| value_loss         | 0.00145  |
---------------------------------
---------------------------------
| explained_variance | 0.361    |
| fps                | 863      |
| nupdates           | 581400   |
| policy_entropy     | 2.02     |
| total_timesteps    | 2907000  |
| value_loss         | 0.102    |
---------------------------------
---------------------------------
| explained_variance | 0.225    |
| fps                | 863      |
| nupdates           | 581600   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.42    |
| fps                | 863      |
| nupdates           | 584400   |
| policy_entropy     | 2.01     |
| total_timesteps    | 2922000  |
| value_loss         | 0.000123 |
---------------------------------
---------------------------------
| explained_variance | -0.0778  |
| fps                | 863      |
| nupdates           | 584500   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2922500  |
| value_loss         | 0.000393 |
---------------------------------
---------------------------------
| explained_variance | 0.659    |
| fps                | 863      |
| nupdates           | 584600   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2923000  |
| value_loss         | 4.74e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.883    |
| fps                | 863      |
| nupdates           | 584700   |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | 0.886    |
| fps                | 861      |
| nupdates           | 587400   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2937000  |
| value_loss         | 9.2e-06  |
---------------------------------
---------------------------------
| explained_variance | -3.49    |
| fps                | 861      |
| nupdates           | 587500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2937500  |
| value_loss         | 6.45e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.856    |
| fps                | 861      |
| nupdates           | 587600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2938000  |
| value_loss         | 1.17e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.211    |
| fps                | 861      |
| nupdates           | 587700   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -2.54    |
| fps                | 860      |
| nupdates           | 590400   |
| policy_entropy     | 2.03     |
| total_timesteps    | 2952000  |
| value_loss         | 0.000493 |
---------------------------------
---------------------------------
| explained_variance | -0.105   |
| fps                | 860      |
| nupdates           | 590500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2952500  |
| value_loss         | 0.000206 |
---------------------------------
---------------------------------
| explained_variance | 0.966    |
| fps                | 860      |
| nupdates           | 590600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2953000  |
| value_loss         | 1.18e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.939    |
| fps                | 860      |
| nupdates           | 590700   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.952    |
| fps                | 860      |
| nupdates           | 593500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2967500  |
| value_loss         | 2.94e-05 |
---------------------------------
---------------------------------
| explained_variance | -2       |
| fps                | 860      |
| nupdates           | 593600   |
| policy_entropy     | 2.03     |
| total_timesteps    | 2968000  |
| value_loss         | 0.000122 |
---------------------------------
---------------------------------
| explained_variance | -8.67    |
| fps                | 860      |
| nupdates           | 593700   |
| policy_entropy     | 2.04     |
| total_timesteps    | 2968500  |
| value_loss         | 0.00099  |
---------------------------------
---------------------------------
| explained_variance | -0.944   |
| fps                | 860      |
| nupdates           | 593800   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.956    |
| fps                | 860      |
| nupdates           | 596500   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2982500  |
| value_loss         | 1.03e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.302    |
| fps                | 860      |
| nupdates           | 596600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2983000  |
| value_loss         | 0.000622 |
---------------------------------
---------------------------------
| explained_variance | 0.711    |
| fps                | 860      |
| nupdates           | 596700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2983500  |
| value_loss         | 5.88e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.439    |
| fps                | 860      |
| nupdates           | 596800   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -0.355   |
| fps                | 860      |
| nupdates           | 599600   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2998000  |
| value_loss         | 0.00179  |
---------------------------------
---------------------------------
| explained_variance | 0.568    |
| fps                | 860      |
| nupdates           | 599700   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2998500  |
| value_loss         | 0.000147 |
---------------------------------
---------------------------------
| explained_variance | -14.2    |
| fps                | 860      |
| nupdates           | 599800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2999000  |
| value_loss         | 0.00341  |
---------------------------------
---------------------------------
| explained_variance | 0.99     |
| fps                | 860      |
| nupdates           | 599900   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -2.13    |
| fps                | 860      |
| nupdates           | 602600   |
| policy_entropy     | 2.08     |
| total_timesteps    | 3013000  |
| value_loss         | 0.000172 |
---------------------------------
---------------------------------
| explained_variance | 0.944    |
| fps                | 860      |
| nupdates           | 602700   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3013500  |
| value_loss         | 2.93e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.339    |
| fps                | 860      |
| nupdates           | 602800   |
| policy_entropy     | 2.08     |
| total_timesteps    | 3014000  |
| value_loss         | 0.000133 |
---------------------------------
---------------------------------
| explained_variance | 0.311    |
| fps                | 860      |
| nupdates           | 602900   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -13.1    |
| fps                | 859      |
| nupdates           | 605600   |
| policy_entropy     | 2.08     |
| total_timesteps    | 3028000  |
| value_loss         | 0.000145 |
---------------------------------
---------------------------------
| explained_variance | 0.242    |
| fps                | 859      |
| nupdates           | 605700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3028500  |
| value_loss         | 9.18e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.69    |
| fps                | 859      |
| nupdates           | 605800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3029000  |
| value_loss         | 0.000351 |
---------------------------------
---------------------------------
| explained_variance | -0.365   |
| fps                | 859      |
| nupdates           | 605900   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.586    |
| fps                | 860      |
| nupdates           | 608700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3043500  |
| value_loss         | 2.16e-05 |
---------------------------------
---------------------------------
| explained_variance | -9.76    |
| fps                | 860      |
| nupdates           | 608800   |
| policy_entropy     | 2.08     |
| total_timesteps    | 3044000  |
| value_loss         | 0.00104  |
---------------------------------
---------------------------------
| explained_variance | 0.995    |
| fps                | 860      |
| nupdates           | 608900   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3044500  |
| value_loss         | 2.34e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.473    |
| fps                | 860      |
| nupdates           | 609000   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.911    |
| fps                | 859      |
| nupdates           | 611700   |
| policy_entropy     | 2.08     |
| total_timesteps    | 3058500  |
| value_loss         | 1.02e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.79     |
| fps                | 859      |
| nupdates           | 611800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3059000  |
| value_loss         | 2.44e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.961    |
| fps                | 859      |
| nupdates           | 611900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3059500  |
| value_loss         | 1.01e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.893    |
| fps                | 859      |
| nupdates           | 612000   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.25     |
| fps                | 859      |
| nupdates           | 614800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3074000  |
| value_loss         | 0.000333 |
---------------------------------
---------------------------------
| explained_variance | -5.64    |
| fps                | 859      |
| nupdates           | 614900   |
| policy_entropy     | 2.08     |
| total_timesteps    | 3074500  |
| value_loss         | 0.000422 |
---------------------------------
Eval num_timesteps=3075000, episode_reward=-4.80 +/- 0.40
Episode length: 590.90 +/- 120.00
---------------------------------
| explained_variance | 0.975    |
| fps                | 858      |
| nupdates           | 615000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3075000  |
| value_loss         | 3.57e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.843    |
| fps                | 8

---------------------------------
| explained_variance | 0.84     |
| fps                | 858      |
| nupdates           | 617800   |
| policy_entropy     | 2.01     |
| total_timesteps    | 3089000  |
| value_loss         | 3.11e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.988    |
| fps                | 858      |
| nupdates           | 617900   |
| policy_entropy     | 2.01     |
| total_timesteps    | 3089500  |
| value_loss         | 2.36e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.84    |
| fps                | 858      |
| nupdates           | 618000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3090000  |
| value_loss         | 7.94e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.959    |
| fps                | 858      |
| nupdates           | 618100   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.151   |
| fps                | 857      |
| nupdates           | 620800   |
| policy_entropy     | 2.08     |
| total_timesteps    | 3104000  |
| value_loss         | 0.000167 |
---------------------------------
---------------------------------
| explained_variance | -0.942   |
| fps                | 857      |
| nupdates           | 620900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3104500  |
| value_loss         | 0.000482 |
---------------------------------
---------------------------------
| explained_variance | 0.361    |
| fps                | 857      |
| nupdates           | 621000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3105000  |
| value_loss         | 0.19     |
---------------------------------
---------------------------------
| explained_variance | 0.552    |
| fps                | 857      |
| nupdates           | 621100   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.92     |
| fps                | 857      |
| nupdates           | 623900   |
| policy_entropy     | 1.84     |
| total_timesteps    | 3119500  |
| value_loss         | 5.8e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.947    |
| fps                | 857      |
| nupdates           | 624000   |
| policy_entropy     | 1.99     |
| total_timesteps    | 3120000  |
| value_loss         | 2.54e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.59    |
| fps                | 857      |
| nupdates           | 624100   |
| policy_entropy     | 2        |
| total_timesteps    | 3120500  |
| value_loss         | 0.00114  |
---------------------------------
---------------------------------
| explained_variance | 0.98     |
| fps                | 857      |
| nupdates           | 624200   |
| policy_entropy     | 1.94     |
| total_timest

---------------------------------
| explained_variance | 0.923    |
| fps                | 856      |
| nupdates           | 626900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3134500  |
| value_loss         | 2.41e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.537    |
| fps                | 856      |
| nupdates           | 627000   |
| policy_entropy     | 2.04     |
| total_timesteps    | 3135000  |
| value_loss         | 0.000135 |
---------------------------------
---------------------------------
| explained_variance | 0.42     |
| fps                | 856      |
| nupdates           | 627100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3135500  |
| value_loss         | 1.08e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.187   |
| fps                | 856      |
| nupdates           | 627200   |
| policy_entropy     | 2.07     |
| total_timest

Eval num_timesteps=3150000, episode_reward=-4.80 +/- 0.40
Episode length: 603.10 +/- 122.34
---------------------------------
| explained_variance | -1.02    |
| fps                | 855      |
| nupdates           | 630000   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3150000  |
| value_loss         | 3.39e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.553    |
| fps                | 855      |
| nupdates           | 630100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3150500  |
| value_loss         | 1.9e-05  |
---------------------------------
---------------------------------
| explained_variance | -11.6    |
| fps                | 855      |
| nupdates           | 630200   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3151000  |
| value_loss         | 0.000598 |
---------------------------------
---------------------------------
| explained_variance | -0.323   |
| fps                | 8

---------------------------------
| explained_variance | -11.2    |
| fps                | 855      |
| nupdates           | 633000   |
| policy_entropy     | 2.08     |
| total_timesteps    | 3165000  |
| value_loss         | 0.00065  |
---------------------------------
---------------------------------
| explained_variance | 0.978    |
| fps                | 855      |
| nupdates           | 633100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3165500  |
| value_loss         | 7.45e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.996    |
| fps                | 855      |
| nupdates           | 633200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3166000  |
| value_loss         | 1.58e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.151    |
| fps                | 855      |
| nupdates           | 633300   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -1.15    |
| fps                | 854      |
| nupdates           | 636000   |
| policy_entropy     | 2.03     |
| total_timesteps    | 3180000  |
| value_loss         | 3.41e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.573    |
| fps                | 854      |
| nupdates           | 636100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3180500  |
| value_loss         | 0.000182 |
---------------------------------
---------------------------------
| explained_variance | 0.0077   |
| fps                | 854      |
| nupdates           | 636200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3181000  |
| value_loss         | 1.47e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.909    |
| fps                | 854      |
| nupdates           | 636300   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -0.446   |
| fps                | 854      |
| nupdates           | 639100   |
| policy_entropy     | 2.03     |
| total_timesteps    | 3195500  |
| value_loss         | 4.8e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.175    |
| fps                | 854      |
| nupdates           | 639200   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3196000  |
| value_loss         | 9.89e-06 |
---------------------------------
---------------------------------
| explained_variance | -0.472   |
| fps                | 854      |
| nupdates           | 639300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3196500  |
| value_loss         | 0.000425 |
---------------------------------
---------------------------------
| explained_variance | -0.0133  |
| fps                | 854      |
| nupdates           | 639400   |
| policy_entropy     | 1.68     |
| total_timest

---------------------------------
| explained_variance | -0.388   |
| fps                | 853      |
| nupdates           | 642100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3210500  |
| value_loss         | 0.00012  |
---------------------------------
----------------------------------
| explained_variance | -9.64e+03 |
| fps                | 853       |
| nupdates           | 642200    |
| policy_entropy     | 1.86      |
| total_timesteps    | 3211000   |
| value_loss         | 0.141     |
----------------------------------
---------------------------------
| explained_variance | -0.128   |
| fps                | 853      |
| nupdates           | 642300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3211500  |
| value_loss         | 0.000375 |
---------------------------------
---------------------------------
| explained_variance | 0.892    |
| fps                | 853      |
| nupdates           | 642400   |
| policy_entropy     | 2.05     |
| tota

---------------------------------
| explained_variance | 0.931    |
| fps                | 852      |
| nupdates           | 645100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3225500  |
| value_loss         | 0.00015  |
---------------------------------
---------------------------------
| explained_variance | 0.618    |
| fps                | 852      |
| nupdates           | 645200   |
| policy_entropy     | 2.04     |
| total_timesteps    | 3226000  |
| value_loss         | 0.000213 |
---------------------------------
---------------------------------
| explained_variance | -1.05    |
| fps                | 852      |
| nupdates           | 645300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3226500  |
| value_loss         | 0.000192 |
---------------------------------
---------------------------------
| explained_variance | 0.353    |
| fps                | 852      |
| nupdates           | 645400   |
| policy_entropy     | 1.75     |
| total_timest

---------------------------------
| explained_variance | 0.553    |
| fps                | 852      |
| nupdates           | 648200   |
| policy_entropy     | 2.04     |
| total_timesteps    | 3241000  |
| value_loss         | 0.000134 |
---------------------------------
----------------------------------
| explained_variance | -8.93e+03 |
| fps                | 852       |
| nupdates           | 648300    |
| policy_entropy     | 2.02      |
| total_timesteps    | 3241500   |
| value_loss         | 0.153     |
----------------------------------
---------------------------------
| explained_variance | 0.818    |
| fps                | 852      |
| nupdates           | 648400   |
| policy_entropy     | 2.08     |
| total_timesteps    | 3242000  |
| value_loss         | 1.83e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.964    |
| fps                | 852      |
| nupdates           | 648500   |
| policy_entropy     | 2.08     |
| tota

---------------------------------
| explained_variance | -5.47    |
| fps                | 852      |
| nupdates           | 651200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3256000  |
| value_loss         | 0.000211 |
---------------------------------
---------------------------------
| explained_variance | -0.22    |
| fps                | 852      |
| nupdates           | 651300   |
| policy_entropy     | 2.03     |
| total_timesteps    | 3256500  |
| value_loss         | 0.000753 |
---------------------------------
---------------------------------
| explained_variance | 0.844    |
| fps                | 852      |
| nupdates           | 651400   |
| policy_entropy     | 2.03     |
| total_timesteps    | 3257000  |
| value_loss         | 2.77e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.873    |
| fps                | 852      |
| nupdates           | 651500   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.831    |
| fps                | 852      |
| nupdates           | 654300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3271500  |
| value_loss         | 4.5e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.316    |
| fps                | 852      |
| nupdates           | 654400   |
| policy_entropy     | 2.04     |
| total_timesteps    | 3272000  |
| value_loss         | 0.000104 |
---------------------------------
---------------------------------
| explained_variance | -11.2    |
| fps                | 852      |
| nupdates           | 654500   |
| policy_entropy     | 2.01     |
| total_timesteps    | 3272500  |
| value_loss         | 0.00233  |
---------------------------------
---------------------------------
| explained_variance | -0.182   |
| fps                | 852      |
| nupdates           | 654600   |
| policy_entropy     | 2.01     |
| total_timest

---------------------------------
| explained_variance | -0.236   |
| fps                | 851      |
| nupdates           | 657300   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3286500  |
| value_loss         | 0.000132 |
---------------------------------
---------------------------------
| explained_variance | 0.806    |
| fps                | 851      |
| nupdates           | 657400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3287000  |
| value_loss         | 2.51e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.545    |
| fps                | 851      |
| nupdates           | 657500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3287500  |
| value_loss         | 0.00133  |
---------------------------------
---------------------------------
| explained_variance | -0.232   |
| fps                | 851      |
| nupdates           | 657600   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.438   |
| fps                | 850      |
| nupdates           | 660300   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3301500  |
| value_loss         | 0.000369 |
---------------------------------
---------------------------------
| explained_variance | 0.592    |
| fps                | 850      |
| nupdates           | 660400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3302000  |
| value_loss         | 3.55e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.948   |
| fps                | 850      |
| nupdates           | 660500   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3302500  |
| value_loss         | 0.00127  |
---------------------------------
---------------------------------
| explained_variance | 0.884    |
| fps                | 850      |
| nupdates           | 660600   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.0804  |
| fps                | 850      |
| nupdates           | 663400   |
| policy_entropy     | 2        |
| total_timesteps    | 3317000  |
| value_loss         | 6.88e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.16    |
| fps                | 850      |
| nupdates           | 663500   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3317500  |
| value_loss         | 7.06e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.978    |
| fps                | 850      |
| nupdates           | 663600   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3318000  |
| value_loss         | 6.59e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.991    |
| fps                | 850      |
| nupdates           | 663700   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.575    |
| fps                | 849      |
| nupdates           | 666400   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3332000  |
| value_loss         | 0.000345 |
---------------------------------
---------------------------------
| explained_variance | 0.589    |
| fps                | 849      |
| nupdates           | 666500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3332500  |
| value_loss         | 0.000731 |
---------------------------------
---------------------------------
| explained_variance | 0.889    |
| fps                | 849      |
| nupdates           | 666600   |
| policy_entropy     | 1.94     |
| total_timesteps    | 3333000  |
| value_loss         | 0.000266 |
---------------------------------
---------------------------------
| explained_variance | -1.43    |
| fps                | 849      |
| nupdates           | 666700   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.956    |
| fps                | 849      |
| nupdates           | 669500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3347500  |
| value_loss         | 7.37e-06 |
---------------------------------
---------------------------------
| explained_variance | -2.5     |
| fps                | 849      |
| nupdates           | 669600   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3348000  |
| value_loss         | 0.000159 |
---------------------------------
---------------------------------
| explained_variance | 0.945    |
| fps                | 849      |
| nupdates           | 669700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3348500  |
| value_loss         | 2.82e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.882    |
| fps                | 849      |
| nupdates           | 669800   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.576    |
| fps                | 848      |
| nupdates           | 672500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3362500  |
| value_loss         | 4.44e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.19    |
| fps                | 848      |
| nupdates           | 672600   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3363000  |
| value_loss         | 6.62e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.828    |
| fps                | 848      |
| nupdates           | 672700   |
| policy_entropy     | 2.04     |
| total_timesteps    | 3363500  |
| value_loss         | 0.000157 |
---------------------------------
---------------------------------
| explained_variance | -1.31    |
| fps                | 848      |
| nupdates           | 672800   |
| policy_entropy     | 1.71     |
| total_timest

---------------------------------
| explained_variance | -0.411   |
| fps                | 847      |
| nupdates           | 675500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3377500  |
| value_loss         | 0.00132  |
---------------------------------
---------------------------------
| explained_variance | 0.593    |
| fps                | 847      |
| nupdates           | 675600   |
| policy_entropy     | 2.04     |
| total_timesteps    | 3378000  |
| value_loss         | 0.000205 |
---------------------------------
---------------------------------
| explained_variance | 0.918    |
| fps                | 847      |
| nupdates           | 675700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3378500  |
| value_loss         | 0.00022  |
---------------------------------
---------------------------------
| explained_variance | -13.8    |
| fps                | 847      |
| nupdates           | 675800   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -1.02    |
| fps                | 847      |
| nupdates           | 678600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3393000  |
| value_loss         | 0.000912 |
---------------------------------
---------------------------------
| explained_variance | -0.115   |
| fps                | 847      |
| nupdates           | 678700   |
| policy_entropy     | 2.04     |
| total_timesteps    | 3393500  |
| value_loss         | 0.000134 |
---------------------------------
---------------------------------
| explained_variance | 0.822    |
| fps                | 847      |
| nupdates           | 678800   |
| policy_entropy     | 2.08     |
| total_timesteps    | 3394000  |
| value_loss         | 2.7e-06  |
---------------------------------
---------------------------------
| explained_variance | 0.862    |
| fps                | 847      |
| nupdates           | 678900   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.984    |
| fps                | 846      |
| nupdates           | 681600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3408000  |
| value_loss         | 1.94e-05 |
---------------------------------
---------------------------------
| explained_variance | -24      |
| fps                | 846      |
| nupdates           | 681700   |
| policy_entropy     | 2.03     |
| total_timesteps    | 3408500  |
| value_loss         | 0.00446  |
---------------------------------
---------------------------------
| explained_variance | 0.946    |
| fps                | 846      |
| nupdates           | 681800   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3409000  |
| value_loss         | 0.000104 |
---------------------------------
---------------------------------
| explained_variance | -0.496   |
| fps                | 846      |
| nupdates           | 681900   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -0.285   |
| fps                | 847      |
| nupdates           | 684700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3423500  |
| value_loss         | 0.00021  |
---------------------------------
---------------------------------
| explained_variance | 0.474    |
| fps                | 847      |
| nupdates           | 684800   |
| policy_entropy     | 2.04     |
| total_timesteps    | 3424000  |
| value_loss         | 0.93     |
---------------------------------
---------------------------------
| explained_variance | 0.457    |
| fps                | 847      |
| nupdates           | 684900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3424500  |
| value_loss         | 2.11e-05 |
---------------------------------
Eval num_timesteps=3425000, episode_reward=-4.90 +/- 0.30
Episode length: 550.70 +/- 62.56
---------------------------------
| explained_variance | -0.00338 |
| fps                | 84

---------------------------------
| explained_variance | -0.0468  |
| fps                | 846      |
| nupdates           | 687700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3438500  |
| value_loss         | 0.000291 |
---------------------------------
---------------------------------
| explained_variance | -0.132   |
| fps                | 846      |
| nupdates           | 687800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3439000  |
| value_loss         | 5.13e-05 |
---------------------------------
----------------------------------
| explained_variance | -1.26e+03 |
| fps                | 846       |
| nupdates           | 687900    |
| policy_entropy     | 1.99      |
| total_timesteps    | 3439500   |
| value_loss         | 0.0602    |
----------------------------------
---------------------------------
| explained_variance | 0.939    |
| fps                | 846      |
| nupdates           | 688000   |
| policy_entropy     | 2.05     |
| tota

---------------------------------
| explained_variance | 0.984    |
| fps                | 845      |
| nupdates           | 690700   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3453500  |
| value_loss         | 0.0011   |
---------------------------------
---------------------------------
| explained_variance | 0.341    |
| fps                | 845      |
| nupdates           | 690800   |
| policy_entropy     | 2.04     |
| total_timesteps    | 3454000  |
| value_loss         | 0.174    |
---------------------------------
---------------------------------
| explained_variance | 0.663    |
| fps                | 845      |
| nupdates           | 690900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3454500  |
| value_loss         | 0.000371 |
---------------------------------
---------------------------------
| explained_variance | -2.25    |
| fps                | 845      |
| nupdates           | 691000   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.366    |
| fps                | 844      |
| nupdates           | 693800   |
| policy_entropy     | 2.04     |
| total_timesteps    | 3469000  |
| value_loss         | 0.0997   |
---------------------------------
---------------------------------
| explained_variance | 0.798    |
| fps                | 844      |
| nupdates           | 693900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3469500  |
| value_loss         | 4.93e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.853    |
| fps                | 844      |
| nupdates           | 694000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3470000  |
| value_loss         | 5.09e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.795    |
| fps                | 844      |
| nupdates           | 694100   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -0.5     |
| fps                | 843      |
| nupdates           | 696800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3484000  |
| value_loss         | 1.19e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.531    |
| fps                | 843      |
| nupdates           | 696900   |
| policy_entropy     | 2.08     |
| total_timesteps    | 3484500  |
| value_loss         | 0.000138 |
---------------------------------
---------------------------------
| explained_variance | -46.8    |
| fps                | 843      |
| nupdates           | 697000   |
| policy_entropy     | 2.02     |
| total_timesteps    | 3485000  |
| value_loss         | 0.00186  |
---------------------------------
---------------------------------
| explained_variance | 0.358    |
| fps                | 843      |
| nupdates           | 697100   |
| policy_entropy     | 1.69     |
| total_timest

---------------------------------
| explained_variance | 0.734    |
| fps                | 843      |
| nupdates           | 699900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3499500  |
| value_loss         | 1.7e-05  |
---------------------------------
Eval num_timesteps=3500000, episode_reward=-5.00 +/- 0.00
Episode length: 583.00 +/- 145.64
---------------------------------
| explained_variance | 0.151    |
| fps                | 842      |
| nupdates           | 700000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3500000  |
| value_loss         | 0.000111 |
---------------------------------
---------------------------------
| explained_variance | -10.7    |
| fps                | 843      |
| nupdates           | 700100   |
| policy_entropy     | 1.81     |
| total_timesteps    | 3500500  |
| value_loss         | 0.00408  |
---------------------------------
---------------------------------
| explained_variance | -0.0309  |
| fps                | 8

---------------------------------
| explained_variance | 0.644    |
| fps                | 843      |
| nupdates           | 702900   |
| policy_entropy     | 1.86     |
| total_timesteps    | 3514500  |
| value_loss         | 0.000423 |
---------------------------------
---------------------------------
| explained_variance | 0.749    |
| fps                | 843      |
| nupdates           | 703000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3515000  |
| value_loss         | 4.78e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.983    |
| fps                | 843      |
| nupdates           | 703100   |
| policy_entropy     | 1.92     |
| total_timesteps    | 3515500  |
| value_loss         | 3.42e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.545    |
| fps                | 843      |
| nupdates           | 703200   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.98     |
| fps                | 842      |
| nupdates           | 705900   |
| policy_entropy     | 1.02     |
| total_timesteps    | 3529500  |
| value_loss         | 0.000792 |
---------------------------------
---------------------------------
| explained_variance | 0.941    |
| fps                | 842      |
| nupdates           | 706000   |
| policy_entropy     | 2.01     |
| total_timesteps    | 3530000  |
| value_loss         | 0.000108 |
---------------------------------
---------------------------------
| explained_variance | 0.939    |
| fps                | 842      |
| nupdates           | 706100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3530500  |
| value_loss         | 3.82e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.591    |
| fps                | 842      |
| nupdates           | 706200   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.742    |
| fps                | 842      |
| nupdates           | 709000   |
| policy_entropy     | 2.08     |
| total_timesteps    | 3545000  |
| value_loss         | 2.48e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.00522  |
| fps                | 842      |
| nupdates           | 709100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3545500  |
| value_loss         | 0.000104 |
---------------------------------
---------------------------------
| explained_variance | 0.38     |
| fps                | 842      |
| nupdates           | 709200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3546000  |
| value_loss         | 2e-05    |
---------------------------------
---------------------------------
| explained_variance | 0.641    |
| fps                | 842      |
| nupdates           | 709300   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -30.2    |
| fps                | 841      |
| nupdates           | 712000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3560000  |
| value_loss         | 0.00264  |
---------------------------------
---------------------------------
| explained_variance | 0.957    |
| fps                | 841      |
| nupdates           | 712100   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3560500  |
| value_loss         | 3.65e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.919    |
| fps                | 841      |
| nupdates           | 712200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3561000  |
| value_loss         | 6.99e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.983    |
| fps                | 841      |
| nupdates           | 712300   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.0307   |
| fps                | 841      |
| nupdates           | 715100   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3575500  |
| value_loss         | 2.79e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.128    |
| fps                | 841      |
| nupdates           | 715200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3576000  |
| value_loss         | 0.00045  |
---------------------------------
---------------------------------
| explained_variance | -3.07    |
| fps                | 841      |
| nupdates           | 715300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3576500  |
| value_loss         | 0.000561 |
---------------------------------
---------------------------------
| explained_variance | -0.124   |
| fps                | 841      |
| nupdates           | 715400   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -1.04    |
| fps                | 841      |
| nupdates           | 718200   |
| policy_entropy     | 1.99     |
| total_timesteps    | 3591000  |
| value_loss         | 8.78e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.00193  |
| fps                | 841      |
| nupdates           | 718300   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3591500  |
| value_loss         | 0.000366 |
---------------------------------
---------------------------------
| explained_variance | -10.9    |
| fps                | 841      |
| nupdates           | 718400   |
| policy_entropy     | 1.98     |
| total_timesteps    | 3592000  |
| value_loss         | 0.00149  |
---------------------------------
---------------------------------
| explained_variance | -6.73    |
| fps                | 841      |
| nupdates           | 718500   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.966    |
| fps                | 840      |
| nupdates           | 721200   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3606000  |
| value_loss         | 9.91e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.485    |
| fps                | 840      |
| nupdates           | 721300   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3606500  |
| value_loss         | 0.000164 |
---------------------------------
---------------------------------
| explained_variance | 0.489    |
| fps                | 840      |
| nupdates           | 721400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3607000  |
| value_loss         | 0.000385 |
---------------------------------
---------------------------------
| explained_variance | 0.994    |
| fps                | 840      |
| nupdates           | 721500   |
| policy_entropy     | 2.06     |
| total_timest

----------------------------------
| explained_variance | -2.19e+04 |
| fps                | 840       |
| nupdates           | 724300    |
| policy_entropy     | 2.07      |
| total_timesteps    | 3621500   |
| value_loss         | 0.163     |
----------------------------------
---------------------------------
| explained_variance | 0.388    |
| fps                | 840      |
| nupdates           | 724400   |
| policy_entropy     | 2.04     |
| total_timesteps    | 3622000  |
| value_loss         | 5.72e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.0436  |
| fps                | 840      |
| nupdates           | 724500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3622500  |
| value_loss         | 0.000171 |
---------------------------------
---------------------------------
| explained_variance | -0.409   |
| fps                | 840      |
| nupdates           | 724600   |
| policy_entropy     | 2.08     |
| tota

---------------------------------
| explained_variance | -45.2    |
| fps                | 839      |
| nupdates           | 727300   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3636500  |
| value_loss         | 0.00438  |
---------------------------------
---------------------------------
| explained_variance | 0.285    |
| fps                | 839      |
| nupdates           | 727400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3637000  |
| value_loss         | 9e-05    |
---------------------------------
---------------------------------
| explained_variance | -6.77    |
| fps                | 839      |
| nupdates           | 727500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3637500  |
| value_loss         | 0.000112 |
---------------------------------
---------------------------------
| explained_variance | -0.919   |
| fps                | 839      |
| nupdates           | 727600   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.204   |
| fps                | 839      |
| nupdates           | 730300   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3651500  |
| value_loss         | 0.000536 |
---------------------------------
---------------------------------
| explained_variance | 0.57     |
| fps                | 839      |
| nupdates           | 730400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3652000  |
| value_loss         | 0.000101 |
---------------------------------
---------------------------------
| explained_variance | 0.852    |
| fps                | 839      |
| nupdates           | 730500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3652500  |
| value_loss         | 3.75e-06 |
---------------------------------
---------------------------------
| explained_variance | -0.764   |
| fps                | 839      |
| nupdates           | 730600   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.987    |
| fps                | 839      |
| nupdates           | 733400   |
| policy_entropy     | 1.98     |
| total_timesteps    | 3667000  |
| value_loss         | 0.00114  |
---------------------------------
---------------------------------
| explained_variance | 0.355    |
| fps                | 839      |
| nupdates           | 733500   |
| policy_entropy     | 1.96     |
| total_timesteps    | 3667500  |
| value_loss         | 0.166    |
---------------------------------
---------------------------------
| explained_variance | 0.44     |
| fps                | 839      |
| nupdates           | 733600   |
| policy_entropy     | 2.02     |
| total_timesteps    | 3668000  |
| value_loss         | 3.37e-05 |
---------------------------------
---------------------------------
| explained_variance | -174     |
| fps                | 839      |
| nupdates           | 733700   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -1.2e+03 |
| fps                | 838      |
| nupdates           | 736400   |
| policy_entropy     | 2.02     |
| total_timesteps    | 3682000  |
| value_loss         | 0.0659   |
---------------------------------
---------------------------------
| explained_variance | 0.424    |
| fps                | 838      |
| nupdates           | 736500   |
| policy_entropy     | 1.97     |
| total_timesteps    | 3682500  |
| value_loss         | 0.138    |
---------------------------------
---------------------------------
| explained_variance | -1.03    |
| fps                | 838      |
| nupdates           | 736600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3683000  |
| value_loss         | 9.72e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.87     |
| fps                | 838      |
| nupdates           | 736700   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.621    |
| fps                | 838      |
| nupdates           | 739500   |
| policy_entropy     | 1.99     |
| total_timesteps    | 3697500  |
| value_loss         | 3.64e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.879    |
| fps                | 838      |
| nupdates           | 739600   |
| policy_entropy     | 1.96     |
| total_timesteps    | 3698000  |
| value_loss         | 0.000135 |
---------------------------------
---------------------------------
| explained_variance | 0.284    |
| fps                | 838      |
| nupdates           | 739700   |
| policy_entropy     | 2.04     |
| total_timesteps    | 3698500  |
| value_loss         | 0.000223 |
---------------------------------
---------------------------------
| explained_variance | 0.915    |
| fps                | 838      |
| nupdates           | 739800   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.204    |
| fps                | 838      |
| nupdates           | 742500   |
| policy_entropy     | 2.03     |
| total_timesteps    | 3712500  |
| value_loss         | 0.000469 |
---------------------------------
---------------------------------
| explained_variance | 0.819    |
| fps                | 838      |
| nupdates           | 742600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3713000  |
| value_loss         | 6.66e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.328    |
| fps                | 838      |
| nupdates           | 742700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3713500  |
| value_loss         | 0.000242 |
---------------------------------
---------------------------------
| explained_variance | -0.0619  |
| fps                | 838      |
| nupdates           | 742800   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.599    |
| fps                | 837      |
| nupdates           | 745500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3727500  |
| value_loss         | 2.88e-05 |
---------------------------------
---------------------------------
| explained_variance | -10.5    |
| fps                | 837      |
| nupdates           | 745600   |
| policy_entropy     | 1.72     |
| total_timesteps    | 3728000  |
| value_loss         | 0.00144  |
---------------------------------
---------------------------------
| explained_variance | 0.995    |
| fps                | 837      |
| nupdates           | 745700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3728500  |
| value_loss         | 7.59e-06 |
---------------------------------
---------------------------------
| explained_variance | -8.79    |
| fps                | 837      |
| nupdates           | 745800   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -12.1    |
| fps                | 837      |
| nupdates           | 748600   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3743000  |
| value_loss         | 0.000612 |
---------------------------------
---------------------------------
| explained_variance | 0.502    |
| fps                | 837      |
| nupdates           | 748700   |
| policy_entropy     | 2.03     |
| total_timesteps    | 3743500  |
| value_loss         | 9.15e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.327    |
| fps                | 837      |
| nupdates           | 748800   |
| policy_entropy     | 2.04     |
| total_timesteps    | 3744000  |
| value_loss         | 0.00164  |
---------------------------------
---------------------------------
| explained_variance | 0.958    |
| fps                | 837      |
| nupdates           | 748900   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.852    |
| fps                | 836      |
| nupdates           | 751600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3758000  |
| value_loss         | 5.51e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.768   |
| fps                | 836      |
| nupdates           | 751700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3758500  |
| value_loss         | 0.000188 |
---------------------------------
---------------------------------
| explained_variance | -0.482   |
| fps                | 836      |
| nupdates           | 751800   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3759000  |
| value_loss         | 3.44e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.994    |
| fps                | 836      |
| nupdates           | 751900   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.0384  |
| fps                | 837      |
| nupdates           | 754700   |
| policy_entropy     | 2.03     |
| total_timesteps    | 3773500  |
| value_loss         | 4.47e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.422    |
| fps                | 837      |
| nupdates           | 754800   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3774000  |
| value_loss         | 0.000138 |
---------------------------------
---------------------------------
| explained_variance | 0.386    |
| fps                | 837      |
| nupdates           | 754900   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3774500  |
| value_loss         | 7.12e-05 |
---------------------------------
Eval num_timesteps=3775000, episode_reward=-4.90 +/- 0.30
Episode length: 607.30 +/- 91.43
---------------------------------
| explained_variance | 0.451    |
| fps                | 83

---------------------------------
| explained_variance | 0.926    |
| fps                | 836      |
| nupdates           | 757700   |
| policy_entropy     | 2.04     |
| total_timesteps    | 3788500  |
| value_loss         | 6.29e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.136    |
| fps                | 836      |
| nupdates           | 757800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3789000  |
| value_loss         | 5.31e-05 |
---------------------------------
---------------------------------
| explained_variance | -4.39    |
| fps                | 836      |
| nupdates           | 757900   |
| policy_entropy     | 2.04     |
| total_timesteps    | 3789500  |
| value_loss         | 0.000587 |
---------------------------------
---------------------------------
| explained_variance | -43.1    |
| fps                | 836      |
| nupdates           | 758000   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -0.211   |
| fps                | 835      |
| nupdates           | 760700   |
| policy_entropy     | 2.08     |
| total_timesteps    | 3803500  |
| value_loss         | 0.000543 |
---------------------------------
---------------------------------
| explained_variance | 0.396    |
| fps                | 835      |
| nupdates           | 760800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3804000  |
| value_loss         | 9.96e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.725    |
| fps                | 835      |
| nupdates           | 760900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3804500  |
| value_loss         | 5.71e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.859    |
| fps                | 835      |
| nupdates           | 761000   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.784    |
| fps                | 835      |
| nupdates           | 763800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3819000  |
| value_loss         | 0.00026  |
---------------------------------
---------------------------------
| explained_variance | -2.07    |
| fps                | 835      |
| nupdates           | 763900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3819500  |
| value_loss         | 8.83e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.89     |
| fps                | 835      |
| nupdates           | 764000   |
| policy_entropy     | 2.03     |
| total_timesteps    | 3820000  |
| value_loss         | 0.000208 |
---------------------------------
---------------------------------
| explained_variance | 0.975    |
| fps                | 835      |
| nupdates           | 764100   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.94     |
| fps                | 834      |
| nupdates           | 766800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3834000  |
| value_loss         | 1.29e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.625    |
| fps                | 834      |
| nupdates           | 766900   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3834500  |
| value_loss         | 0.00018  |
---------------------------------
---------------------------------
| explained_variance | 0.968    |
| fps                | 834      |
| nupdates           | 767000   |
| policy_entropy     | 2.04     |
| total_timesteps    | 3835000  |
| value_loss         | 5.96e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.973    |
| fps                | 834      |
| nupdates           | 767100   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -0.00717 |
| fps                | 835      |
| nupdates           | 769900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3849500  |
| value_loss         | 0.000339 |
---------------------------------
Eval num_timesteps=3850000, episode_reward=-4.50 +/- 1.20
Episode length: 574.10 +/- 122.61
---------------------------------
| explained_variance | 0.0402   |
| fps                | 834      |
| nupdates           | 770000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3850000  |
| value_loss         | 0.000387 |
---------------------------------
---------------------------------
| explained_variance | 0.742    |
| fps                | 834      |
| nupdates           | 770100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3850500  |
| value_loss         | 0.000169 |
---------------------------------
---------------------------------
| explained_variance | 0.362    |
| fps                | 8

---------------------------------
| explained_variance | -2.01    |
| fps                | 834      |
| nupdates           | 772900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3864500  |
| value_loss         | 7.72e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.921    |
| fps                | 834      |
| nupdates           | 773000   |
| policy_entropy     | 2.08     |
| total_timesteps    | 3865000  |
| value_loss         | 1.78e-05 |
---------------------------------
---------------------------------
| explained_variance | -7.12    |
| fps                | 834      |
| nupdates           | 773100   |
| policy_entropy     | 2.08     |
| total_timesteps    | 3865500  |
| value_loss         | 0.00494  |
---------------------------------
---------------------------------
| explained_variance | 0.157    |
| fps                | 834      |
| nupdates           | 773200   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.0366   |
| fps                | 833      |
| nupdates           | 775900   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3879500  |
| value_loss         | 8.1e-05  |
---------------------------------
---------------------------------
| explained_variance | -0.0466  |
| fps                | 833      |
| nupdates           | 776000   |
| policy_entropy     | 2.08     |
| total_timesteps    | 3880000  |
| value_loss         | 0.000176 |
---------------------------------
---------------------------------
| explained_variance | 0.799    |
| fps                | 833      |
| nupdates           | 776100   |
| policy_entropy     | 2.08     |
| total_timesteps    | 3880500  |
| value_loss         | 0.000508 |
---------------------------------
---------------------------------
| explained_variance | -0.0361  |
| fps                | 833      |
| nupdates           | 776200   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.951    |
| fps                | 833      |
| nupdates           | 779000   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3895000  |
| value_loss         | 1.08e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.516    |
| fps                | 833      |
| nupdates           | 779100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3895500  |
| value_loss         | 0.000166 |
---------------------------------
---------------------------------
| explained_variance | 0.427    |
| fps                | 833      |
| nupdates           | 779200   |
| policy_entropy     | 2.01     |
| total_timesteps    | 3896000  |
| value_loss         | 0.000292 |
---------------------------------
---------------------------------
| explained_variance | 0.709    |
| fps                | 833      |
| nupdates           | 779300   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.702    |
| fps                | 832      |
| nupdates           | 782000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3910000  |
| value_loss         | 6.67e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.66     |
| fps                | 832      |
| nupdates           | 782100   |
| policy_entropy     | 2.08     |
| total_timesteps    | 3910500  |
| value_loss         | 0.000117 |
---------------------------------
---------------------------------
| explained_variance | 0.209    |
| fps                | 832      |
| nupdates           | 782200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3911000  |
| value_loss         | 0.000279 |
---------------------------------
---------------------------------
| explained_variance | 0.511    |
| fps                | 832      |
| nupdates           | 782300   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.228    |
| fps                | 832      |
| nupdates           | 785100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3925500  |
| value_loss         | 6.35e-05 |
---------------------------------
---------------------------------
| explained_variance | -5.81    |
| fps                | 832      |
| nupdates           | 785200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3926000  |
| value_loss         | 0.00197  |
---------------------------------
---------------------------------
| explained_variance | 0.585    |
| fps                | 832      |
| nupdates           | 785300   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3926500  |
| value_loss         | 2.78e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.655    |
| fps                | 832      |
| nupdates           | 785400   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.937    |
| fps                | 832      |
| nupdates           | 788200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3941000  |
| value_loss         | 9.53e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.765    |
| fps                | 832      |
| nupdates           | 788300   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3941500  |
| value_loss         | 2.05e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.34    |
| fps                | 832      |
| nupdates           | 788400   |
| policy_entropy     | 2.04     |
| total_timesteps    | 3942000  |
| value_loss         | 0.000636 |
---------------------------------
---------------------------------
| explained_variance | 0.0873   |
| fps                | 832      |
| nupdates           | 788500   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -0.382   |
| fps                | 831      |
| nupdates           | 791200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 3956000  |
| value_loss         | 0.000181 |
---------------------------------
---------------------------------
| explained_variance | -11      |
| fps                | 831      |
| nupdates           | 791300   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3956500  |
| value_loss         | 0.00045  |
---------------------------------
---------------------------------
| explained_variance | 0.965    |
| fps                | 831      |
| nupdates           | 791400   |
| policy_entropy     | 2.03     |
| total_timesteps    | 3957000  |
| value_loss         | 7.35e-05 |
---------------------------------
---------------------------------
| explained_variance | -4.52    |
| fps                | 831      |
| nupdates           | 791500   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.455    |
| fps                | 831      |
| nupdates           | 794300   |
| policy_entropy     | 2.02     |
| total_timesteps    | 3971500  |
| value_loss         | 0.000646 |
---------------------------------
---------------------------------
| explained_variance | -3.29    |
| fps                | 831      |
| nupdates           | 794400   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3972000  |
| value_loss         | 7.28e-05 |
---------------------------------
---------------------------------
| explained_variance | -4.54    |
| fps                | 831      |
| nupdates           | 794500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 3972500  |
| value_loss         | 0.000244 |
---------------------------------
---------------------------------
| explained_variance | 0.93     |
| fps                | 831      |
| nupdates           | 794600   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -432     |
| fps                | 831      |
| nupdates           | 797300   |
| policy_entropy     | 2.05     |
| total_timesteps    | 3986500  |
| value_loss         | 0.0126   |
---------------------------------
---------------------------------
| explained_variance | -1.46    |
| fps                | 831      |
| nupdates           | 797400   |
| policy_entropy     | 2.02     |
| total_timesteps    | 3987000  |
| value_loss         | 0.00168  |
---------------------------------
---------------------------------
| explained_variance | 0.916    |
| fps                | 831      |
| nupdates           | 797500   |
| policy_entropy     | 2        |
| total_timesteps    | 3987500  |
| value_loss         | 3.88e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.993    |
| fps                | 831      |
| nupdates           | 797600   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.97     |
| fps                | 830      |
| nupdates           | 800300   |
| policy_entropy     | 2.08     |
| total_timesteps    | 4001500  |
| value_loss         | 4.56e-06 |
---------------------------------
---------------------------------
| explained_variance | -7.96    |
| fps                | 830      |
| nupdates           | 800400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4002000  |
| value_loss         | 0.00295  |
---------------------------------
---------------------------------
| explained_variance | 0.721    |
| fps                | 830      |
| nupdates           | 800500   |
| policy_entropy     | 2.08     |
| total_timesteps    | 4002500  |
| value_loss         | 6.04e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.0566   |
| fps                | 830      |
| nupdates           | 800600   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -4.12    |
| fps                | 830      |
| nupdates           | 803400   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4017000  |
| value_loss         | 0.000175 |
---------------------------------
---------------------------------
| explained_variance | 0.475    |
| fps                | 830      |
| nupdates           | 803500   |
| policy_entropy     | 2.04     |
| total_timesteps    | 4017500  |
| value_loss         | 2.35e-05 |
---------------------------------
---------------------------------
| explained_variance | -9.67    |
| fps                | 830      |
| nupdates           | 803600   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4018000  |
| value_loss         | 0.000113 |
---------------------------------
---------------------------------
| explained_variance | -1.13    |
| fps                | 830      |
| nupdates           | 803700   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.0357  |
| fps                | 830      |
| nupdates           | 806400   |
| policy_entropy     | 2.03     |
| total_timesteps    | 4032000  |
| value_loss         | 7.29e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.11    |
| fps                | 830      |
| nupdates           | 806500   |
| policy_entropy     | 2.03     |
| total_timesteps    | 4032500  |
| value_loss         | 8.85e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.805    |
| fps                | 830      |
| nupdates           | 806600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4033000  |
| value_loss         | 2.38e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.678    |
| fps                | 830      |
| nupdates           | 806700   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.0933   |
| fps                | 830      |
| nupdates           | 809500   |
| policy_entropy     | 1.98     |
| total_timesteps    | 4047500  |
| value_loss         | 9.78e-05 |
---------------------------------
---------------------------------
| explained_variance | -3.88    |
| fps                | 830      |
| nupdates           | 809600   |
| policy_entropy     | 1.96     |
| total_timesteps    | 4048000  |
| value_loss         | 0.000229 |
---------------------------------
---------------------------------
| explained_variance | -0.516   |
| fps                | 830      |
| nupdates           | 809700   |
| policy_entropy     | 2        |
| total_timesteps    | 4048500  |
| value_loss         | 0.00108  |
---------------------------------
---------------------------------
| explained_variance | 0.847    |
| fps                | 830      |
| nupdates           | 809800   |
| policy_entropy     | 1.93     |
| total_timest

---------------------------------
| explained_variance | 0.8      |
| fps                | 829      |
| nupdates           | 812500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4062500  |
| value_loss         | 2.35e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.068    |
| fps                | 829      |
| nupdates           | 812600   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4063000  |
| value_loss         | 0.000436 |
---------------------------------
---------------------------------
| explained_variance | 0.665    |
| fps                | 829      |
| nupdates           | 812700   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4063500  |
| value_loss         | 0.000248 |
---------------------------------
---------------------------------
| explained_variance | 0.24     |
| fps                | 829      |
| nupdates           | 812800   |
| policy_entropy     | 2.02     |
| total_timest

---------------------------------
| explained_variance | -0.0544  |
| fps                | 828      |
| nupdates           | 815500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4077500  |
| value_loss         | 0.000398 |
---------------------------------
---------------------------------
| explained_variance | -3.93    |
| fps                | 828      |
| nupdates           | 815600   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4078000  |
| value_loss         | 0.000259 |
---------------------------------
---------------------------------
| explained_variance | -2.69    |
| fps                | 828      |
| nupdates           | 815700   |
| policy_entropy     | 2.02     |
| total_timesteps    | 4078500  |
| value_loss         | 0.000264 |
---------------------------------
---------------------------------
| explained_variance | 0.203    |
| fps                | 828      |
| nupdates           | 815800   |
| policy_entropy     | 2        |
| total_timest

---------------------------------
| explained_variance | 0.57     |
| fps                | 828      |
| nupdates           | 818600   |
| policy_entropy     | 2.08     |
| total_timesteps    | 4093000  |
| value_loss         | 0.000107 |
---------------------------------
---------------------------------
| explained_variance | -8.25    |
| fps                | 828      |
| nupdates           | 818700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4093500  |
| value_loss         | 0.00127  |
---------------------------------
---------------------------------
| explained_variance | 0.868    |
| fps                | 828      |
| nupdates           | 818800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4094000  |
| value_loss         | 1.97e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.23    |
| fps                | 828      |
| nupdates           | 818900   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -0.98    |
| fps                | 828      |
| nupdates           | 821600   |
| policy_entropy     | 2.01     |
| total_timesteps    | 4108000  |
| value_loss         | 0.000181 |
---------------------------------
---------------------------------
| explained_variance | 0.31     |
| fps                | 828      |
| nupdates           | 821700   |
| policy_entropy     | 2.03     |
| total_timesteps    | 4108500  |
| value_loss         | 3.01e-05 |
---------------------------------
---------------------------------
| explained_variance | -15.6    |
| fps                | 828      |
| nupdates           | 821800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4109000  |
| value_loss         | 0.00558  |
---------------------------------
---------------------------------
| explained_variance | 0.451    |
| fps                | 828      |
| nupdates           | 821900   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.482    |
| fps                | 828      |
| nupdates           | 824700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4123500  |
| value_loss         | 1.33e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.209   |
| fps                | 828      |
| nupdates           | 824800   |
| policy_entropy     | 2.04     |
| total_timesteps    | 4124000  |
| value_loss         | 0.000165 |
---------------------------------
---------------------------------
| explained_variance | 0.888    |
| fps                | 828      |
| nupdates           | 824900   |
| policy_entropy     | 2.04     |
| total_timesteps    | 4124500  |
| value_loss         | 3.22e-05 |
---------------------------------
Eval num_timesteps=4125000, episode_reward=-5.00 +/- 0.00
Episode length: 587.20 +/- 152.43
---------------------------------
| explained_variance | 0.902    |
| fps                | 8

---------------------------------
| explained_variance | -0.481   |
| fps                | 828      |
| nupdates           | 827700   |
| policy_entropy     | 2.04     |
| total_timesteps    | 4138500  |
| value_loss         | 0.000894 |
---------------------------------
---------------------------------
| explained_variance | -3.11    |
| fps                | 828      |
| nupdates           | 827800   |
| policy_entropy     | 2.08     |
| total_timesteps    | 4139000  |
| value_loss         | 0.000407 |
---------------------------------
---------------------------------
| explained_variance | 0.949    |
| fps                | 828      |
| nupdates           | 827900   |
| policy_entropy     | 2.08     |
| total_timesteps    | 4139500  |
| value_loss         | 2.61e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.914    |
| fps                | 828      |
| nupdates           | 828000   |
| policy_entropy     | 2.01     |
| total_timest

---------------------------------
| explained_variance | 0.38     |
| fps                | 827      |
| nupdates           | 830700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4153500  |
| value_loss         | 0.000289 |
---------------------------------
---------------------------------
| explained_variance | 0.976    |
| fps                | 827      |
| nupdates           | 830800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4154000  |
| value_loss         | 0.000554 |
---------------------------------
---------------------------------
| explained_variance | 0.994    |
| fps                | 827      |
| nupdates           | 830900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4154500  |
| value_loss         | 8.87e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.693    |
| fps                | 827      |
| nupdates           | 831000   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.855    |
| fps                | 828      |
| nupdates           | 833800   |
| policy_entropy     | 2.04     |
| total_timesteps    | 4169000  |
| value_loss         | 2.16e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.686    |
| fps                | 828      |
| nupdates           | 833900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4169500  |
| value_loss         | 0.000244 |
---------------------------------
---------------------------------
| explained_variance | -2.2     |
| fps                | 828      |
| nupdates           | 834000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4170000  |
| value_loss         | 9.03e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.28     |
| fps                | 828      |
| nupdates           | 834100   |
| policy_entropy     | 1.86     |
| total_timest

---------------------------------
| explained_variance | 0.383    |
| fps                | 827      |
| nupdates           | 836800   |
| policy_entropy     | 2.04     |
| total_timesteps    | 4184000  |
| value_loss         | 2.21e-05 |
---------------------------------
---------------------------------
| explained_variance | -12.3    |
| fps                | 827      |
| nupdates           | 836900   |
| policy_entropy     | 2.03     |
| total_timesteps    | 4184500  |
| value_loss         | 0.000533 |
---------------------------------
---------------------------------
| explained_variance | 0.701    |
| fps                | 827      |
| nupdates           | 837000   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4185000  |
| value_loss         | 0.000162 |
---------------------------------
---------------------------------
| explained_variance | 0.977    |
| fps                | 827      |
| nupdates           | 837100   |
| policy_entropy     | 1.59     |
| total_timest

---------------------------------
| explained_variance | -0.125   |
| fps                | 827      |
| nupdates           | 839900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4199500  |
| value_loss         | 0.000332 |
---------------------------------
Eval num_timesteps=4200000, episode_reward=-4.60 +/- 0.49
Episode length: 670.10 +/- 83.91
---------------------------------
| explained_variance | -1.75    |
| fps                | 827      |
| nupdates           | 840000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4200000  |
| value_loss         | 0.000341 |
---------------------------------
---------------------------------
| explained_variance | 0.926    |
| fps                | 827      |
| nupdates           | 840100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4200500  |
| value_loss         | 1.85e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.717    |
| fps                | 82

---------------------------------
| explained_variance | 0.975    |
| fps                | 827      |
| nupdates           | 842900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4214500  |
| value_loss         | 2.66e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.49    |
| fps                | 827      |
| nupdates           | 843000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4215000  |
| value_loss         | 0.000572 |
---------------------------------
---------------------------------
| explained_variance | -1.61    |
| fps                | 827      |
| nupdates           | 843100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4215500  |
| value_loss         | 0.000316 |
---------------------------------
---------------------------------
| explained_variance | 0.573    |
| fps                | 827      |
| nupdates           | 843200   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -8.7     |
| fps                | 827      |
| nupdates           | 845900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4229500  |
| value_loss         | 8.07e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.105   |
| fps                | 827      |
| nupdates           | 846000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4230000  |
| value_loss         | 0.000132 |
---------------------------------
---------------------------------
| explained_variance | -0.391   |
| fps                | 827      |
| nupdates           | 846100   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4230500  |
| value_loss         | 2.66e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.371    |
| fps                | 827      |
| nupdates           | 846200   |
| policy_entropy     | 1.48     |
| total_timest

---------------------------------
| explained_variance | -6.63    |
| fps                | 827      |
| nupdates           | 849000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4245000  |
| value_loss         | 0.000219 |
---------------------------------
---------------------------------
| explained_variance | 0.681    |
| fps                | 827      |
| nupdates           | 849100   |
| policy_entropy     | 1.32     |
| total_timesteps    | 4245500  |
| value_loss         | 0.000324 |
---------------------------------
---------------------------------
| explained_variance | -26.6    |
| fps                | 827      |
| nupdates           | 849200   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4246000  |
| value_loss         | 0.00574  |
---------------------------------
---------------------------------
| explained_variance | 0.813    |
| fps                | 827      |
| nupdates           | 849300   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.115   |
| fps                | 827      |
| nupdates           | 852000   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4260000  |
| value_loss         | 0.00015  |
---------------------------------
---------------------------------
| explained_variance | -1.8     |
| fps                | 827      |
| nupdates           | 852100   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4260500  |
| value_loss         | 0.00289  |
---------------------------------
---------------------------------
| explained_variance | 0.658    |
| fps                | 827      |
| nupdates           | 852200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4261000  |
| value_loss         | 0.000297 |
---------------------------------
---------------------------------
| explained_variance | -1.32    |
| fps                | 827      |
| nupdates           | 852300   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -4.63    |
| fps                | 826      |
| nupdates           | 855100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4275500  |
| value_loss         | 0.00118  |
---------------------------------
---------------------------------
| explained_variance | -30.7    |
| fps                | 826      |
| nupdates           | 855200   |
| policy_entropy     | 2.04     |
| total_timesteps    | 4276000  |
| value_loss         | 0.000311 |
---------------------------------
---------------------------------
| explained_variance | 0.92     |
| fps                | 826      |
| nupdates           | 855300   |
| policy_entropy     | 1.79     |
| total_timesteps    | 4276500  |
| value_loss         | 0.00218  |
---------------------------------
---------------------------------
| explained_variance | 0.937    |
| fps                | 826      |
| nupdates           | 855400   |
| policy_entropy     | 1.91     |
| total_timest

---------------------------------
| explained_variance | -35.3    |
| fps                | 826      |
| nupdates           | 858200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4291000  |
| value_loss         | 0.0279   |
---------------------------------
---------------------------------
| explained_variance | 0.976    |
| fps                | 826      |
| nupdates           | 858300   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4291500  |
| value_loss         | 6.33e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.944    |
| fps                | 826      |
| nupdates           | 858400   |
| policy_entropy     | 1.93     |
| total_timesteps    | 4292000  |
| value_loss         | 0.000196 |
---------------------------------
---------------------------------
| explained_variance | 0.923    |
| fps                | 826      |
| nupdates           | 858500   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.92     |
| fps                | 826      |
| nupdates           | 861200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4306000  |
| value_loss         | 3.47e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.22     |
| fps                | 826      |
| nupdates           | 861300   |
| policy_entropy     | 2.08     |
| total_timesteps    | 4306500  |
| value_loss         | 2.46e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.824    |
| fps                | 826      |
| nupdates           | 861400   |
| policy_entropy     | 2.08     |
| total_timesteps    | 4307000  |
| value_loss         | 6.31e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.763    |
| fps                | 826      |
| nupdates           | 861500   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -2.44    |
| fps                | 826      |
| nupdates           | 864300   |
| policy_entropy     | 2.03     |
| total_timesteps    | 4321500  |
| value_loss         | 5.07e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.32     |
| fps                | 826      |
| nupdates           | 864400   |
| policy_entropy     | 2.02     |
| total_timesteps    | 4322000  |
| value_loss         | 0.109    |
---------------------------------
---------------------------------
| explained_variance | 0.407    |
| fps                | 826      |
| nupdates           | 864500   |
| policy_entropy     | 2.04     |
| total_timesteps    | 4322500  |
| value_loss         | 0.148    |
---------------------------------
---------------------------------
| explained_variance | 0.87     |
| fps                | 826      |
| nupdates           | 864600   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.934    |
| fps                | 826      |
| nupdates           | 867300   |
| policy_entropy     | 2.08     |
| total_timesteps    | 4336500  |
| value_loss         | 3.5e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.503    |
| fps                | 826      |
| nupdates           | 867400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4337000  |
| value_loss         | 0.000146 |
---------------------------------
---------------------------------
| explained_variance | 0.998    |
| fps                | 826      |
| nupdates           | 867500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4337500  |
| value_loss         | 6.01e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.383    |
| fps                | 826      |
| nupdates           | 867600   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.443    |
| fps                | 825      |
| nupdates           | 870300   |
| policy_entropy     | 1.87     |
| total_timesteps    | 4351500  |
| value_loss         | 0.92     |
---------------------------------
---------------------------------
| explained_variance | 0.864    |
| fps                | 825      |
| nupdates           | 870400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4352000  |
| value_loss         | 3.24e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.281   |
| fps                | 825      |
| nupdates           | 870500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4352500  |
| value_loss         | 0.000264 |
---------------------------------
---------------------------------
| explained_variance | 0.971    |
| fps                | 825      |
| nupdates           | 870600   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.0236  |
| fps                | 826      |
| nupdates           | 873400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4367000  |
| value_loss         | 0.000193 |
---------------------------------
---------------------------------
| explained_variance | 0.671    |
| fps                | 826      |
| nupdates           | 873500   |
| policy_entropy     | 2.03     |
| total_timesteps    | 4367500  |
| value_loss         | 5.5e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.0604   |
| fps                | 826      |
| nupdates           | 873600   |
| policy_entropy     | 2.03     |
| total_timesteps    | 4368000  |
| value_loss         | 9.5e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.933    |
| fps                | 826      |
| nupdates           | 873700   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.979    |
| fps                | 825      |
| nupdates           | 876400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4382000  |
| value_loss         | 4.51e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.695    |
| fps                | 825      |
| nupdates           | 876500   |
| policy_entropy     | 1.98     |
| total_timesteps    | 4382500  |
| value_loss         | 0.00231  |
---------------------------------
---------------------------------
| explained_variance | 0.975    |
| fps                | 825      |
| nupdates           | 876600   |
| policy_entropy     | 2.04     |
| total_timesteps    | 4383000  |
| value_loss         | 2.37e-06 |
---------------------------------
---------------------------------
| explained_variance | -1.27    |
| fps                | 825      |
| nupdates           | 876700   |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | -0.0166  |
| fps                | 826      |
| nupdates           | 879500   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4397500  |
| value_loss         | 0.157    |
---------------------------------
---------------------------------
| explained_variance | -2.04    |
| fps                | 826      |
| nupdates           | 879600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4398000  |
| value_loss         | 2.85e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.997    |
| fps                | 826      |
| nupdates           | 879700   |
| policy_entropy     | 2.02     |
| total_timesteps    | 4398500  |
| value_loss         | 0.000221 |
---------------------------------
---------------------------------
| explained_variance | 0.993    |
| fps                | 826      |
| nupdates           | 879800   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.821    |
| fps                | 825      |
| nupdates           | 882500   |
| policy_entropy     | 2.04     |
| total_timesteps    | 4412500  |
| value_loss         | 0.000128 |
---------------------------------
---------------------------------
| explained_variance | 0.925    |
| fps                | 825      |
| nupdates           | 882600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4413000  |
| value_loss         | 2.76e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.091   |
| fps                | 825      |
| nupdates           | 882700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4413500  |
| value_loss         | 0.000181 |
---------------------------------
---------------------------------
| explained_variance | -0.066   |
| fps                | 825      |
| nupdates           | 882800   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.68     |
| fps                | 825      |
| nupdates           | 885500   |
| policy_entropy     | 2        |
| total_timesteps    | 4427500  |
| value_loss         | 0.000244 |
---------------------------------
---------------------------------
| explained_variance | 0.16     |
| fps                | 825      |
| nupdates           | 885600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4428000  |
| value_loss         | 3.5e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.351    |
| fps                | 825      |
| nupdates           | 885700   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4428500  |
| value_loss         | 1.55e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.198    |
| fps                | 825      |
| nupdates           | 885800   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.889    |
| fps                | 825      |
| nupdates           | 888600   |
| policy_entropy     | 2.08     |
| total_timesteps    | 4443000  |
| value_loss         | 2.34e-06 |
---------------------------------
---------------------------------
| explained_variance | -0.0193  |
| fps                | 825      |
| nupdates           | 888700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4443500  |
| value_loss         | 0.552    |
---------------------------------
---------------------------------
| explained_variance | -0.762   |
| fps                | 825      |
| nupdates           | 888800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4444000  |
| value_loss         | 0.000405 |
---------------------------------
---------------------------------
| explained_variance | 0.992    |
| fps                | 825      |
| nupdates           | 888900   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -1.54    |
| fps                | 825      |
| nupdates           | 891600   |
| policy_entropy     | 2.08     |
| total_timesteps    | 4458000  |
| value_loss         | 0.000248 |
---------------------------------
---------------------------------
| explained_variance | 0.539    |
| fps                | 825      |
| nupdates           | 891700   |
| policy_entropy     | 2.04     |
| total_timesteps    | 4458500  |
| value_loss         | 6.37e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.705   |
| fps                | 825      |
| nupdates           | 891800   |
| policy_entropy     | 2.04     |
| total_timesteps    | 4459000  |
| value_loss         | 0.00072  |
---------------------------------
---------------------------------
| explained_variance | 0.811    |
| fps                | 825      |
| nupdates           | 891900   |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | -0.187   |
| fps                | 825      |
| nupdates           | 894700   |
| policy_entropy     | 2.04     |
| total_timesteps    | 4473500  |
| value_loss         | 1.44e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.44     |
| fps                | 825      |
| nupdates           | 894800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4474000  |
| value_loss         | 0.000693 |
---------------------------------
---------------------------------
| explained_variance | 0.921    |
| fps                | 825      |
| nupdates           | 894900   |
| policy_entropy     | 2        |
| total_timesteps    | 4474500  |
| value_loss         | 9.87e-06 |
---------------------------------
Eval num_timesteps=4475000, episode_reward=-4.70 +/- 0.46
Episode length: 597.40 +/- 137.85
---------------------------------
| explained_variance | -63.9    |
| fps                | 8

---------------------------------
| explained_variance | 0.952    |
| fps                | 825      |
| nupdates           | 897700   |
| policy_entropy     | 2.04     |
| total_timesteps    | 4488500  |
| value_loss         | 0.000282 |
---------------------------------
---------------------------------
| explained_variance | 0.0972   |
| fps                | 825      |
| nupdates           | 897800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4489000  |
| value_loss         | 8.52e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.594    |
| fps                | 825      |
| nupdates           | 897900   |
| policy_entropy     | 2.08     |
| total_timesteps    | 4489500  |
| value_loss         | 6.29e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.489    |
| fps                | 825      |
| nupdates           | 898000   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.714    |
| fps                | 825      |
| nupdates           | 900700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4503500  |
| value_loss         | 0.000124 |
---------------------------------
---------------------------------
| explained_variance | 0.952    |
| fps                | 825      |
| nupdates           | 900800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4504000  |
| value_loss         | 9.98e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.553    |
| fps                | 825      |
| nupdates           | 900900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4504500  |
| value_loss         | 0.000528 |
---------------------------------
---------------------------------
| explained_variance | -0.838   |
| fps                | 825      |
| nupdates           | 901000   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.241    |
| fps                | 825      |
| nupdates           | 903800   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4519000  |
| value_loss         | 0.000297 |
---------------------------------
---------------------------------
| explained_variance | 0.942    |
| fps                | 825      |
| nupdates           | 903900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4519500  |
| value_loss         | 3.89e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.104   |
| fps                | 825      |
| nupdates           | 904000   |
| policy_entropy     | 1.91     |
| total_timesteps    | 4520000  |
| value_loss         | 0.000183 |
---------------------------------
---------------------------------
| explained_variance | -0.662   |
| fps                | 825      |
| nupdates           | 904100   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -0.0214  |
| fps                | 825      |
| nupdates           | 906800   |
| policy_entropy     | 2.03     |
| total_timesteps    | 4534000  |
| value_loss         | 0.166    |
---------------------------------
---------------------------------
| explained_variance | -2.59    |
| fps                | 825      |
| nupdates           | 906900   |
| policy_entropy     | 2.02     |
| total_timesteps    | 4534500  |
| value_loss         | 0.00206  |
---------------------------------
---------------------------------
| explained_variance | -1.38    |
| fps                | 825      |
| nupdates           | 907000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4535000  |
| value_loss         | 0.00858  |
---------------------------------
---------------------------------
| explained_variance | 0.241    |
| fps                | 825      |
| nupdates           | 907100   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.943    |
| fps                | 825      |
| nupdates           | 909900   |
| policy_entropy     | 2.03     |
| total_timesteps    | 4549500  |
| value_loss         | 1.48e-05 |
---------------------------------
Eval num_timesteps=4550000, episode_reward=-4.70 +/- 0.64
Episode length: 620.90 +/- 151.82
---------------------------------
| explained_variance | 0.988    |
| fps                | 824      |
| nupdates           | 910000   |
| policy_entropy     | 2.02     |
| total_timesteps    | 4550000  |
| value_loss         | 9.33e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.84     |
| fps                | 824      |
| nupdates           | 910100   |
| policy_entropy     | 2.03     |
| total_timesteps    | 4550500  |
| value_loss         | 4.6e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.375    |
| fps                | 8

---------------------------------
| explained_variance | 0.891    |
| fps                | 825      |
| nupdates           | 912900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4564500  |
| value_loss         | 2.74e-05 |
---------------------------------
---------------------------------
| explained_variance | -5.81    |
| fps                | 825      |
| nupdates           | 913000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4565000  |
| value_loss         | 0.000159 |
---------------------------------
---------------------------------
| explained_variance | -47.9    |
| fps                | 825      |
| nupdates           | 913100   |
| policy_entropy     | 2.04     |
| total_timesteps    | 4565500  |
| value_loss         | 0.00612  |
---------------------------------
---------------------------------
| explained_variance | 0.307    |
| fps                | 825      |
| nupdates           | 913200   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -1.21    |
| fps                | 824      |
| nupdates           | 915900   |
| policy_entropy     | 2.08     |
| total_timesteps    | 4579500  |
| value_loss         | 0.00086  |
---------------------------------
---------------------------------
| explained_variance | -11.6    |
| fps                | 825      |
| nupdates           | 916000   |
| policy_entropy     | 2.08     |
| total_timesteps    | 4580000  |
| value_loss         | 0.00329  |
---------------------------------
---------------------------------
| explained_variance | 0.345    |
| fps                | 825      |
| nupdates           | 916100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4580500  |
| value_loss         | 0.00037  |
---------------------------------
---------------------------------
| explained_variance | 0.992    |
| fps                | 825      |
| nupdates           | 916200   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.719    |
| fps                | 825      |
| nupdates           | 919000   |
| policy_entropy     | 2.04     |
| total_timesteps    | 4595000  |
| value_loss         | 8.96e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.802   |
| fps                | 825      |
| nupdates           | 919100   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4595500  |
| value_loss         | 0.000386 |
---------------------------------
---------------------------------
| explained_variance | -1.85    |
| fps                | 825      |
| nupdates           | 919200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4596000  |
| value_loss         | 0.000164 |
---------------------------------
---------------------------------
| explained_variance | -0.543   |
| fps                | 825      |
| nupdates           | 919300   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.769    |
| fps                | 825      |
| nupdates           | 922000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4610000  |
| value_loss         | 5.04e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.623    |
| fps                | 825      |
| nupdates           | 922100   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4610500  |
| value_loss         | 0.000253 |
---------------------------------
---------------------------------
| explained_variance | 0.922    |
| fps                | 825      |
| nupdates           | 922200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4611000  |
| value_loss         | 4.27e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.708    |
| fps                | 825      |
| nupdates           | 922300   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.981    |
| fps                | 824      |
| nupdates           | 925100   |
| policy_entropy     | 2.02     |
| total_timesteps    | 4625500  |
| value_loss         | 0.00442  |
---------------------------------
---------------------------------
| explained_variance | 0.272    |
| fps                | 824      |
| nupdates           | 925200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4626000  |
| value_loss         | 0.000522 |
---------------------------------
---------------------------------
| explained_variance | -0.55    |
| fps                | 824      |
| nupdates           | 925300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4626500  |
| value_loss         | 0.000283 |
---------------------------------
---------------------------------
| explained_variance | 0.77     |
| fps                | 824      |
| nupdates           | 925400   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.965    |
| fps                | 825      |
| nupdates           | 928200   |
| policy_entropy     | 2        |
| total_timesteps    | 4641000  |
| value_loss         | 1.18e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.342    |
| fps                | 825      |
| nupdates           | 928300   |
| policy_entropy     | 1.92     |
| total_timesteps    | 4641500  |
| value_loss         | 0.182    |
---------------------------------
---------------------------------
| explained_variance | -0.694   |
| fps                | 825      |
| nupdates           | 928400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4642000  |
| value_loss         | 0.000451 |
---------------------------------
---------------------------------
| explained_variance | 0.384    |
| fps                | 825      |
| nupdates           | 928500   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.0126   |
| fps                | 825      |
| nupdates           | 931200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4656000  |
| value_loss         | 4.01e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.787    |
| fps                | 825      |
| nupdates           | 931300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4656500  |
| value_loss         | 7.16e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.256    |
| fps                | 825      |
| nupdates           | 931400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4657000  |
| value_loss         | 0.000374 |
---------------------------------
---------------------------------
| explained_variance | 0.899    |
| fps                | 825      |
| nupdates           | 931500   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.949   |
| fps                | 825      |
| nupdates           | 934300   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4671500  |
| value_loss         | 9.35e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.857    |
| fps                | 825      |
| nupdates           | 934400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4672000  |
| value_loss         | 0.00366  |
---------------------------------
---------------------------------
| explained_variance | 0.313    |
| fps                | 825      |
| nupdates           | 934500   |
| policy_entropy     | 1.94     |
| total_timesteps    | 4672500  |
| value_loss         | 0.115    |
---------------------------------
---------------------------------
| explained_variance | 0.37     |
| fps                | 825      |
| nupdates           | 934600   |
| policy_entropy     | 2        |
| total_timest

---------------------------------
| explained_variance | 0.605    |
| fps                | 825      |
| nupdates           | 937300   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4686500  |
| value_loss         | 0.000299 |
---------------------------------
---------------------------------
| explained_variance | 0.871    |
| fps                | 825      |
| nupdates           | 937400   |
| policy_entropy     | 2.02     |
| total_timesteps    | 4687000  |
| value_loss         | 0.000163 |
---------------------------------
---------------------------------
| explained_variance | 0.109    |
| fps                | 825      |
| nupdates           | 937500   |
| policy_entropy     | 2.03     |
| total_timesteps    | 4687500  |
| value_loss         | 7.75e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.696    |
| fps                | 825      |
| nupdates           | 937600   |
| policy_entropy     | 2.01     |
| total_timest

---------------------------------
| explained_variance | 0.908    |
| fps                | 824      |
| nupdates           | 940300   |
| policy_entropy     | 2.04     |
| total_timesteps    | 4701500  |
| value_loss         | 0.000261 |
---------------------------------
---------------------------------
| explained_variance | -1.89    |
| fps                | 824      |
| nupdates           | 940400   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4702000  |
| value_loss         | 0.000343 |
---------------------------------
---------------------------------
| explained_variance | 0.296    |
| fps                | 824      |
| nupdates           | 940500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4702500  |
| value_loss         | 3.97e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.134    |
| fps                | 824      |
| nupdates           | 940600   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.914    |
| fps                | 825      |
| nupdates           | 943400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4717000  |
| value_loss         | 0.000139 |
---------------------------------
---------------------------------
| explained_variance | 0.908    |
| fps                | 825      |
| nupdates           | 943500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4717500  |
| value_loss         | 1.81e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.98     |
| fps                | 825      |
| nupdates           | 943600   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4718000  |
| value_loss         | 2.61e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.967    |
| fps                | 825      |
| nupdates           | 943700   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.268   |
| fps                | 824      |
| nupdates           | 946400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4732000  |
| value_loss         | 3.87e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.394    |
| fps                | 824      |
| nupdates           | 946500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4732500  |
| value_loss         | 0.000181 |
---------------------------------
---------------------------------
| explained_variance | 0.961    |
| fps                | 824      |
| nupdates           | 946600   |
| policy_entropy     | 2.08     |
| total_timesteps    | 4733000  |
| value_loss         | 6.99e-06 |
---------------------------------
---------------------------------
| explained_variance | -0.0686  |
| fps                | 824      |
| nupdates           | 946700   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.15    |
| fps                | 825      |
| nupdates           | 949500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4747500  |
| value_loss         | 0.000324 |
---------------------------------
---------------------------------
| explained_variance | 0.598    |
| fps                | 825      |
| nupdates           | 949600   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4748000  |
| value_loss         | 0.000329 |
---------------------------------
---------------------------------
| explained_variance | -0.494   |
| fps                | 825      |
| nupdates           | 949700   |
| policy_entropy     | 2.01     |
| total_timesteps    | 4748500  |
| value_loss         | 0.000317 |
---------------------------------
---------------------------------
| explained_variance | 0.114    |
| fps                | 825      |
| nupdates           | 949800   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.995    |
| fps                | 824      |
| nupdates           | 952500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4762500  |
| value_loss         | 4.05e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.785    |
| fps                | 824      |
| nupdates           | 952600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4763000  |
| value_loss         | 4.9e-06  |
---------------------------------
---------------------------------
| explained_variance | 0.879    |
| fps                | 824      |
| nupdates           | 952700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4763500  |
| value_loss         | 4.62e-05 |
---------------------------------
---------------------------------
| explained_variance | -4.34    |
| fps                | 824      |
| nupdates           | 952800   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -1.68    |
| fps                | 824      |
| nupdates           | 955500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4777500  |
| value_loss         | 0.000613 |
---------------------------------
----------------------------------
| explained_variance | -3.22e+03 |
| fps                | 824       |
| nupdates           | 955600    |
| policy_entropy     | 1.8       |
| total_timesteps    | 4778000   |
| value_loss         | 0.0997    |
----------------------------------
---------------------------------
| explained_variance | 0.936    |
| fps                | 824      |
| nupdates           | 955700   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4778500  |
| value_loss         | 8.54e-06 |
---------------------------------
---------------------------------
| explained_variance | -0.152   |
| fps                | 824      |
| nupdates           | 955800   |
| policy_entropy     | 2.06     |
| tota

---------------------------------
| explained_variance | -0.317   |
| fps                | 825      |
| nupdates           | 958600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4793000  |
| value_loss         | 3.21e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.768    |
| fps                | 825      |
| nupdates           | 958700   |
| policy_entropy     | 2.03     |
| total_timesteps    | 4793500  |
| value_loss         | 3.82e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.0169  |
| fps                | 825      |
| nupdates           | 958800   |
| policy_entropy     | 2.08     |
| total_timesteps    | 4794000  |
| value_loss         | 0.000142 |
---------------------------------
---------------------------------
| explained_variance | -38.8    |
| fps                | 825      |
| nupdates           | 958900   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.401    |
| fps                | 824      |
| nupdates           | 961600   |
| policy_entropy     | 2.08     |
| total_timesteps    | 4808000  |
| value_loss         | 0.00023  |
---------------------------------
---------------------------------
| explained_variance | -2.04    |
| fps                | 824      |
| nupdates           | 961700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4808500  |
| value_loss         | 0.000268 |
---------------------------------
---------------------------------
| explained_variance | -0.991   |
| fps                | 824      |
| nupdates           | 961800   |
| policy_entropy     | 2.08     |
| total_timesteps    | 4809000  |
| value_loss         | 0.0024   |
---------------------------------
---------------------------------
| explained_variance | -0.0935  |
| fps                | 824      |
| nupdates           | 961900   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.946    |
| fps                | 825      |
| nupdates           | 964700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4823500  |
| value_loss         | 1.24e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.997    |
| fps                | 825      |
| nupdates           | 964800   |
| policy_entropy     | 2.08     |
| total_timesteps    | 4824000  |
| value_loss         | 2.81e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.895    |
| fps                | 825      |
| nupdates           | 964900   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4824500  |
| value_loss         | 2.68e-05 |
---------------------------------
Eval num_timesteps=4825000, episode_reward=-4.80 +/- 0.60
Episode length: 791.90 +/- 189.28
---------------------------------
| explained_variance | 0.983    |
| fps                | 8

---------------------------------
| explained_variance | 0.857    |
| fps                | 824      |
| nupdates           | 967700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4838500  |
| value_loss         | 1.38e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.319    |
| fps                | 824      |
| nupdates           | 967800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4839000  |
| value_loss         | 0.000225 |
---------------------------------
---------------------------------
| explained_variance | -2.49    |
| fps                | 824      |
| nupdates           | 967900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4839500  |
| value_loss         | 0.000209 |
---------------------------------
---------------------------------
| explained_variance | 0.895    |
| fps                | 824      |
| nupdates           | 968000   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.253   |
| fps                | 824      |
| nupdates           | 970700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4853500  |
| value_loss         | 0.000524 |
---------------------------------
---------------------------------
| explained_variance | 0.882    |
| fps                | 824      |
| nupdates           | 970800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4854000  |
| value_loss         | 1.74e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.0151   |
| fps                | 824      |
| nupdates           | 970900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4854500  |
| value_loss         | 0.00049  |
---------------------------------
---------------------------------
| explained_variance | 0.97     |
| fps                | 824      |
| nupdates           | 971000   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.976    |
| fps                | 825      |
| nupdates           | 973800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4869000  |
| value_loss         | 3.74e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.64    |
| fps                | 825      |
| nupdates           | 973900   |
| policy_entropy     | 1.99     |
| total_timesteps    | 4869500  |
| value_loss         | 0.000877 |
---------------------------------
---------------------------------
| explained_variance | 0.482    |
| fps                | 825      |
| nupdates           | 974000   |
| policy_entropy     | 1.99     |
| total_timesteps    | 4870000  |
| value_loss         | 0.000282 |
---------------------------------
---------------------------------
| explained_variance | -1.24    |
| fps                | 825      |
| nupdates           | 974100   |
| policy_entropy     | 1.87     |
| total_timest

---------------------------------
| explained_variance | -0.851   |
| fps                | 824      |
| nupdates           | 976800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4884000  |
| value_loss         | 0.00081  |
---------------------------------
---------------------------------
| explained_variance | -15      |
| fps                | 824      |
| nupdates           | 976900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4884500  |
| value_loss         | 0.00655  |
---------------------------------
---------------------------------
| explained_variance | -0.998   |
| fps                | 824      |
| nupdates           | 977000   |
| policy_entropy     | 1.99     |
| total_timesteps    | 4885000  |
| value_loss         | 0.00303  |
---------------------------------
---------------------------------
| explained_variance | -0.827   |
| fps                | 824      |
| nupdates           | 977100   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.889    |
| fps                | 825      |
| nupdates           | 979900   |
| policy_entropy     | 2.04     |
| total_timesteps    | 4899500  |
| value_loss         | 5.95e-06 |
---------------------------------
Eval num_timesteps=4900000, episode_reward=-4.80 +/- 0.40
Episode length: 608.60 +/- 132.10
---------------------------------
| explained_variance | -5.37    |
| fps                | 824      |
| nupdates           | 980000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4900000  |
| value_loss         | 0.00275  |
---------------------------------
---------------------------------
| explained_variance | -22      |
| fps                | 824      |
| nupdates           | 980100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4900500  |
| value_loss         | 0.000793 |
---------------------------------
---------------------------------
| explained_variance | 0.91     |
| fps                | 8

---------------------------------
| explained_variance | 0.961    |
| fps                | 825      |
| nupdates           | 982900   |
| policy_entropy     | 2.04     |
| total_timesteps    | 4914500  |
| value_loss         | 2.98e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.749    |
| fps                | 825      |
| nupdates           | 983000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4915000  |
| value_loss         | 3.1e-05  |
---------------------------------
---------------------------------
| explained_variance | -3.21    |
| fps                | 825      |
| nupdates           | 983100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4915500  |
| value_loss         | 0.43     |
---------------------------------
---------------------------------
| explained_variance | 0.972    |
| fps                | 825      |
| nupdates           | 983200   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -1.1e+03 |
| fps                | 824      |
| nupdates           | 985900   |
| policy_entropy     | 1.89     |
| total_timesteps    | 4929500  |
| value_loss         | 0.065    |
---------------------------------
---------------------------------
| explained_variance | 0.81     |
| fps                | 824      |
| nupdates           | 986000   |
| policy_entropy     | 2        |
| total_timesteps    | 4930000  |
| value_loss         | 0.000278 |
---------------------------------
---------------------------------
| explained_variance | 0.959    |
| fps                | 824      |
| nupdates           | 986100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4930500  |
| value_loss         | 5.57e-06 |
---------------------------------
---------------------------------
| explained_variance | -0.697   |
| fps                | 824      |
| nupdates           | 986200   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.376    |
| fps                | 825      |
| nupdates           | 989000   |
| policy_entropy     | 2.05     |
| total_timesteps    | 4945000  |
| value_loss         | 0.000304 |
---------------------------------
---------------------------------
| explained_variance | -0.461   |
| fps                | 825      |
| nupdates           | 989100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4945500  |
| value_loss         | 0.000472 |
---------------------------------
---------------------------------
| explained_variance | 0.986    |
| fps                | 825      |
| nupdates           | 989200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4946000  |
| value_loss         | 2.66e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.973    |
| fps                | 825      |
| nupdates           | 989300   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.748    |
| fps                | 824      |
| nupdates           | 992000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4960000  |
| value_loss         | 0.000132 |
---------------------------------
---------------------------------
| explained_variance | 0.863    |
| fps                | 824      |
| nupdates           | 992100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4960500  |
| value_loss         | 7.67e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.754    |
| fps                | 824      |
| nupdates           | 992200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4961000  |
| value_loss         | 7.1e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.802    |
| fps                | 824      |
| nupdates           | 992300   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.105    |
| fps                | 824      |
| nupdates           | 995100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4975500  |
| value_loss         | 9.01e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.321    |
| fps                | 824      |
| nupdates           | 995200   |
| policy_entropy     | 1.81     |
| total_timesteps    | 4976000  |
| value_loss         | 0.000127 |
---------------------------------
---------------------------------
| explained_variance | -7.58    |
| fps                | 824      |
| nupdates           | 995300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4976500  |
| value_loss         | 0.000363 |
---------------------------------
---------------------------------
| explained_variance | -4.47    |
| fps                | 824      |
| nupdates           | 995400   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.352    |
| fps                | 824      |
| nupdates           | 998200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 4991000  |
| value_loss         | 0.000253 |
---------------------------------
---------------------------------
| explained_variance | 0.913    |
| fps                | 824      |
| nupdates           | 998300   |
| policy_entropy     | 2.06     |
| total_timesteps    | 4991500  |
| value_loss         | 2.34e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.293    |
| fps                | 824      |
| nupdates           | 998400   |
| policy_entropy     | 2.03     |
| total_timesteps    | 4992000  |
| value_loss         | 2.55e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.807    |
| fps                | 824      |
| nupdates           | 998500   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.979    |
| fps                | 824      |
| nupdates           | 1001200  |
| policy_entropy     | 2.01     |
| total_timesteps    | 5006000  |
| value_loss         | 1.56e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.885    |
| fps                | 824      |
| nupdates           | 1001300  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5006500  |
| value_loss         | 8.44e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.158    |
| fps                | 824      |
| nupdates           | 1001400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5007000  |
| value_loss         | 0.000543 |
---------------------------------
---------------------------------
| explained_variance | 0.959    |
| fps                | 824      |
| nupdates           | 1001500  |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | -0.44    |
| fps                | 824      |
| nupdates           | 1004300  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5021500  |
| value_loss         | 0.000101 |
---------------------------------
---------------------------------
| explained_variance | 0.831    |
| fps                | 824      |
| nupdates           | 1004400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5022000  |
| value_loss         | 9.6e-06  |
---------------------------------
---------------------------------
| explained_variance | 0.163    |
| fps                | 824      |
| nupdates           | 1004500  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5022500  |
| value_loss         | 2.97e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.848    |
| fps                | 824      |
| nupdates           | 1004600  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.287    |
| fps                | 824      |
| nupdates           | 1007300  |
| policy_entropy     | 1.87     |
| total_timesteps    | 5036500  |
| value_loss         | 0.000448 |
---------------------------------
---------------------------------
| explained_variance | -34.1    |
| fps                | 824      |
| nupdates           | 1007400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5037000  |
| value_loss         | 0.00198  |
---------------------------------
---------------------------------
| explained_variance | 0.996    |
| fps                | 824      |
| nupdates           | 1007500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5037500  |
| value_loss         | 3.08e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.989    |
| fps                | 824      |
| nupdates           | 1007600  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.83     |
| fps                | 824      |
| nupdates           | 1010300  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5051500  |
| value_loss         | 3.87e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.724    |
| fps                | 824      |
| nupdates           | 1010400  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5052000  |
| value_loss         | 4.02e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.986    |
| fps                | 824      |
| nupdates           | 1010500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5052500  |
| value_loss         | 2.38e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.913    |
| fps                | 824      |
| nupdates           | 1010600  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -1.2     |
| fps                | 824      |
| nupdates           | 1013400  |
| policy_entropy     | 2.04     |
| total_timesteps    | 5067000  |
| value_loss         | 5.79e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.572    |
| fps                | 824      |
| nupdates           | 1013500  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5067500  |
| value_loss         | 9.96e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.252    |
| fps                | 824      |
| nupdates           | 1013600  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5068000  |
| value_loss         | 3.71e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.432    |
| fps                | 824      |
| nupdates           | 1013700  |
| policy_entropy     | 1.26     |
| total_timest

---------------------------------
| explained_variance | -0.258   |
| fps                | 824      |
| nupdates           | 1016400  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5082000  |
| value_loss         | 0.000231 |
---------------------------------
---------------------------------
| explained_variance | 0.843    |
| fps                | 824      |
| nupdates           | 1016500  |
| policy_entropy     | 2.04     |
| total_timesteps    | 5082500  |
| value_loss         | 4.36e-05 |
---------------------------------
---------------------------------
| explained_variance | -4.75    |
| fps                | 824      |
| nupdates           | 1016600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5083000  |
| value_loss         | 0.00013  |
---------------------------------
---------------------------------
| explained_variance | 0.413    |
| fps                | 824      |
| nupdates           | 1016700  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.433    |
| fps                | 824      |
| nupdates           | 1019500  |
| policy_entropy     | 1.42     |
| total_timesteps    | 5097500  |
| value_loss         | 0.136    |
---------------------------------
---------------------------------
| explained_variance | 0.473    |
| fps                | 824      |
| nupdates           | 1019600  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5098000  |
| value_loss         | 6.24e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.23    |
| fps                | 824      |
| nupdates           | 1019700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5098500  |
| value_loss         | 0.00088  |
---------------------------------
---------------------------------
| explained_variance | -3.2e+04 |
| fps                | 824      |
| nupdates           | 1019800  |
| policy_entropy     | 1.95     |
| total_timest

---------------------------------
| explained_variance | 0.838    |
| fps                | 824      |
| nupdates           | 1022500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5112500  |
| value_loss         | 8.1e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.517    |
| fps                | 824      |
| nupdates           | 1022600  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5113000  |
| value_loss         | 3.06e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.341   |
| fps                | 824      |
| nupdates           | 1022700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5113500  |
| value_loss         | 0.000122 |
---------------------------------
---------------------------------
| explained_variance | 0.984    |
| fps                | 824      |
| nupdates           | 1022800  |
| policy_entropy     | 2.01     |
| total_timest

---------------------------------
| explained_variance | -0.286   |
| fps                | 824      |
| nupdates           | 1025500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5127500  |
| value_loss         | 0.000373 |
---------------------------------
---------------------------------
| explained_variance | 0.215    |
| fps                | 824      |
| nupdates           | 1025600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5128000  |
| value_loss         | 3.79e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.643    |
| fps                | 824      |
| nupdates           | 1025700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5128500  |
| value_loss         | 0.000112 |
---------------------------------
---------------------------------
| explained_variance | 0.354    |
| fps                | 824      |
| nupdates           | 1025800  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.985    |
| fps                | 824      |
| nupdates           | 1028600  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5143000  |
| value_loss         | 1.12e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.976    |
| fps                | 824      |
| nupdates           | 1028700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5143500  |
| value_loss         | 6.77e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.912    |
| fps                | 824      |
| nupdates           | 1028800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5144000  |
| value_loss         | 2.87e-05 |
---------------------------------
---------------------------------
| explained_variance | -28      |
| fps                | 824      |
| nupdates           | 1028900  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -2.39    |
| fps                | 824      |
| nupdates           | 1031600  |
| policy_entropy     | 1.98     |
| total_timesteps    | 5158000  |
| value_loss         | 0.0011   |
---------------------------------
---------------------------------
| explained_variance | 0.596    |
| fps                | 824      |
| nupdates           | 1031700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5158500  |
| value_loss         | 7.71e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.97     |
| fps                | 824      |
| nupdates           | 1031800  |
| policy_entropy     | 1.94     |
| total_timesteps    | 5159000  |
| value_loss         | 9.06e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.901    |
| fps                | 824      |
| nupdates           | 1031900  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.995    |
| fps                | 824      |
| nupdates           | 1034700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5173500  |
| value_loss         | 0.000137 |
---------------------------------
---------------------------------
| explained_variance | -0.487   |
| fps                | 824      |
| nupdates           | 1034800  |
| policy_entropy     | 2.04     |
| total_timesteps    | 5174000  |
| value_loss         | 0.00102  |
---------------------------------
---------------------------------
| explained_variance | 0.922    |
| fps                | 824      |
| nupdates           | 1034900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5174500  |
| value_loss         | 2.13e-05 |
---------------------------------
Eval num_timesteps=5175000, episode_reward=-4.70 +/- 0.46
Episode length: 600.90 +/- 83.73
---------------------------------
| explained_variance | -0.0563  |
| fps                | 82

---------------------------------
| explained_variance | -1.62    |
| fps                | 824      |
| nupdates           | 1037700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5188500  |
| value_loss         | 0.000488 |
---------------------------------
---------------------------------
| explained_variance | 0.438    |
| fps                | 824      |
| nupdates           | 1037800  |
| policy_entropy     | 1.99     |
| total_timesteps    | 5189000  |
| value_loss         | 0.13     |
---------------------------------
---------------------------------
| explained_variance | 0.991    |
| fps                | 824      |
| nupdates           | 1037900  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5189500  |
| value_loss         | 2.17e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.392   |
| fps                | 824      |
| nupdates           | 1038000  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.843    |
| fps                | 824      |
| nupdates           | 1040700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5203500  |
| value_loss         | 1.33e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.398    |
| fps                | 824      |
| nupdates           | 1040800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5204000  |
| value_loss         | 5.42e-05 |
---------------------------------
---------------------------------
| explained_variance | 1        |
| fps                | 824      |
| nupdates           | 1040900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5204500  |
| value_loss         | 1.21e-07 |
---------------------------------
---------------------------------
| explained_variance | -5.11    |
| fps                | 824      |
| nupdates           | 1041000  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.918    |
| fps                | 824      |
| nupdates           | 1043800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5219000  |
| value_loss         | 3.78e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.172    |
| fps                | 824      |
| nupdates           | 1043900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5219500  |
| value_loss         | 0.000417 |
---------------------------------
---------------------------------
| explained_variance | 0.996    |
| fps                | 824      |
| nupdates           | 1044000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5220000  |
| value_loss         | 3.54e-06 |
---------------------------------
---------------------------------
| explained_variance | -3.95    |
| fps                | 824      |
| nupdates           | 1044100  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.672    |
| fps                | 824      |
| nupdates           | 1046800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5234000  |
| value_loss         | 3.29e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.998    |
| fps                | 824      |
| nupdates           | 1046900  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5234500  |
| value_loss         | 4.74e-07 |
---------------------------------
---------------------------------
| explained_variance | -0.273   |
| fps                | 824      |
| nupdates           | 1047000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5235000  |
| value_loss         | 0.000208 |
---------------------------------
---------------------------------
| explained_variance | 0.52     |
| fps                | 824      |
| nupdates           | 1047100  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.345    |
| fps                | 824      |
| nupdates           | 1049900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5249500  |
| value_loss         | 1.12e-05 |
---------------------------------
Eval num_timesteps=5250000, episode_reward=-4.80 +/- 0.60
Episode length: 610.10 +/- 109.96
---------------------------------
| explained_variance | -0.793   |
| fps                | 824      |
| nupdates           | 1050000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5250000  |
| value_loss         | 0.00032  |
---------------------------------
---------------------------------
| explained_variance | 0.133    |
| fps                | 824      |
| nupdates           | 1050100  |
| policy_entropy     | 2.04     |
| total_timesteps    | 5250500  |
| value_loss         | 0.000227 |
---------------------------------
---------------------------------
| explained_variance | 0.758    |
| fps                | 8

---------------------------------
| explained_variance | 0.754    |
| fps                | 824      |
| nupdates           | 1052900  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5264500  |
| value_loss         | 6.08e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.617    |
| fps                | 824      |
| nupdates           | 1053000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5265000  |
| value_loss         | 0.000405 |
---------------------------------
---------------------------------
| explained_variance | -0.107   |
| fps                | 824      |
| nupdates           | 1053100  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5265500  |
| value_loss         | 0.000169 |
---------------------------------
---------------------------------
| explained_variance | 0.958    |
| fps                | 824      |
| nupdates           | 1053200  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.941    |
| fps                | 824      |
| nupdates           | 1055900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5279500  |
| value_loss         | 3.49e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.391   |
| fps                | 824      |
| nupdates           | 1056000  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5280000  |
| value_loss         | 0.000292 |
---------------------------------
---------------------------------
| explained_variance | -8.85    |
| fps                | 824      |
| nupdates           | 1056100  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5280500  |
| value_loss         | 1.08     |
---------------------------------
---------------------------------
| explained_variance | -16.9    |
| fps                | 824      |
| nupdates           | 1056200  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.778    |
| fps                | 824      |
| nupdates           | 1059000  |
| policy_entropy     | 2.02     |
| total_timesteps    | 5295000  |
| value_loss         | 0.000105 |
---------------------------------
---------------------------------
| explained_variance | 0.841    |
| fps                | 824      |
| nupdates           | 1059100  |
| policy_entropy     | 2.03     |
| total_timesteps    | 5295500  |
| value_loss         | 6.21e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.615   |
| fps                | 824      |
| nupdates           | 1059200  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5296000  |
| value_loss         | 0.000432 |
---------------------------------
---------------------------------
| explained_variance | -0.855   |
| fps                | 824      |
| nupdates           | 1059300  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.931    |
| fps                | 824      |
| nupdates           | 1062000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5310000  |
| value_loss         | 9.04e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.98     |
| fps                | 824      |
| nupdates           | 1062100  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5310500  |
| value_loss         | 1.9e-05  |
---------------------------------
---------------------------------
| explained_variance | -0.165   |
| fps                | 824      |
| nupdates           | 1062200  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5311000  |
| value_loss         | 8.41e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.32     |
| fps                | 824      |
| nupdates           | 1062300  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -1.4     |
| fps                | 824      |
| nupdates           | 1065100  |
| policy_entropy     | 2.04     |
| total_timesteps    | 5325500  |
| value_loss         | 0.00087  |
---------------------------------
---------------------------------
| explained_variance | 0.798    |
| fps                | 824      |
| nupdates           | 1065200  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5326000  |
| value_loss         | 3.13e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.56    |
| fps                | 824      |
| nupdates           | 1065300  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5326500  |
| value_loss         | 0.000291 |
---------------------------------
---------------------------------
| explained_variance | 0.668    |
| fps                | 824      |
| nupdates           | 1065400  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.826    |
| fps                | 824      |
| nupdates           | 1068200  |
| policy_entropy     | 2.03     |
| total_timesteps    | 5341000  |
| value_loss         | 1.35e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.11    |
| fps                | 824      |
| nupdates           | 1068300  |
| policy_entropy     | 2.04     |
| total_timesteps    | 5341500  |
| value_loss         | 0.000285 |
---------------------------------
---------------------------------
| explained_variance | 0.0414   |
| fps                | 824      |
| nupdates           | 1068400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5342000  |
| value_loss         | 0.000293 |
---------------------------------
---------------------------------
| explained_variance | -70.1    |
| fps                | 824      |
| nupdates           | 1068500  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.805    |
| fps                | 824      |
| nupdates           | 1071200  |
| policy_entropy     | 2.04     |
| total_timesteps    | 5356000  |
| value_loss         | 3.69e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.381    |
| fps                | 824      |
| nupdates           | 1071300  |
| policy_entropy     | 2.04     |
| total_timesteps    | 5356500  |
| value_loss         | 7.94e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.0205  |
| fps                | 824      |
| nupdates           | 1071400  |
| policy_entropy     | 1.68     |
| total_timesteps    | 5357000  |
| value_loss         | 0.172    |
---------------------------------
---------------------------------
| explained_variance | 0.0981   |
| fps                | 824      |
| nupdates           | 1071500  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.515    |
| fps                | 824      |
| nupdates           | 1074300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5371500  |
| value_loss         | 0.00019  |
---------------------------------
---------------------------------
| explained_variance | -11.7    |
| fps                | 824      |
| nupdates           | 1074400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5372000  |
| value_loss         | 0.00121  |
---------------------------------
---------------------------------
| explained_variance | -0.322   |
| fps                | 824      |
| nupdates           | 1074500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5372500  |
| value_loss         | 6.83e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.634    |
| fps                | 824      |
| nupdates           | 1074600  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -3.81    |
| fps                | 824      |
| nupdates           | 1077300  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5386500  |
| value_loss         | 0.00025  |
---------------------------------
---------------------------------
| explained_variance | -0.0977  |
| fps                | 824      |
| nupdates           | 1077400  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5387000  |
| value_loss         | 0.000517 |
---------------------------------
---------------------------------
| explained_variance | -61.9    |
| fps                | 824      |
| nupdates           | 1077500  |
| policy_entropy     | 2.03     |
| total_timesteps    | 5387500  |
| value_loss         | 0.00195  |
---------------------------------
---------------------------------
| explained_variance | 0.255    |
| fps                | 824      |
| nupdates           | 1077600  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -0.315   |
| fps                | 823      |
| nupdates           | 1080300  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5401500  |
| value_loss         | 0.000434 |
---------------------------------
---------------------------------
| explained_variance | 0.989    |
| fps                | 823      |
| nupdates           | 1080400  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5402000  |
| value_loss         | 3.43e-06 |
---------------------------------
---------------------------------
| explained_variance | -0.915   |
| fps                | 823      |
| nupdates           | 1080500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5402500  |
| value_loss         | 8.42e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.96     |
| fps                | 823      |
| nupdates           | 1080600  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.864    |
| fps                | 823      |
| nupdates           | 1083400  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5417000  |
| value_loss         | 3.45e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.634    |
| fps                | 823      |
| nupdates           | 1083500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5417500  |
| value_loss         | 9.85e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.763    |
| fps                | 823      |
| nupdates           | 1083600  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5418000  |
| value_loss         | 0.000512 |
---------------------------------
---------------------------------
| explained_variance | 0.728    |
| fps                | 823      |
| nupdates           | 1083700  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.102   |
| fps                | 823      |
| nupdates           | 1086400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5432000  |
| value_loss         | 0.000187 |
---------------------------------
---------------------------------
| explained_variance | 0.81     |
| fps                | 823      |
| nupdates           | 1086500  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5432500  |
| value_loss         | 9.41e-06 |
---------------------------------
---------------------------------
| explained_variance | -4.03    |
| fps                | 823      |
| nupdates           | 1086600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5433000  |
| value_loss         | 5.49e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.135    |
| fps                | 823      |
| nupdates           | 1086700  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -4.37    |
| fps                | 824      |
| nupdates           | 1089500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5447500  |
| value_loss         | 0.000243 |
---------------------------------
---------------------------------
| explained_variance | 0.776    |
| fps                | 824      |
| nupdates           | 1089600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5448000  |
| value_loss         | 0.00023  |
---------------------------------
---------------------------------
| explained_variance | 0.68     |
| fps                | 824      |
| nupdates           | 1089700  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5448500  |
| value_loss         | 2.27e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.424    |
| fps                | 824      |
| nupdates           | 1089800  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -1.7     |
| fps                | 823      |
| nupdates           | 1092500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5462500  |
| value_loss         | 0.00184  |
---------------------------------
---------------------------------
| explained_variance | 0.317    |
| fps                | 823      |
| nupdates           | 1092600  |
| policy_entropy     | 1.18     |
| total_timesteps    | 5463000  |
| value_loss         | 0.194    |
---------------------------------
---------------------------------
| explained_variance | 0.958    |
| fps                | 823      |
| nupdates           | 1092700  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5463500  |
| value_loss         | 5.26e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.583    |
| fps                | 823      |
| nupdates           | 1092800  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.941    |
| fps                | 823      |
| nupdates           | 1095500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5477500  |
| value_loss         | 2.11e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.156    |
| fps                | 823      |
| nupdates           | 1095600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5478000  |
| value_loss         | 0.000145 |
---------------------------------
---------------------------------
| explained_variance | 0.898    |
| fps                | 823      |
| nupdates           | 1095700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5478500  |
| value_loss         | 0.000116 |
---------------------------------
---------------------------------
| explained_variance | 0.899    |
| fps                | 823      |
| nupdates           | 1095800  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.0972   |
| fps                | 823      |
| nupdates           | 1098600  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5493000  |
| value_loss         | 0.000416 |
---------------------------------
---------------------------------
| explained_variance | -1.42    |
| fps                | 823      |
| nupdates           | 1098700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5493500  |
| value_loss         | 0.000172 |
---------------------------------
---------------------------------
| explained_variance | 0.991    |
| fps                | 823      |
| nupdates           | 1098800  |
| policy_entropy     | 2.04     |
| total_timesteps    | 5494000  |
| value_loss         | 3.55e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.991    |
| fps                | 823      |
| nupdates           | 1098900  |
| policy_entropy     | 2.02     |
| total_timest

---------------------------------
| explained_variance | -1.4     |
| fps                | 823      |
| nupdates           | 1101600  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5508000  |
| value_loss         | 0.000704 |
---------------------------------
---------------------------------
| explained_variance | 0.838    |
| fps                | 823      |
| nupdates           | 1101700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5508500  |
| value_loss         | 3.14e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.223    |
| fps                | 823      |
| nupdates           | 1101800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5509000  |
| value_loss         | 5.44e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.972    |
| fps                | 823      |
| nupdates           | 1101900  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.884    |
| fps                | 823      |
| nupdates           | 1104700  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5523500  |
| value_loss         | 0.000184 |
---------------------------------
---------------------------------
| explained_variance | 0.355    |
| fps                | 823      |
| nupdates           | 1104800  |
| policy_entropy     | 2.03     |
| total_timesteps    | 5524000  |
| value_loss         | 0.00086  |
---------------------------------
---------------------------------
| explained_variance | 0.635    |
| fps                | 823      |
| nupdates           | 1104900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5524500  |
| value_loss         | 0.00015  |
---------------------------------
Eval num_timesteps=5525000, episode_reward=-4.90 +/- 0.30
Episode length: 617.00 +/- 78.83
---------------------------------
| explained_variance | 0.651    |
| fps                | 82

---------------------------------
| explained_variance | 0.502    |
| fps                | 823      |
| nupdates           | 1107700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5538500  |
| value_loss         | 4.79e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.799    |
| fps                | 823      |
| nupdates           | 1107800  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5539000  |
| value_loss         | 0.0002   |
---------------------------------
---------------------------------
| explained_variance | 0.964    |
| fps                | 823      |
| nupdates           | 1107900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5539500  |
| value_loss         | 2.16e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.749    |
| fps                | 823      |
| nupdates           | 1108000  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -1.02    |
| fps                | 822      |
| nupdates           | 1110700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5553500  |
| value_loss         | 0.000596 |
---------------------------------
---------------------------------
| explained_variance | -2.55    |
| fps                | 822      |
| nupdates           | 1110800  |
| policy_entropy     | 2.04     |
| total_timesteps    | 5554000  |
| value_loss         | 0.000216 |
---------------------------------
---------------------------------
| explained_variance | -1.29    |
| fps                | 822      |
| nupdates           | 1110900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5554500  |
| value_loss         | 0.000307 |
---------------------------------
---------------------------------
| explained_variance | 0.686    |
| fps                | 822      |
| nupdates           | 1111000  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.906    |
| fps                | 823      |
| nupdates           | 1113800  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5569000  |
| value_loss         | 3.41e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.256    |
| fps                | 823      |
| nupdates           | 1113900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5569500  |
| value_loss         | 0.000118 |
---------------------------------
---------------------------------
| explained_variance | -216     |
| fps                | 823      |
| nupdates           | 1114000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5570000  |
| value_loss         | 0.0167   |
---------------------------------
---------------------------------
| explained_variance | 0.919    |
| fps                | 823      |
| nupdates           | 1114100  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.000514 |
| fps                | 822      |
| nupdates           | 1116800  |
| policy_entropy     | 2.04     |
| total_timesteps    | 5584000  |
| value_loss         | 0.00207  |
---------------------------------
---------------------------------
| explained_variance | 0.647    |
| fps                | 822      |
| nupdates           | 1116900  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5584500  |
| value_loss         | 7.69e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.99     |
| fps                | 822      |
| nupdates           | 1117000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5585000  |
| value_loss         | 4.98e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.345    |
| fps                | 822      |
| nupdates           | 1117100  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.89     |
| fps                | 823      |
| nupdates           | 1119900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5599500  |
| value_loss         | 0.000113 |
---------------------------------
Eval num_timesteps=5600000, episode_reward=-4.90 +/- 0.30
Episode length: 624.30 +/- 78.12
---------------------------------
| explained_variance | 0.613    |
| fps                | 822      |
| nupdates           | 1120000  |
| policy_entropy     | 2.03     |
| total_timesteps    | 5600000  |
| value_loss         | 0.000125 |
---------------------------------
---------------------------------
| explained_variance | -0.139   |
| fps                | 822      |
| nupdates           | 1120100  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5600500  |
| value_loss         | 0.000242 |
---------------------------------
---------------------------------
| explained_variance | -0.801   |
| fps                | 82

---------------------------------
| explained_variance | 0.0707   |
| fps                | 822      |
| nupdates           | 1122900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5614500  |
| value_loss         | 1.44e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.865    |
| fps                | 822      |
| nupdates           | 1123000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5615000  |
| value_loss         | 1.84e-06 |
---------------------------------
---------------------------------
| explained_variance | -0.823   |
| fps                | 822      |
| nupdates           | 1123100  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5615500  |
| value_loss         | 0.000197 |
---------------------------------
---------------------------------
| explained_variance | 0.982    |
| fps                | 822      |
| nupdates           | 1123200  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.837    |
| fps                | 822      |
| nupdates           | 1125900  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5629500  |
| value_loss         | 5.48e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.734    |
| fps                | 822      |
| nupdates           | 1126000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5630000  |
| value_loss         | 0.000206 |
---------------------------------
---------------------------------
| explained_variance | 0.918    |
| fps                | 822      |
| nupdates           | 1126100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5630500  |
| value_loss         | 2.36e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.72     |
| fps                | 822      |
| nupdates           | 1126200  |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | -1.17    |
| fps                | 823      |
| nupdates           | 1129000  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5645000  |
| value_loss         | 0.000558 |
---------------------------------
---------------------------------
| explained_variance | -3.25    |
| fps                | 823      |
| nupdates           | 1129100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5645500  |
| value_loss         | 0.00033  |
---------------------------------
---------------------------------
| explained_variance | -55.8    |
| fps                | 823      |
| nupdates           | 1129200  |
| policy_entropy     | 2.04     |
| total_timesteps    | 5646000  |
| value_loss         | 0.0134   |
---------------------------------
---------------------------------
| explained_variance | 0.994    |
| fps                | 823      |
| nupdates           | 1129300  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.396    |
| fps                | 823      |
| nupdates           | 1132000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5660000  |
| value_loss         | 2.46e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.37    |
| fps                | 823      |
| nupdates           | 1132100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5660500  |
| value_loss         | 0.000118 |
---------------------------------
---------------------------------
| explained_variance | -35.1    |
| fps                | 823      |
| nupdates           | 1132200  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5661000  |
| value_loss         | 0.00272  |
---------------------------------
---------------------------------
| explained_variance | 0.92     |
| fps                | 823      |
| nupdates           | 1132300  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.0254  |
| fps                | 822      |
| nupdates           | 1135100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5675500  |
| value_loss         | 4.54e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.317    |
| fps                | 822      |
| nupdates           | 1135200  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5676000  |
| value_loss         | 0.000261 |
---------------------------------
---------------------------------
| explained_variance | 0.914    |
| fps                | 822      |
| nupdates           | 1135300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5676500  |
| value_loss         | 2.46e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.95     |
| fps                | 822      |
| nupdates           | 1135400  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.00934 |
| fps                | 823      |
| nupdates           | 1138200  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5691000  |
| value_loss         | 9.94e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.876    |
| fps                | 823      |
| nupdates           | 1138300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5691500  |
| value_loss         | 9.73e-05 |
---------------------------------
----------------------------------
| explained_variance | -1.06e+03 |
| fps                | 823       |
| nupdates           | 1138400   |
| policy_entropy     | 2.04      |
| total_timesteps    | 5692000   |
| value_loss         | 0.0712    |
----------------------------------
---------------------------------
| explained_variance | 0.968    |
| fps                | 823      |
| nupdates           | 1138500  |
| policy_entropy     | 2.07     |
| tota

---------------------------------
| explained_variance | 0.554    |
| fps                | 822      |
| nupdates           | 1141200  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5706000  |
| value_loss         | 0.000212 |
---------------------------------
---------------------------------
| explained_variance | -7.62    |
| fps                | 822      |
| nupdates           | 1141300  |
| policy_entropy     | 2.01     |
| total_timesteps    | 5706500  |
| value_loss         | 0.00144  |
---------------------------------
---------------------------------
| explained_variance | 0.858    |
| fps                | 822      |
| nupdates           | 1141400  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5707000  |
| value_loss         | 1.93e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.00435  |
| fps                | 822      |
| nupdates           | 1141500  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.693    |
| fps                | 823      |
| nupdates           | 1144300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5721500  |
| value_loss         | 0.000111 |
---------------------------------
---------------------------------
| explained_variance | -1.03    |
| fps                | 823      |
| nupdates           | 1144400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5722000  |
| value_loss         | 0.000544 |
---------------------------------
---------------------------------
| explained_variance | 0.587    |
| fps                | 823      |
| nupdates           | 1144500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5722500  |
| value_loss         | 0.000433 |
---------------------------------
---------------------------------
| explained_variance | 0.233    |
| fps                | 823      |
| nupdates           | 1144600  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.951    |
| fps                | 822      |
| nupdates           | 1147300  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5736500  |
| value_loss         | 7.42e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.825    |
| fps                | 822      |
| nupdates           | 1147400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5737000  |
| value_loss         | 2.87e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.892    |
| fps                | 822      |
| nupdates           | 1147500  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5737500  |
| value_loss         | 4.61e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.545    |
| fps                | 823      |
| nupdates           | 1147600  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.619    |
| fps                | 822      |
| nupdates           | 1150300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5751500  |
| value_loss         | 6.74e-05 |
---------------------------------
----------------------------------
| explained_variance | -4.01e+03 |
| fps                | 822       |
| nupdates           | 1150400   |
| policy_entropy     | 2.04      |
| total_timesteps    | 5752000   |
| value_loss         | 0.11      |
----------------------------------
---------------------------------
| explained_variance | -3.59    |
| fps                | 822      |
| nupdates           | 1150500  |
| policy_entropy     | 2        |
| total_timesteps    | 5752500  |
| value_loss         | 0.00178  |
---------------------------------
---------------------------------
| explained_variance | 0.982    |
| fps                | 822      |
| nupdates           | 1150600  |
| policy_entropy     | 2.07     |
| tota

---------------------------------
| explained_variance | 0.969    |
| fps                | 823      |
| nupdates           | 1153400  |
| policy_entropy     | 1.97     |
| total_timesteps    | 5767000  |
| value_loss         | 5.48e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.687    |
| fps                | 823      |
| nupdates           | 1153500  |
| policy_entropy     | 2.02     |
| total_timesteps    | 5767500  |
| value_loss         | 7.15e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.911   |
| fps                | 823      |
| nupdates           | 1153600  |
| policy_entropy     | 2.04     |
| total_timesteps    | 5768000  |
| value_loss         | 0.000397 |
---------------------------------
---------------------------------
| explained_variance | 0.529    |
| fps                | 823      |
| nupdates           | 1153700  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.899    |
| fps                | 822      |
| nupdates           | 1156400  |
| policy_entropy     | 2.04     |
| total_timesteps    | 5782000  |
| value_loss         | 3.87e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.972    |
| fps                | 822      |
| nupdates           | 1156500  |
| policy_entropy     | 2.01     |
| total_timesteps    | 5782500  |
| value_loss         | 2.41e-05 |
---------------------------------
---------------------------------
| explained_variance | -243     |
| fps                | 822      |
| nupdates           | 1156600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5783000  |
| value_loss         | 0.00735  |
---------------------------------
---------------------------------
| explained_variance | -0.00101 |
| fps                | 822      |
| nupdates           | 1156700  |
| policy_entropy     | 1.83     |
| total_timest

---------------------------------
| explained_variance | 0.851    |
| fps                | 823      |
| nupdates           | 1159500  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5797500  |
| value_loss         | 4.32e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.467    |
| fps                | 823      |
| nupdates           | 1159600  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5798000  |
| value_loss         | 7.17e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.838    |
| fps                | 823      |
| nupdates           | 1159700  |
| policy_entropy     | 2.03     |
| total_timesteps    | 5798500  |
| value_loss         | 0.000344 |
---------------------------------
---------------------------------
| explained_variance | 0.798    |
| fps                | 823      |
| nupdates           | 1159800  |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | -0.237   |
| fps                | 822      |
| nupdates           | 1162500  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5812500  |
| value_loss         | 0.000706 |
---------------------------------
---------------------------------
| explained_variance | -2.54    |
| fps                | 822      |
| nupdates           | 1162600  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5813000  |
| value_loss         | 0.000197 |
---------------------------------
---------------------------------
| explained_variance | -0.202   |
| fps                | 822      |
| nupdates           | 1162700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5813500  |
| value_loss         | 0.000249 |
---------------------------------
---------------------------------
| explained_variance | 0.438    |
| fps                | 822      |
| nupdates           | 1162800  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.588    |
| fps                | 822      |
| nupdates           | 1165500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5827500  |
| value_loss         | 0.000291 |
---------------------------------
---------------------------------
| explained_variance | -0.243   |
| fps                | 822      |
| nupdates           | 1165600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5828000  |
| value_loss         | 0.000108 |
---------------------------------
---------------------------------
| explained_variance | 0.574    |
| fps                | 822      |
| nupdates           | 1165700  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5828500  |
| value_loss         | 0.000276 |
---------------------------------
---------------------------------
| explained_variance | -0.0659  |
| fps                | 822      |
| nupdates           | 1165800  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -10.5    |
| fps                | 823      |
| nupdates           | 1168600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5843000  |
| value_loss         | 0.00176  |
---------------------------------
---------------------------------
| explained_variance | 0.263    |
| fps                | 823      |
| nupdates           | 1168700  |
| policy_entropy     | 0.961    |
| total_timesteps    | 5843500  |
| value_loss         | 0.264    |
---------------------------------
---------------------------------
| explained_variance | -0.977   |
| fps                | 823      |
| nupdates           | 1168800  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5844000  |
| value_loss         | 0.00124  |
---------------------------------
---------------------------------
| explained_variance | 0.851    |
| fps                | 823      |
| nupdates           | 1168900  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -1.81    |
| fps                | 822      |
| nupdates           | 1171600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5858000  |
| value_loss         | 0.000373 |
---------------------------------
---------------------------------
| explained_variance | 0.099    |
| fps                | 822      |
| nupdates           | 1171700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5858500  |
| value_loss         | 4.97e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.142    |
| fps                | 822      |
| nupdates           | 1171800  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5859000  |
| value_loss         | 0.00025  |
---------------------------------
---------------------------------
| explained_variance | 0.527    |
| fps                | 823      |
| nupdates           | 1171900  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.738   |
| fps                | 823      |
| nupdates           | 1174700  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5873500  |
| value_loss         | 0.000385 |
---------------------------------
---------------------------------
| explained_variance | 0.000965 |
| fps                | 823      |
| nupdates           | 1174800  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5874000  |
| value_loss         | 6.75e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.72     |
| fps                | 823      |
| nupdates           | 1174900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5874500  |
| value_loss         | 0.00012  |
---------------------------------
Eval num_timesteps=5875000, episode_reward=-4.60 +/- 0.49
Episode length: 616.40 +/- 110.27
---------------------------------
| explained_variance | 0.15     |
| fps                | 8

---------------------------------
| explained_variance | -0.118   |
| fps                | 822      |
| nupdates           | 1177700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5888500  |
| value_loss         | 7.39e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.194   |
| fps                | 822      |
| nupdates           | 1177800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5889000  |
| value_loss         | 0.000328 |
---------------------------------
---------------------------------
| explained_variance | 0.868    |
| fps                | 822      |
| nupdates           | 1177900  |
| policy_entropy     | 2.01     |
| total_timesteps    | 5889500  |
| value_loss         | 0.000391 |
---------------------------------
---------------------------------
| explained_variance | 0.971    |
| fps                | 822      |
| nupdates           | 1178000  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -0.0088  |
| fps                | 822      |
| nupdates           | 1180700  |
| policy_entropy     | 1.4      |
| total_timesteps    | 5903500  |
| value_loss         | 0.155    |
---------------------------------
---------------------------------
| explained_variance | 0.677    |
| fps                | 822      |
| nupdates           | 1180800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5904000  |
| value_loss         | 2.26e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.817    |
| fps                | 822      |
| nupdates           | 1180900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5904500  |
| value_loss         | 8.75e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.363   |
| fps                | 822      |
| nupdates           | 1181000  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.95     |
| fps                | 822      |
| nupdates           | 1183800  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5919000  |
| value_loss         | 0.000104 |
---------------------------------
---------------------------------
| explained_variance | 0.957    |
| fps                | 822      |
| nupdates           | 1183900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5919500  |
| value_loss         | 1.28e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.05    |
| fps                | 822      |
| nupdates           | 1184000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5920000  |
| value_loss         | 0.000136 |
---------------------------------
---------------------------------
| explained_variance | 0.943    |
| fps                | 822      |
| nupdates           | 1184100  |
| policy_entropy     | 1.87     |
| total_timest

---------------------------------
| explained_variance | 0.816    |
| fps                | 822      |
| nupdates           | 1186800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5934000  |
| value_loss         | 7.16e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.509    |
| fps                | 822      |
| nupdates           | 1186900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5934500  |
| value_loss         | 4.64e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.958    |
| fps                | 822      |
| nupdates           | 1187000  |
| policy_entropy     | 2.03     |
| total_timesteps    | 5935000  |
| value_loss         | 5.89e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.526    |
| fps                | 822      |
| nupdates           | 1187100  |
| policy_entropy     | 2.01     |
| total_timest

---------------------------------
| explained_variance | 0.926    |
| fps                | 822      |
| nupdates           | 1189900  |
| policy_entropy     | 2.02     |
| total_timesteps    | 5949500  |
| value_loss         | 6.14e-05 |
---------------------------------
Eval num_timesteps=5950000, episode_reward=-4.90 +/- 0.30
Episode length: 619.00 +/- 91.10
---------------------------------
| explained_variance | 0.654    |
| fps                | 822      |
| nupdates           | 1190000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5950000  |
| value_loss         | 2.54e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.667    |
| fps                | 822      |
| nupdates           | 1190100  |
| policy_entropy     | 2.05     |
| total_timesteps    | 5950500  |
| value_loss         | 0.000227 |
---------------------------------
---------------------------------
| explained_variance | 0.541    |
| fps                | 82

---------------------------------
| explained_variance | 0.471    |
| fps                | 822      |
| nupdates           | 1192900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5964500  |
| value_loss         | 9.44e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.529    |
| fps                | 822      |
| nupdates           | 1193000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5965000  |
| value_loss         | 0.000468 |
---------------------------------
---------------------------------
| explained_variance | -8.97    |
| fps                | 822      |
| nupdates           | 1193100  |
| policy_entropy     | 2.04     |
| total_timesteps    | 5965500  |
| value_loss         | 0.00876  |
---------------------------------
---------------------------------
| explained_variance | -0.193   |
| fps                | 822      |
| nupdates           | 1193200  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.689    |
| fps                | 822      |
| nupdates           | 1195900  |
| policy_entropy     | 2.08     |
| total_timesteps    | 5979500  |
| value_loss         | 2.08e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.964    |
| fps                | 822      |
| nupdates           | 1196000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5980000  |
| value_loss         | 9.95e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.593    |
| fps                | 822      |
| nupdates           | 1196100  |
| policy_entropy     | 2.06     |
| total_timesteps    | 5980500  |
| value_loss         | 0.000191 |
---------------------------------
---------------------------------
| explained_variance | -0.461   |
| fps                | 822      |
| nupdates           | 1196200  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.15     |
| fps                | 822      |
| nupdates           | 1199000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5995000  |
| value_loss         | 0.000108 |
---------------------------------
---------------------------------
| explained_variance | 0.967    |
| fps                | 822      |
| nupdates           | 1199100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5995500  |
| value_loss         | 8.37e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.486    |
| fps                | 822      |
| nupdates           | 1199200  |
| policy_entropy     | 2.07     |
| total_timesteps    | 5996000  |
| value_loss         | 2.67e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.951    |
| fps                | 822      |
| nupdates           | 1199300  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.313   |
| fps                | 822      |
| nupdates           | 1202000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6010000  |
| value_loss         | 0.000338 |
---------------------------------
---------------------------------
| explained_variance | 0.982    |
| fps                | 822      |
| nupdates           | 1202100  |
| policy_entropy     | 2.02     |
| total_timesteps    | 6010500  |
| value_loss         | 1.68e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.762    |
| fps                | 822      |
| nupdates           | 1202200  |
| policy_entropy     | 2.01     |
| total_timesteps    | 6011000  |
| value_loss         | 1.47e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.702    |
| fps                | 822      |
| nupdates           | 1202300  |
| policy_entropy     | 2.01     |
| total_timest

----------------------------------
| explained_variance | -1.04e+03 |
| fps                | 822       |
| nupdates           | 1205100   |
| policy_entropy     | 2.07      |
| total_timesteps    | 6025500   |
| value_loss         | 0.0705    |
----------------------------------
---------------------------------
| explained_variance | 0.214    |
| fps                | 822      |
| nupdates           | 1205200  |
| policy_entropy     | 1.99     |
| total_timesteps    | 6026000  |
| value_loss         | 0.206    |
---------------------------------
---------------------------------
| explained_variance | 0.648    |
| fps                | 822      |
| nupdates           | 1205300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6026500  |
| value_loss         | 6.72e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.971    |
| fps                | 822      |
| nupdates           | 1205400  |
| policy_entropy     | 2.04     |
| tota

---------------------------------
| explained_variance | -9.56    |
| fps                | 822      |
| nupdates           | 1208200  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6041000  |
| value_loss         | 0.00471  |
---------------------------------
---------------------------------
| explained_variance | 0.96     |
| fps                | 822      |
| nupdates           | 1208300  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6041500  |
| value_loss         | 1.14e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.934    |
| fps                | 822      |
| nupdates           | 1208400  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6042000  |
| value_loss         | 2.76e-06 |
---------------------------------
---------------------------------
| explained_variance | -0.0864  |
| fps                | 822      |
| nupdates           | 1208500  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -2.36    |
| fps                | 822      |
| nupdates           | 1211200  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6056000  |
| value_loss         | 7.25e-05 |
---------------------------------
---------------------------------
| explained_variance | -8.85    |
| fps                | 822      |
| nupdates           | 1211300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6056500  |
| value_loss         | 0.00028  |
---------------------------------
---------------------------------
| explained_variance | 0.443    |
| fps                | 822      |
| nupdates           | 1211400  |
| policy_entropy     | 2.04     |
| total_timesteps    | 6057000  |
| value_loss         | 1.78e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.879    |
| fps                | 822      |
| nupdates           | 1211500  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.826    |
| fps                | 822      |
| nupdates           | 1214300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6071500  |
| value_loss         | 0.000638 |
---------------------------------
---------------------------------
| explained_variance | -12.3    |
| fps                | 822      |
| nupdates           | 1214400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6072000  |
| value_loss         | 0.000397 |
---------------------------------
---------------------------------
| explained_variance | 0.808    |
| fps                | 822      |
| nupdates           | 1214500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6072500  |
| value_loss         | 0.000161 |
---------------------------------
---------------------------------
| explained_variance | -0.202   |
| fps                | 822      |
| nupdates           | 1214600  |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | 0.748    |
| fps                | 822      |
| nupdates           | 1217300  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6086500  |
| value_loss         | 0.000146 |
---------------------------------
---------------------------------
| explained_variance | -14      |
| fps                | 822      |
| nupdates           | 1217400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6087000  |
| value_loss         | 0.0013   |
---------------------------------
---------------------------------
| explained_variance | 0.994    |
| fps                | 822      |
| nupdates           | 1217500  |
| policy_entropy     | 2.08     |
| total_timesteps    | 6087500  |
| value_loss         | 3.33e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.836    |
| fps                | 822      |
| nupdates           | 1217600  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.52     |
| fps                | 822      |
| nupdates           | 1220300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6101500  |
| value_loss         | 1.61e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.0753  |
| fps                | 822      |
| nupdates           | 1220400  |
| policy_entropy     | 2.08     |
| total_timesteps    | 6102000  |
| value_loss         | 0.000128 |
---------------------------------
---------------------------------
| explained_variance | 0.666    |
| fps                | 822      |
| nupdates           | 1220500  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6102500  |
| value_loss         | 0.000396 |
---------------------------------
---------------------------------
| explained_variance | -0.266   |
| fps                | 822      |
| nupdates           | 1220600  |
| policy_entropy     | 1.96     |
| total_timest

---------------------------------
| explained_variance | -0.315   |
| fps                | 822      |
| nupdates           | 1223400  |
| policy_entropy     | 2.08     |
| total_timesteps    | 6117000  |
| value_loss         | 5.48e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.101    |
| fps                | 822      |
| nupdates           | 1223500  |
| policy_entropy     | 2.04     |
| total_timesteps    | 6117500  |
| value_loss         | 0.000161 |
---------------------------------
---------------------------------
| explained_variance | 0.951    |
| fps                | 822      |
| nupdates           | 1223600  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6118000  |
| value_loss         | 3.7e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.897    |
| fps                | 822      |
| nupdates           | 1223700  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.989    |
| fps                | 822      |
| nupdates           | 1226400  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6132000  |
| value_loss         | 6.33e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.914    |
| fps                | 822      |
| nupdates           | 1226500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6132500  |
| value_loss         | 9.78e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.877    |
| fps                | 822      |
| nupdates           | 1226600  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6133000  |
| value_loss         | 8.54e-06 |
---------------------------------
---------------------------------
| explained_variance | -3.15    |
| fps                | 822      |
| nupdates           | 1226700  |
| policy_entropy     | 2        |
| total_timest

---------------------------------
| explained_variance | -1.75    |
| fps                | 822      |
| nupdates           | 1229500  |
| policy_entropy     | 2.01     |
| total_timesteps    | 6147500  |
| value_loss         | 0.00189  |
---------------------------------
---------------------------------
| explained_variance | 0.994    |
| fps                | 822      |
| nupdates           | 1229600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6148000  |
| value_loss         | 5.3e-06  |
---------------------------------
---------------------------------
| explained_variance | -3.11    |
| fps                | 822      |
| nupdates           | 1229700  |
| policy_entropy     | 2.08     |
| total_timesteps    | 6148500  |
| value_loss         | 0.0166   |
---------------------------------
---------------------------------
| explained_variance | -0.891   |
| fps                | 822      |
| nupdates           | 1229800  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.991    |
| fps                | 822      |
| nupdates           | 1232500  |
| policy_entropy     | 2.04     |
| total_timesteps    | 6162500  |
| value_loss         | 4.92e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.914    |
| fps                | 822      |
| nupdates           | 1232600  |
| policy_entropy     | 2.03     |
| total_timesteps    | 6163000  |
| value_loss         | 9.34e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.837    |
| fps                | 822      |
| nupdates           | 1232700  |
| policy_entropy     | 2.03     |
| total_timesteps    | 6163500  |
| value_loss         | 1.74e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.995    |
| fps                | 822      |
| nupdates           | 1232800  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -43.2    |
| fps                | 822      |
| nupdates           | 1235500  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6177500  |
| value_loss         | 0.005    |
---------------------------------
---------------------------------
| explained_variance | 0.355    |
| fps                | 822      |
| nupdates           | 1235600  |
| policy_entropy     | 2.03     |
| total_timesteps    | 6178000  |
| value_loss         | 0.101    |
---------------------------------
---------------------------------
| explained_variance | 0.984    |
| fps                | 822      |
| nupdates           | 1235700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6178500  |
| value_loss         | 5.06e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.353    |
| fps                | 822      |
| nupdates           | 1235800  |
| policy_entropy     | 2        |
| total_timest

---------------------------------
| explained_variance | 0.8      |
| fps                | 822      |
| nupdates           | 1238600  |
| policy_entropy     | 2.01     |
| total_timesteps    | 6193000  |
| value_loss         | 0.000186 |
---------------------------------
---------------------------------
| explained_variance | -0.667   |
| fps                | 822      |
| nupdates           | 1238700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6193500  |
| value_loss         | 7.87e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.474   |
| fps                | 822      |
| nupdates           | 1238800  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6194000  |
| value_loss         | 0.000393 |
---------------------------------
---------------------------------
| explained_variance | 0.86     |
| fps                | 822      |
| nupdates           | 1238900  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.965    |
| fps                | 822      |
| nupdates           | 1241600  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6208000  |
| value_loss         | 9.73e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.78    |
| fps                | 822      |
| nupdates           | 1241700  |
| policy_entropy     | 2.03     |
| total_timesteps    | 6208500  |
| value_loss         | 0.000194 |
---------------------------------
---------------------------------
| explained_variance | 0.969    |
| fps                | 822      |
| nupdates           | 1241800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6209000  |
| value_loss         | 7.86e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.924    |
| fps                | 822      |
| nupdates           | 1241900  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.347   |
| fps                | 822      |
| nupdates           | 1244700  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6223500  |
| value_loss         | 0.000307 |
---------------------------------
---------------------------------
| explained_variance | -702     |
| fps                | 822      |
| nupdates           | 1244800  |
| policy_entropy     | 1.8      |
| total_timesteps    | 6224000  |
| value_loss         | 0.0646   |
---------------------------------
---------------------------------
| explained_variance | -1.66    |
| fps                | 822      |
| nupdates           | 1244900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6224500  |
| value_loss         | 0.000306 |
---------------------------------
Eval num_timesteps=6225000, episode_reward=-4.80 +/- 0.40
Episode length: 553.60 +/- 105.28
---------------------------------
| explained_variance | 0.296    |
| fps                | 8

---------------------------------
| explained_variance | -1.23    |
| fps                | 822      |
| nupdates           | 1247700  |
| policy_entropy     | 2.02     |
| total_timesteps    | 6238500  |
| value_loss         | 0.000858 |
---------------------------------
---------------------------------
| explained_variance | 0.257    |
| fps                | 822      |
| nupdates           | 1247800  |
| policy_entropy     | 2.08     |
| total_timesteps    | 6239000  |
| value_loss         | 0.000213 |
---------------------------------
---------------------------------
| explained_variance | 0.893    |
| fps                | 822      |
| nupdates           | 1247900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6239500  |
| value_loss         | 0.000256 |
---------------------------------
---------------------------------
| explained_variance | 0.368    |
| fps                | 822      |
| nupdates           | 1248000  |
| policy_entropy     | 1.71     |
| total_timest

---------------------------------
| explained_variance | 0.776    |
| fps                | 821      |
| nupdates           | 1250700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6253500  |
| value_loss         | 5.22e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.817    |
| fps                | 821      |
| nupdates           | 1250800  |
| policy_entropy     | 2.08     |
| total_timesteps    | 6254000  |
| value_loss         | 3.28e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.869    |
| fps                | 821      |
| nupdates           | 1250900  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6254500  |
| value_loss         | 1.04e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.99     |
| fps                | 821      |
| nupdates           | 1251000  |
| policy_entropy     | 1.95     |
| total_timest

---------------------------------
| explained_variance | 0.881    |
| fps                | 822      |
| nupdates           | 1253800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6269000  |
| value_loss         | 8.88e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.981    |
| fps                | 822      |
| nupdates           | 1253900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6269500  |
| value_loss         | 3.74e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.994    |
| fps                | 822      |
| nupdates           | 1254000  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6270000  |
| value_loss         | 6.87e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.708    |
| fps                | 822      |
| nupdates           | 1254100  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.819    |
| fps                | 821      |
| nupdates           | 1256800  |
| policy_entropy     | 2.04     |
| total_timesteps    | 6284000  |
| value_loss         | 1.93e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.775   |
| fps                | 821      |
| nupdates           | 1256900  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6284500  |
| value_loss         | 0.000214 |
---------------------------------
---------------------------------
| explained_variance | -0.478   |
| fps                | 822      |
| nupdates           | 1257000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6285000  |
| value_loss         | 0.000533 |
---------------------------------
---------------------------------
| explained_variance | 0.879    |
| fps                | 822      |
| nupdates           | 1257100  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.611    |
| fps                | 822      |
| nupdates           | 1259900  |
| policy_entropy     | 2.08     |
| total_timesteps    | 6299500  |
| value_loss         | 0.000202 |
---------------------------------
Eval num_timesteps=6300000, episode_reward=-4.80 +/- 0.40
Episode length: 649.80 +/- 118.31
---------------------------------
| explained_variance | -4.82    |
| fps                | 821      |
| nupdates           | 1260000  |
| policy_entropy     | 1.9      |
| total_timesteps    | 6300000  |
| value_loss         | 0.00312  |
---------------------------------
---------------------------------
| explained_variance | 0.22     |
| fps                | 821      |
| nupdates           | 1260100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6300500  |
| value_loss         | 0.000222 |
---------------------------------
---------------------------------
| explained_variance | -3.25    |
| fps                | 8

---------------------------------
| explained_variance | 0.945    |
| fps                | 822      |
| nupdates           | 1262900  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6314500  |
| value_loss         | 1.32e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.485   |
| fps                | 822      |
| nupdates           | 1263000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6315000  |
| value_loss         | 0.000411 |
---------------------------------
---------------------------------
| explained_variance | -0.0391  |
| fps                | 822      |
| nupdates           | 1263100  |
| policy_entropy     | 2        |
| total_timesteps    | 6315500  |
| value_loss         | 0.00124  |
---------------------------------
---------------------------------
| explained_variance | 0.943    |
| fps                | 822      |
| nupdates           | 1263200  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -0.534   |
| fps                | 821      |
| nupdates           | 1265900  |
| policy_entropy     | 2        |
| total_timesteps    | 6329500  |
| value_loss         | 0.00045  |
---------------------------------
---------------------------------
| explained_variance | 0.245    |
| fps                | 821      |
| nupdates           | 1266000  |
| policy_entropy     | 2.08     |
| total_timesteps    | 6330000  |
| value_loss         | 0.000347 |
---------------------------------
---------------------------------
| explained_variance | 0.936    |
| fps                | 822      |
| nupdates           | 1266100  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6330500  |
| value_loss         | 3.75e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.919    |
| fps                | 822      |
| nupdates           | 1266200  |
| policy_entropy     | 2.02     |
| total_timest

---------------------------------
| explained_variance | 0.0618   |
| fps                | 822      |
| nupdates           | 1269000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6345000  |
| value_loss         | 0.000186 |
---------------------------------
---------------------------------
| explained_variance | -0.483   |
| fps                | 822      |
| nupdates           | 1269100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6345500  |
| value_loss         | 0.000135 |
---------------------------------
---------------------------------
| explained_variance | 0.126    |
| fps                | 822      |
| nupdates           | 1269200  |
| policy_entropy     | 2.08     |
| total_timesteps    | 6346000  |
| value_loss         | 0.000459 |
---------------------------------
---------------------------------
| explained_variance | -0.0041  |
| fps                | 822      |
| nupdates           | 1269300  |
| policy_entropy     | 1.32     |
| total_timest

---------------------------------
| explained_variance | 0.283    |
| fps                | 822      |
| nupdates           | 1272000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6360000  |
| value_loss         | 0.000135 |
---------------------------------
---------------------------------
| explained_variance | 0.648    |
| fps                | 822      |
| nupdates           | 1272100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6360500  |
| value_loss         | 0.000156 |
---------------------------------
---------------------------------
| explained_variance | 0.381    |
| fps                | 822      |
| nupdates           | 1272200  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6361000  |
| value_loss         | 0.000107 |
---------------------------------
---------------------------------
| explained_variance | 0.907    |
| fps                | 822      |
| nupdates           | 1272300  |
| policy_entropy     | 1.94     |
| total_timest

---------------------------------
| explained_variance | -17      |
| fps                | 821      |
| nupdates           | 1275100  |
| policy_entropy     | 2.02     |
| total_timesteps    | 6375500  |
| value_loss         | 0.0019   |
---------------------------------
---------------------------------
| explained_variance | -1.44    |
| fps                | 821      |
| nupdates           | 1275200  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6376000  |
| value_loss         | 0.000753 |
---------------------------------
---------------------------------
| explained_variance | -0.0417  |
| fps                | 821      |
| nupdates           | 1275300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6376500  |
| value_loss         | 0.00012  |
---------------------------------
---------------------------------
| explained_variance | 0.706    |
| fps                | 821      |
| nupdates           | 1275400  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.159    |
| fps                | 822      |
| nupdates           | 1278200  |
| policy_entropy     | 2.02     |
| total_timesteps    | 6391000  |
| value_loss         | 0.000241 |
---------------------------------
---------------------------------
| explained_variance | 0.859    |
| fps                | 822      |
| nupdates           | 1278300  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6391500  |
| value_loss         | 3.09e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.74    |
| fps                | 822      |
| nupdates           | 1278400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6392000  |
| value_loss         | 6.41e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.906    |
| fps                | 822      |
| nupdates           | 1278500  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.959    |
| fps                | 821      |
| nupdates           | 1281200  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6406000  |
| value_loss         | 1.12e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.917    |
| fps                | 821      |
| nupdates           | 1281300  |
| policy_entropy     | 2.03     |
| total_timesteps    | 6406500  |
| value_loss         | 0.000143 |
---------------------------------
---------------------------------
| explained_variance | -0.348   |
| fps                | 821      |
| nupdates           | 1281400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6407000  |
| value_loss         | 0.000263 |
---------------------------------
---------------------------------
| explained_variance | 0.933    |
| fps                | 821      |
| nupdates           | 1281500  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.397    |
| fps                | 822      |
| nupdates           | 1284300  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6421500  |
| value_loss         | 7.7e-05  |
---------------------------------
----------------------------------
| explained_variance | -1.13e+03 |
| fps                | 822       |
| nupdates           | 1284400   |
| policy_entropy     | 2.05      |
| total_timesteps    | 6422000   |
| value_loss         | 0.0303    |
----------------------------------
---------------------------------
| explained_variance | 0.179    |
| fps                | 822      |
| nupdates           | 1284500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6422500  |
| value_loss         | 5.99e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.343    |
| fps                | 822      |
| nupdates           | 1284600  |
| policy_entropy     | 2        |
| tota

---------------------------------
| explained_variance | -6.11    |
| fps                | 822      |
| nupdates           | 1287300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6436500  |
| value_loss         | 0.000521 |
---------------------------------
---------------------------------
| explained_variance | -0.417   |
| fps                | 822      |
| nupdates           | 1287400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6437000  |
| value_loss         | 0.000364 |
---------------------------------
---------------------------------
| explained_variance | -4.11    |
| fps                | 822      |
| nupdates           | 1287500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6437500  |
| value_loss         | 0.00128  |
---------------------------------
---------------------------------
| explained_variance | 0.558    |
| fps                | 822      |
| nupdates           | 1287600  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.812    |
| fps                | 821      |
| nupdates           | 1290300  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6451500  |
| value_loss         | 1.35e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.35    |
| fps                | 821      |
| nupdates           | 1290400  |
| policy_entropy     | 2.08     |
| total_timesteps    | 6452000  |
| value_loss         | 0.00138  |
---------------------------------
---------------------------------
| explained_variance | -18      |
| fps                | 821      |
| nupdates           | 1290500  |
| policy_entropy     | 2.08     |
| total_timesteps    | 6452500  |
| value_loss         | 0.00104  |
---------------------------------
---------------------------------
| explained_variance | 0.416    |
| fps                | 821      |
| nupdates           | 1290600  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.798    |
| fps                | 822      |
| nupdates           | 1293400  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6467000  |
| value_loss         | 0.000263 |
---------------------------------
---------------------------------
| explained_variance | 0.834    |
| fps                | 822      |
| nupdates           | 1293500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6467500  |
| value_loss         | 0.00043  |
---------------------------------
---------------------------------
| explained_variance | 0.683    |
| fps                | 822      |
| nupdates           | 1293600  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6468000  |
| value_loss         | 0.000353 |
---------------------------------
---------------------------------
| explained_variance | 0.0846   |
| fps                | 822      |
| nupdates           | 1293700  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.729    |
| fps                | 821      |
| nupdates           | 1296400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6482000  |
| value_loss         | 3.37e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.645    |
| fps                | 821      |
| nupdates           | 1296500  |
| policy_entropy     | 2.08     |
| total_timesteps    | 6482500  |
| value_loss         | 7.23e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.0313   |
| fps                | 821      |
| nupdates           | 1296600  |
| policy_entropy     | 2.02     |
| total_timesteps    | 6483000  |
| value_loss         | 0.000171 |
---------------------------------
---------------------------------
| explained_variance | -1.21    |
| fps                | 821      |
| nupdates           | 1296700  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -0.0407  |
| fps                | 822      |
| nupdates           | 1299500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6497500  |
| value_loss         | 0.000129 |
---------------------------------
---------------------------------
| explained_variance | 0.17     |
| fps                | 822      |
| nupdates           | 1299600  |
| policy_entropy     | 2.04     |
| total_timesteps    | 6498000  |
| value_loss         | 5.48e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.0817  |
| fps                | 822      |
| nupdates           | 1299700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6498500  |
| value_loss         | 0.00331  |
---------------------------------
---------------------------------
| explained_variance | 0.965    |
| fps                | 822      |
| nupdates           | 1299800  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.716    |
| fps                | 821      |
| nupdates           | 1302500  |
| policy_entropy     | 2.03     |
| total_timesteps    | 6512500  |
| value_loss         | 1.08e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.0199   |
| fps                | 821      |
| nupdates           | 1302600  |
| policy_entropy     | 2.04     |
| total_timesteps    | 6513000  |
| value_loss         | 0.000268 |
---------------------------------
---------------------------------
| explained_variance | 0.426    |
| fps                | 821      |
| nupdates           | 1302700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6513500  |
| value_loss         | 0.000284 |
---------------------------------
---------------------------------
| explained_variance | 0.433    |
| fps                | 821      |
| nupdates           | 1302800  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -4.83    |
| fps                | 821      |
| nupdates           | 1305500  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6527500  |
| value_loss         | 0.0004   |
---------------------------------
---------------------------------
| explained_variance | -0.635   |
| fps                | 821      |
| nupdates           | 1305600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6528000  |
| value_loss         | 0.000466 |
---------------------------------
---------------------------------
| explained_variance | -0.272   |
| fps                | 821      |
| nupdates           | 1305700  |
| policy_entropy     | 2.04     |
| total_timesteps    | 6528500  |
| value_loss         | 0.000126 |
---------------------------------
---------------------------------
| explained_variance | 0.646    |
| fps                | 821      |
| nupdates           | 1305800  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.982    |
| fps                | 821      |
| nupdates           | 1308600  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6543000  |
| value_loss         | 6.97e-06 |
---------------------------------
---------------------------------
| explained_variance | -6.91    |
| fps                | 821      |
| nupdates           | 1308700  |
| policy_entropy     | 2.02     |
| total_timesteps    | 6543500  |
| value_loss         | 0.000637 |
---------------------------------
---------------------------------
| explained_variance | 0.969    |
| fps                | 821      |
| nupdates           | 1308800  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6544000  |
| value_loss         | 2.74e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.476    |
| fps                | 821      |
| nupdates           | 1308900  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.0345  |
| fps                | 821      |
| nupdates           | 1311600  |
| policy_entropy     | 1.99     |
| total_timesteps    | 6558000  |
| value_loss         | 0.234    |
---------------------------------
---------------------------------
| explained_variance | 0.0765   |
| fps                | 821      |
| nupdates           | 1311700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6558500  |
| value_loss         | 9.88e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.213    |
| fps                | 821      |
| nupdates           | 1311800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6559000  |
| value_loss         | 0.000187 |
---------------------------------
---------------------------------
| explained_variance | 0.625    |
| fps                | 821      |
| nupdates           | 1311900  |
| policy_entropy     | 2.02     |
| total_timest

---------------------------------
| explained_variance | 0.656    |
| fps                | 821      |
| nupdates           | 1314700  |
| policy_entropy     | 2        |
| total_timesteps    | 6573500  |
| value_loss         | 3.57e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.00555 |
| fps                | 821      |
| nupdates           | 1314800  |
| policy_entropy     | 1.95     |
| total_timesteps    | 6574000  |
| value_loss         | 0.195    |
---------------------------------
---------------------------------
| explained_variance | -7.58    |
| fps                | 821      |
| nupdates           | 1314900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6574500  |
| value_loss         | 0.000219 |
---------------------------------
Eval num_timesteps=6575000, episode_reward=-5.00 +/- 0.00
Episode length: 589.50 +/- 115.10
---------------------------------
| explained_variance | -0.137   |
| fps                | 8

---------------------------------
| explained_variance | 0.509    |
| fps                | 821      |
| nupdates           | 1317700  |
| policy_entropy     | 1.82     |
| total_timesteps    | 6588500  |
| value_loss         | 0.00111  |
---------------------------------
---------------------------------
| explained_variance | -0.0785  |
| fps                | 821      |
| nupdates           | 1317800  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6589000  |
| value_loss         | 0.000107 |
---------------------------------
---------------------------------
| explained_variance | -1.86    |
| fps                | 821      |
| nupdates           | 1317900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6589500  |
| value_loss         | 0.000231 |
---------------------------------
---------------------------------
| explained_variance | 0.904    |
| fps                | 821      |
| nupdates           | 1318000  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -0.0382  |
| fps                | 821      |
| nupdates           | 1320700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6603500  |
| value_loss         | 9.73e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.471    |
| fps                | 821      |
| nupdates           | 1320800  |
| policy_entropy     | 2.03     |
| total_timesteps    | 6604000  |
| value_loss         | 2.41e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.695    |
| fps                | 821      |
| nupdates           | 1320900  |
| policy_entropy     | 2.03     |
| total_timesteps    | 6604500  |
| value_loss         | 0.000505 |
---------------------------------
---------------------------------
| explained_variance | 0.326    |
| fps                | 821      |
| nupdates           | 1321000  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.289    |
| fps                | 821      |
| nupdates           | 1323800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6619000  |
| value_loss         | 0.000193 |
---------------------------------
---------------------------------
| explained_variance | 0.403    |
| fps                | 821      |
| nupdates           | 1323900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6619500  |
| value_loss         | 0.000135 |
---------------------------------
---------------------------------
| explained_variance | -0.119   |
| fps                | 821      |
| nupdates           | 1324000  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6620000  |
| value_loss         | 0.000689 |
---------------------------------
---------------------------------
| explained_variance | 0.906    |
| fps                | 821      |
| nupdates           | 1324100  |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | 0.458    |
| fps                | 821      |
| nupdates           | 1326800  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6634000  |
| value_loss         | 0.000166 |
---------------------------------
---------------------------------
| explained_variance | -1.91    |
| fps                | 821      |
| nupdates           | 1326900  |
| policy_entropy     | 2.08     |
| total_timesteps    | 6634500  |
| value_loss         | 0.000179 |
---------------------------------
---------------------------------
| explained_variance | -1.38    |
| fps                | 821      |
| nupdates           | 1327000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6635000  |
| value_loss         | 0.000319 |
---------------------------------
---------------------------------
| explained_variance | 0.943    |
| fps                | 821      |
| nupdates           | 1327100  |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | -2.43    |
| fps                | 821      |
| nupdates           | 1329900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6649500  |
| value_loss         | 0.00122  |
---------------------------------
Eval num_timesteps=6650000, episode_reward=-4.80 +/- 0.60
Episode length: 547.50 +/- 106.11
---------------------------------
| explained_variance | 0.291    |
| fps                | 821      |
| nupdates           | 1330000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6650000  |
| value_loss         | 0.000239 |
---------------------------------
---------------------------------
| explained_variance | 0.649    |
| fps                | 821      |
| nupdates           | 1330100  |
| policy_entropy     | 2.08     |
| total_timesteps    | 6650500  |
| value_loss         | 9.87e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.625    |
| fps                | 8

---------------------------------
| explained_variance | -0.101   |
| fps                | 821      |
| nupdates           | 1332900  |
| policy_entropy     | 2        |
| total_timesteps    | 6664500  |
| value_loss         | 0.000135 |
---------------------------------
---------------------------------
| explained_variance | 0.268    |
| fps                | 821      |
| nupdates           | 1333000  |
| policy_entropy     | 1.98     |
| total_timesteps    | 6665000  |
| value_loss         | 5.06e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.0955   |
| fps                | 821      |
| nupdates           | 1333100  |
| policy_entropy     | 2.02     |
| total_timesteps    | 6665500  |
| value_loss         | 0.000273 |
---------------------------------
---------------------------------
| explained_variance | 0.29     |
| fps                | 821      |
| nupdates           | 1333200  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.263    |
| fps                | 821      |
| nupdates           | 1335900  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6679500  |
| value_loss         | 0.000467 |
---------------------------------
---------------------------------
| explained_variance | -0.058   |
| fps                | 821      |
| nupdates           | 1336000  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6680000  |
| value_loss         | 0.000194 |
---------------------------------
---------------------------------
| explained_variance | 0.872    |
| fps                | 821      |
| nupdates           | 1336100  |
| policy_entropy     | 2        |
| total_timesteps    | 6680500  |
| value_loss         | 0.000202 |
---------------------------------
---------------------------------
| explained_variance | 0.47     |
| fps                | 821      |
| nupdates           | 1336200  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -1.04    |
| fps                | 821      |
| nupdates           | 1339000  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6695000  |
| value_loss         | 0.000317 |
---------------------------------
---------------------------------
| explained_variance | 0.979    |
| fps                | 821      |
| nupdates           | 1339100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6695500  |
| value_loss         | 1.55e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.0146   |
| fps                | 821      |
| nupdates           | 1339200  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6696000  |
| value_loss         | 0.00044  |
---------------------------------
---------------------------------
| explained_variance | 0.893    |
| fps                | 821      |
| nupdates           | 1339300  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.788    |
| fps                | 821      |
| nupdates           | 1342000  |
| policy_entropy     | 2.04     |
| total_timesteps    | 6710000  |
| value_loss         | 0.000131 |
---------------------------------
---------------------------------
| explained_variance | 0.606    |
| fps                | 821      |
| nupdates           | 1342100  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6710500  |
| value_loss         | 9.44e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.0641  |
| fps                | 821      |
| nupdates           | 1342200  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6711000  |
| value_loss         | 4.38e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.841    |
| fps                | 821      |
| nupdates           | 1342300  |
| policy_entropy     | 1.55     |
| total_timest

---------------------------------
| explained_variance | 0.21     |
| fps                | 821      |
| nupdates           | 1345100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6725500  |
| value_loss         | 7.5e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.627    |
| fps                | 821      |
| nupdates           | 1345200  |
| policy_entropy     | 1.72     |
| total_timesteps    | 6726000  |
| value_loss         | 9.65e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.175    |
| fps                | 821      |
| nupdates           | 1345300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6726500  |
| value_loss         | 7.02e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.19     |
| fps                | 821      |
| nupdates           | 1345400  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.978    |
| fps                | 821      |
| nupdates           | 1348200  |
| policy_entropy     | 1.99     |
| total_timesteps    | 6741000  |
| value_loss         | 5.91e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.991    |
| fps                | 821      |
| nupdates           | 1348300  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6741500  |
| value_loss         | 8.38e-07 |
---------------------------------
---------------------------------
| explained_variance | 0.195    |
| fps                | 821      |
| nupdates           | 1348400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6742000  |
| value_loss         | 6.83e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.55     |
| fps                | 821      |
| nupdates           | 1348500  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -86      |
| fps                | 821      |
| nupdates           | 1351200  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6756000  |
| value_loss         | 0.014    |
---------------------------------
---------------------------------
| explained_variance | 0.864    |
| fps                | 821      |
| nupdates           | 1351300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6756500  |
| value_loss         | 0.0002   |
---------------------------------
---------------------------------
| explained_variance | 0.922    |
| fps                | 821      |
| nupdates           | 1351400  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6757000  |
| value_loss         | 3.13e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.107   |
| fps                | 821      |
| nupdates           | 1351500  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -1.98    |
| fps                | 821      |
| nupdates           | 1354300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6771500  |
| value_loss         | 0.00224  |
---------------------------------
---------------------------------
| explained_variance | 0.742    |
| fps                | 821      |
| nupdates           | 1354400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6772000  |
| value_loss         | 4.32e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.536    |
| fps                | 821      |
| nupdates           | 1354500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6772500  |
| value_loss         | 0.000106 |
---------------------------------
---------------------------------
| explained_variance | 0.877    |
| fps                | 821      |
| nupdates           | 1354600  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.937    |
| fps                | 821      |
| nupdates           | 1357300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6786500  |
| value_loss         | 3.14e-06 |
---------------------------------
---------------------------------
| explained_variance | -0.853   |
| fps                | 821      |
| nupdates           | 1357400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6787000  |
| value_loss         | 0.000426 |
---------------------------------
---------------------------------
| explained_variance | 0.828    |
| fps                | 821      |
| nupdates           | 1357500  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6787500  |
| value_loss         | 2.84e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.891    |
| fps                | 821      |
| nupdates           | 1357600  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.565    |
| fps                | 821      |
| nupdates           | 1360300  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6801500  |
| value_loss         | 8.01e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.967    |
| fps                | 821      |
| nupdates           | 1360400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6802000  |
| value_loss         | 7.62e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.941    |
| fps                | 821      |
| nupdates           | 1360500  |
| policy_entropy     | 2.08     |
| total_timesteps    | 6802500  |
| value_loss         | 5.14e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.365    |
| fps                | 821      |
| nupdates           | 1360600  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.135    |
| fps                | 821      |
| nupdates           | 1363400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6817000  |
| value_loss         | 0.000298 |
---------------------------------
---------------------------------
| explained_variance | -0.362   |
| fps                | 821      |
| nupdates           | 1363500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6817500  |
| value_loss         | 7.95e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.753    |
| fps                | 821      |
| nupdates           | 1363600  |
| policy_entropy     | 2.01     |
| total_timesteps    | 6818000  |
| value_loss         | 1.71e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.269    |
| fps                | 821      |
| nupdates           | 1363700  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -1.47    |
| fps                | 821      |
| nupdates           | 1366400  |
| policy_entropy     | 2.03     |
| total_timesteps    | 6832000  |
| value_loss         | 0.00024  |
---------------------------------
---------------------------------
| explained_variance | 0.47     |
| fps                | 821      |
| nupdates           | 1366500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6832500  |
| value_loss         | 0.00035  |
---------------------------------
---------------------------------
| explained_variance | 0.486    |
| fps                | 821      |
| nupdates           | 1366600  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6833000  |
| value_loss         | 6.83e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.986    |
| fps                | 821      |
| nupdates           | 1366700  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.00284 |
| fps                | 821      |
| nupdates           | 1369500  |
| policy_entropy     | 2.03     |
| total_timesteps    | 6847500  |
| value_loss         | 0.000587 |
---------------------------------
---------------------------------
| explained_variance | 0.97     |
| fps                | 821      |
| nupdates           | 1369600  |
| policy_entropy     | 2.03     |
| total_timesteps    | 6848000  |
| value_loss         | 5.13e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.358    |
| fps                | 821      |
| nupdates           | 1369700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6848500  |
| value_loss         | 3.87e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.855    |
| fps                | 821      |
| nupdates           | 1369800  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.443    |
| fps                | 821      |
| nupdates           | 1372500  |
| policy_entropy     | 2.04     |
| total_timesteps    | 6862500  |
| value_loss         | 5.86e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.358    |
| fps                | 821      |
| nupdates           | 1372600  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6863000  |
| value_loss         | 0.000183 |
---------------------------------
---------------------------------
| explained_variance | 0.996    |
| fps                | 821      |
| nupdates           | 1372700  |
| policy_entropy     | 2.03     |
| total_timesteps    | 6863500  |
| value_loss         | 6.15e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.984    |
| fps                | 821      |
| nupdates           | 1372800  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.467    |
| fps                | 821      |
| nupdates           | 1375500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6877500  |
| value_loss         | 2.41e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.0445   |
| fps                | 821      |
| nupdates           | 1375600  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6878000  |
| value_loss         | 3.31e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.91     |
| fps                | 821      |
| nupdates           | 1375700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 6878500  |
| value_loss         | 8.1e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.337    |
| fps                | 821      |
| nupdates           | 1375800  |
| policy_entropy     | 1.35     |
| total_timest

---------------------------------
| explained_variance | -0.374   |
| fps                | 821      |
| nupdates           | 1378600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6893000  |
| value_loss         | 0.000469 |
---------------------------------
---------------------------------
| explained_variance | 0.933    |
| fps                | 821      |
| nupdates           | 1378700  |
| policy_entropy     | 2        |
| total_timesteps    | 6893500  |
| value_loss         | 0.00011  |
---------------------------------
---------------------------------
| explained_variance | 0.899    |
| fps                | 821      |
| nupdates           | 1378800  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6894000  |
| value_loss         | 7.59e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.0465  |
| fps                | 821      |
| nupdates           | 1378900  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.988    |
| fps                | 820      |
| nupdates           | 1381600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6908000  |
| value_loss         | 5.62e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.2     |
| fps                | 820      |
| nupdates           | 1381700  |
| policy_entropy     | 2.08     |
| total_timesteps    | 6908500  |
| value_loss         | 0.000345 |
---------------------------------
---------------------------------
| explained_variance | -6.47    |
| fps                | 820      |
| nupdates           | 1381800  |
| policy_entropy     | 2.08     |
| total_timesteps    | 6909000  |
| value_loss         | 0.00166  |
---------------------------------
---------------------------------
| explained_variance | -0.719   |
| fps                | 820      |
| nupdates           | 1381900  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.745    |
| fps                | 821      |
| nupdates           | 1384700  |
| policy_entropy     | 2.08     |
| total_timesteps    | 6923500  |
| value_loss         | 4.87e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.977    |
| fps                | 821      |
| nupdates           | 1384800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6924000  |
| value_loss         | 4.28e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.276    |
| fps                | 821      |
| nupdates           | 1384900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6924500  |
| value_loss         | 0.000143 |
---------------------------------
Eval num_timesteps=6925000, episode_reward=-4.60 +/- 0.49
Episode length: 650.60 +/- 195.67
----------------------------------
| explained_variance | -6.77e+03 |
| fps                |

---------------------------------
| explained_variance | 0.96     |
| fps                | 820      |
| nupdates           | 1387700  |
| policy_entropy     | 2.01     |
| total_timesteps    | 6938500  |
| value_loss         | 0.0383   |
---------------------------------
---------------------------------
| explained_variance | -1.19    |
| fps                | 820      |
| nupdates           | 1387800  |
| policy_entropy     | 2.08     |
| total_timesteps    | 6939000  |
| value_loss         | 0.000108 |
---------------------------------
---------------------------------
| explained_variance | -0.0428  |
| fps                | 820      |
| nupdates           | 1387900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6939500  |
| value_loss         | 0.000279 |
---------------------------------
---------------------------------
| explained_variance | 0.498    |
| fps                | 820      |
| nupdates           | 1388000  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.423    |
| fps                | 820      |
| nupdates           | 1390700  |
| policy_entropy     | 2.05     |
| total_timesteps    | 6953500  |
| value_loss         | 0.000761 |
---------------------------------
---------------------------------
| explained_variance | 0.599    |
| fps                | 820      |
| nupdates           | 1390800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6954000  |
| value_loss         | 2.66e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.711    |
| fps                | 820      |
| nupdates           | 1390900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6954500  |
| value_loss         | 0.000103 |
---------------------------------
---------------------------------
| explained_variance | -0.782   |
| fps                | 820      |
| nupdates           | 1391000  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.693    |
| fps                | 820      |
| nupdates           | 1393800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6969000  |
| value_loss         | 8.23e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.59     |
| fps                | 820      |
| nupdates           | 1393900  |
| policy_entropy     | 1.58     |
| total_timesteps    | 6969500  |
| value_loss         | 0.927    |
---------------------------------
---------------------------------
| explained_variance | -0.262   |
| fps                | 820      |
| nupdates           | 1394000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6970000  |
| value_loss         | 0.000169 |
---------------------------------
---------------------------------
| explained_variance | -1.63    |
| fps                | 820      |
| nupdates           | 1394100  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.905    |
| fps                | 820      |
| nupdates           | 1396800  |
| policy_entropy     | 2        |
| total_timesteps    | 6984000  |
| value_loss         | 8.7e-06  |
---------------------------------
---------------------------------
| explained_variance | -0.774   |
| fps                | 820      |
| nupdates           | 1396900  |
| policy_entropy     | 2        |
| total_timesteps    | 6984500  |
| value_loss         | 0.000188 |
---------------------------------
---------------------------------
| explained_variance | 0.967    |
| fps                | 820      |
| nupdates           | 1397000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6985000  |
| value_loss         | 1.94e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.843    |
| fps                | 820      |
| nupdates           | 1397100  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.158   |
| fps                | 820      |
| nupdates           | 1399900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 6999500  |
| value_loss         | 0.000197 |
---------------------------------
Eval num_timesteps=7000000, episode_reward=-4.80 +/- 0.40
Episode length: 638.00 +/- 114.53
---------------------------------
| explained_variance | 0.535    |
| fps                | 820      |
| nupdates           | 1400000  |
| policy_entropy     | 2.08     |
| total_timesteps    | 7000000  |
| value_loss         | 1.74e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.915    |
| fps                | 820      |
| nupdates           | 1400100  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7000500  |
| value_loss         | 1.57e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.427    |
| fps                | 8

---------------------------------
| explained_variance | -0.132   |
| fps                | 820      |
| nupdates           | 1402900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7014500  |
| value_loss         | 0.00116  |
---------------------------------
---------------------------------
| explained_variance | 0.977    |
| fps                | 820      |
| nupdates           | 1403000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7015000  |
| value_loss         | 4.09e-05 |
---------------------------------
---------------------------------
| explained_variance | -4.71    |
| fps                | 820      |
| nupdates           | 1403100  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7015500  |
| value_loss         | 0.00882  |
---------------------------------
---------------------------------
| explained_variance | -6.21    |
| fps                | 820      |
| nupdates           | 1403200  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.479    |
| fps                | 820      |
| nupdates           | 1405900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7029500  |
| value_loss         | 0.000111 |
---------------------------------
---------------------------------
| explained_variance | 0.721    |
| fps                | 820      |
| nupdates           | 1406000  |
| policy_entropy     | 2.04     |
| total_timesteps    | 7030000  |
| value_loss         | 0.000133 |
---------------------------------
---------------------------------
| explained_variance | -12.4    |
| fps                | 820      |
| nupdates           | 1406100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7030500  |
| value_loss         | 0.00133  |
---------------------------------
---------------------------------
| explained_variance | -0.0397  |
| fps                | 820      |
| nupdates           | 1406200  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.251    |
| fps                | 820      |
| nupdates           | 1409000  |
| policy_entropy     | 2.02     |
| total_timesteps    | 7045000  |
| value_loss         | 0.000332 |
---------------------------------
---------------------------------
| explained_variance | -6.33    |
| fps                | 820      |
| nupdates           | 1409100  |
| policy_entropy     | 2        |
| total_timesteps    | 7045500  |
| value_loss         | 0.00234  |
---------------------------------
---------------------------------
| explained_variance | 0.75     |
| fps                | 820      |
| nupdates           | 1409200  |
| policy_entropy     | 2.04     |
| total_timesteps    | 7046000  |
| value_loss         | 1.11e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.94    |
| fps                | 820      |
| nupdates           | 1409300  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.011    |
| fps                | 820      |
| nupdates           | 1412000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7060000  |
| value_loss         | 0.000286 |
---------------------------------
---------------------------------
| explained_variance | -0.598   |
| fps                | 820      |
| nupdates           | 1412100  |
| policy_entropy     | 2.08     |
| total_timesteps    | 7060500  |
| value_loss         | 0.000336 |
---------------------------------
---------------------------------
| explained_variance | -0.315   |
| fps                | 820      |
| nupdates           | 1412200  |
| policy_entropy     | 1.98     |
| total_timesteps    | 7061000  |
| value_loss         | 0.000251 |
---------------------------------
---------------------------------
| explained_variance | -0.33    |
| fps                | 820      |
| nupdates           | 1412300  |
| policy_entropy     | 1.89     |
| total_timest

---------------------------------
| explained_variance | -0.241   |
| fps                | 820      |
| nupdates           | 1415100  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7075500  |
| value_loss         | 0.000444 |
---------------------------------
---------------------------------
| explained_variance | 0.933    |
| fps                | 820      |
| nupdates           | 1415200  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7076000  |
| value_loss         | 2.9e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.526    |
| fps                | 820      |
| nupdates           | 1415300  |
| policy_entropy     | 2.08     |
| total_timesteps    | 7076500  |
| value_loss         | 0.000301 |
---------------------------------
---------------------------------
| explained_variance | 0.973    |
| fps                | 820      |
| nupdates           | 1415400  |
| policy_entropy     | 2.01     |
| total_timest

---------------------------------
| explained_variance | 0.866    |
| fps                | 820      |
| nupdates           | 1418200  |
| policy_entropy     | 1.99     |
| total_timesteps    | 7091000  |
| value_loss         | 2.17e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.515    |
| fps                | 820      |
| nupdates           | 1418300  |
| policy_entropy     | 2.04     |
| total_timesteps    | 7091500  |
| value_loss         | 2.92e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.06    |
| fps                | 820      |
| nupdates           | 1418400  |
| policy_entropy     | 2.01     |
| total_timesteps    | 7092000  |
| value_loss         | 0.000161 |
---------------------------------
---------------------------------
| explained_variance | -0.105   |
| fps                | 820      |
| nupdates           | 1418500  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.942    |
| fps                | 820      |
| nupdates           | 1421200  |
| policy_entropy     | 1.99     |
| total_timesteps    | 7106000  |
| value_loss         | 7.41e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.16    |
| fps                | 820      |
| nupdates           | 1421300  |
| policy_entropy     | 2.03     |
| total_timesteps    | 7106500  |
| value_loss         | 0.000328 |
---------------------------------
---------------------------------
| explained_variance | -53.5    |
| fps                | 820      |
| nupdates           | 1421400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7107000  |
| value_loss         | 0.0151   |
---------------------------------
---------------------------------
| explained_variance | 0.519    |
| fps                | 820      |
| nupdates           | 1421500  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.66     |
| fps                | 820      |
| nupdates           | 1424300  |
| policy_entropy     | 2.02     |
| total_timesteps    | 7121500  |
| value_loss         | 0.000532 |
---------------------------------
---------------------------------
| explained_variance | 0.942    |
| fps                | 820      |
| nupdates           | 1424400  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7122000  |
| value_loss         | 3.96e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.436    |
| fps                | 820      |
| nupdates           | 1424500  |
| policy_entropy     | 0.943    |
| total_timesteps    | 7122500  |
| value_loss         | 0.133    |
---------------------------------
---------------------------------
| explained_variance | 0.894    |
| fps                | 820      |
| nupdates           | 1424600  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.39     |
| fps                | 820      |
| nupdates           | 1427300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7136500  |
| value_loss         | 7.82e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.983    |
| fps                | 820      |
| nupdates           | 1427400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7137000  |
| value_loss         | 1.88e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.66    |
| fps                | 820      |
| nupdates           | 1427500  |
| policy_entropy     | 2.03     |
| total_timesteps    | 7137500  |
| value_loss         | 0.00143  |
---------------------------------
---------------------------------
| explained_variance | -2.4     |
| fps                | 820      |
| nupdates           | 1427600  |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | 0.793    |
| fps                | 820      |
| nupdates           | 1430300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7151500  |
| value_loss         | 0.000165 |
---------------------------------
---------------------------------
| explained_variance | 0.35     |
| fps                | 820      |
| nupdates           | 1430400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7152000  |
| value_loss         | 0.000289 |
---------------------------------
---------------------------------
| explained_variance | 0.999    |
| fps                | 820      |
| nupdates           | 1430500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7152500  |
| value_loss         | 1.2e-05  |
---------------------------------
---------------------------------
| explained_variance | -0.429   |
| fps                | 820      |
| nupdates           | 1430600  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.567    |
| fps                | 820      |
| nupdates           | 1433400  |
| policy_entropy     | 2.04     |
| total_timesteps    | 7167000  |
| value_loss         | 4.17e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.92     |
| fps                | 820      |
| nupdates           | 1433500  |
| policy_entropy     | 1.97     |
| total_timesteps    | 7167500  |
| value_loss         | 0.000632 |
---------------------------------
---------------------------------
| explained_variance | 0.335    |
| fps                | 820      |
| nupdates           | 1433600  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7168000  |
| value_loss         | 0.000246 |
---------------------------------
---------------------------------
| explained_variance | 0.929    |
| fps                | 820      |
| nupdates           | 1433700  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.445   |
| fps                | 820      |
| nupdates           | 1436400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7182000  |
| value_loss         | 0.000213 |
---------------------------------
---------------------------------
| explained_variance | -0.293   |
| fps                | 820      |
| nupdates           | 1436500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7182500  |
| value_loss         | 3.95e-05 |
---------------------------------
---------------------------------
| explained_variance | -10.1    |
| fps                | 820      |
| nupdates           | 1436600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7183000  |
| value_loss         | 0.000389 |
---------------------------------
---------------------------------
| explained_variance | 0.114    |
| fps                | 820      |
| nupdates           | 1436700  |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | -0.925   |
| fps                | 820      |
| nupdates           | 1439500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7197500  |
| value_loss         | 4.33e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.0867   |
| fps                | 820      |
| nupdates           | 1439600  |
| policy_entropy     | 2.04     |
| total_timesteps    | 7198000  |
| value_loss         | 0.000163 |
---------------------------------
---------------------------------
| explained_variance | -1.65    |
| fps                | 820      |
| nupdates           | 1439700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7198500  |
| value_loss         | 6.83e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.015   |
| fps                | 820      |
| nupdates           | 1439800  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.605    |
| fps                | 820      |
| nupdates           | 1442500  |
| policy_entropy     | 2.08     |
| total_timesteps    | 7212500  |
| value_loss         | 1.29e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.85    |
| fps                | 820      |
| nupdates           | 1442600  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7213000  |
| value_loss         | 0.000674 |
---------------------------------
---------------------------------
| explained_variance | -0.563   |
| fps                | 820      |
| nupdates           | 1442700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7213500  |
| value_loss         | 0.000456 |
---------------------------------
---------------------------------
| explained_variance | 0.295    |
| fps                | 820      |
| nupdates           | 1442800  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -323     |
| fps                | 819      |
| nupdates           | 1445500  |
| policy_entropy     | 2.04     |
| total_timesteps    | 7227500  |
| value_loss         | 0.00842  |
---------------------------------
---------------------------------
| explained_variance | -0.135   |
| fps                | 819      |
| nupdates           | 1445600  |
| policy_entropy     | 2.04     |
| total_timesteps    | 7228000  |
| value_loss         | 2.09e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.26    |
| fps                | 819      |
| nupdates           | 1445700  |
| policy_entropy     | 2.04     |
| total_timesteps    | 7228500  |
| value_loss         | 0.000367 |
---------------------------------
---------------------------------
| explained_variance | -159     |
| fps                | 819      |
| nupdates           | 1445800  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -2.9     |
| fps                | 820      |
| nupdates           | 1448600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7243000  |
| value_loss         | 0.00389  |
---------------------------------
---------------------------------
| explained_variance | 0.316    |
| fps                | 820      |
| nupdates           | 1448700  |
| policy_entropy     | 1.61     |
| total_timesteps    | 7243500  |
| value_loss         | 0.197    |
---------------------------------
---------------------------------
| explained_variance | -0.221   |
| fps                | 820      |
| nupdates           | 1448800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7244000  |
| value_loss         | 9.48e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.477    |
| fps                | 820      |
| nupdates           | 1448900  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.136    |
| fps                | 819      |
| nupdates           | 1451600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7258000  |
| value_loss         | 0.000224 |
---------------------------------
---------------------------------
| explained_variance | 0.996    |
| fps                | 819      |
| nupdates           | 1451700  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7258500  |
| value_loss         | 3.74e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.957    |
| fps                | 819      |
| nupdates           | 1451800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7259000  |
| value_loss         | 3.83e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.814    |
| fps                | 819      |
| nupdates           | 1451900  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -0.587   |
| fps                | 819      |
| nupdates           | 1454700  |
| policy_entropy     | 2.04     |
| total_timesteps    | 7273500  |
| value_loss         | 0.000553 |
---------------------------------
---------------------------------
| explained_variance | 0.906    |
| fps                | 819      |
| nupdates           | 1454800  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7274000  |
| value_loss         | 2.87e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.821    |
| fps                | 819      |
| nupdates           | 1454900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7274500  |
| value_loss         | 0.000126 |
---------------------------------
Eval num_timesteps=7275000, episode_reward=-4.90 +/- 0.30
Episode length: 575.00 +/- 90.95
---------------------------------
| explained_variance | 0.993    |
| fps                | 81

---------------------------------
| explained_variance | 0.686    |
| fps                | 819      |
| nupdates           | 1457700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7288500  |
| value_loss         | 3.42e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.586    |
| fps                | 819      |
| nupdates           | 1457800  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7289000  |
| value_loss         | 0.000217 |
---------------------------------
---------------------------------
| explained_variance | 0.585    |
| fps                | 819      |
| nupdates           | 1457900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7289500  |
| value_loss         | 0.000226 |
---------------------------------
---------------------------------
| explained_variance | 0.857    |
| fps                | 819      |
| nupdates           | 1458000  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.661    |
| fps                | 819      |
| nupdates           | 1460700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7303500  |
| value_loss         | 6.61e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.922    |
| fps                | 819      |
| nupdates           | 1460800  |
| policy_entropy     | 2.04     |
| total_timesteps    | 7304000  |
| value_loss         | 3.44e-06 |
---------------------------------
---------------------------------
| explained_variance | -0.817   |
| fps                | 819      |
| nupdates           | 1460900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7304500  |
| value_loss         | 0.000136 |
---------------------------------
---------------------------------
| explained_variance | 0.927    |
| fps                | 819      |
| nupdates           | 1461000  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.522    |
| fps                | 819      |
| nupdates           | 1463800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7319000  |
| value_loss         | 1.57e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.873    |
| fps                | 819      |
| nupdates           | 1463900  |
| policy_entropy     | 2.08     |
| total_timesteps    | 7319500  |
| value_loss         | 8.62e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.622    |
| fps                | 819      |
| nupdates           | 1464000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7320000  |
| value_loss         | 2.2e-05  |
---------------------------------
---------------------------------
| explained_variance | 1        |
| fps                | 819      |
| nupdates           | 1464100  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -10.9    |
| fps                | 819      |
| nupdates           | 1466800  |
| policy_entropy     | 2.04     |
| total_timesteps    | 7334000  |
| value_loss         | 0.00133  |
---------------------------------
---------------------------------
| explained_variance | 0.978    |
| fps                | 819      |
| nupdates           | 1466900  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7334500  |
| value_loss         | 3.95e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.957    |
| fps                | 819      |
| nupdates           | 1467000  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7335000  |
| value_loss         | 4.17e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.826    |
| fps                | 819      |
| nupdates           | 1467100  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.378    |
| fps                | 819      |
| nupdates           | 1469900  |
| policy_entropy     | 1.99     |
| total_timesteps    | 7349500  |
| value_loss         | 0.162    |
---------------------------------
Eval num_timesteps=7350000, episode_reward=-4.90 +/- 0.30
Episode length: 589.60 +/- 146.38
----------------------------------
| explained_variance | -1.18e+03 |
| fps                | 819       |
| nupdates           | 1470000   |
| policy_entropy     | 1.99      |
| total_timesteps    | 7350000   |
| value_loss         | 0.0687    |
----------------------------------
---------------------------------
| explained_variance | 0.807    |
| fps                | 819      |
| nupdates           | 1470100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7350500  |
| value_loss         | 1.71e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.882    |
| fps           

---------------------------------
| explained_variance | 0.757    |
| fps                | 819      |
| nupdates           | 1472900  |
| policy_entropy     | 2.04     |
| total_timesteps    | 7364500  |
| value_loss         | 3.99e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.855    |
| fps                | 819      |
| nupdates           | 1473000  |
| policy_entropy     | 2.04     |
| total_timesteps    | 7365000  |
| value_loss         | 0.000131 |
---------------------------------
---------------------------------
| explained_variance | 0.813    |
| fps                | 819      |
| nupdates           | 1473100  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7365500  |
| value_loss         | 2.33e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.72    |
| fps                | 819      |
| nupdates           | 1473200  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.0795   |
| fps                | 818      |
| nupdates           | 1475900  |
| policy_entropy     | 1.96     |
| total_timesteps    | 7379500  |
| value_loss         | 0.000259 |
---------------------------------
---------------------------------
| explained_variance | -0.405   |
| fps                | 818      |
| nupdates           | 1476000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7380000  |
| value_loss         | 5.11e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.433   |
| fps                | 818      |
| nupdates           | 1476100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7380500  |
| value_loss         | 0.000342 |
---------------------------------
---------------------------------
| explained_variance | 0.611    |
| fps                | 818      |
| nupdates           | 1476200  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -0.134   |
| fps                | 819      |
| nupdates           | 1479000  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7395000  |
| value_loss         | 1.24e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.11    |
| fps                | 819      |
| nupdates           | 1479100  |
| policy_entropy     | 2.03     |
| total_timesteps    | 7395500  |
| value_loss         | 0.000561 |
---------------------------------
---------------------------------
| explained_variance | 0.904    |
| fps                | 819      |
| nupdates           | 1479200  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7396000  |
| value_loss         | 8.11e-06 |
---------------------------------
----------------------------------
| explained_variance | -0.000175 |
| fps                | 819       |
| nupdates           | 1479300   |
| policy_entropy     | 0.54      |
| total_t

---------------------------------
| explained_variance | -5.35    |
| fps                | 818      |
| nupdates           | 1482000  |
| policy_entropy     | 2.01     |
| total_timesteps    | 7410000  |
| value_loss         | 0.000343 |
---------------------------------
---------------------------------
| explained_variance | -2.74    |
| fps                | 818      |
| nupdates           | 1482100  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7410500  |
| value_loss         | 0.000389 |
---------------------------------
---------------------------------
| explained_variance | 0.615    |
| fps                | 818      |
| nupdates           | 1482200  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7411000  |
| value_loss         | 2.8e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.853    |
| fps                | 818      |
| nupdates           | 1482300  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.342    |
| fps                | 818      |
| nupdates           | 1485100  |
| policy_entropy     | 1.79     |
| total_timesteps    | 7425500  |
| value_loss         | 0.181    |
---------------------------------
---------------------------------
| explained_variance | 0.0243   |
| fps                | 818      |
| nupdates           | 1485200  |
| policy_entropy     | 2.03     |
| total_timesteps    | 7426000  |
| value_loss         | 0.000153 |
---------------------------------
---------------------------------
| explained_variance | -0.00887 |
| fps                | 818      |
| nupdates           | 1485300  |
| policy_entropy     | 1.69     |
| total_timesteps    | 7426500  |
| value_loss         | 0.165    |
---------------------------------
---------------------------------
| explained_variance | 0.948    |
| fps                | 818      |
| nupdates           | 1485400  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.93     |
| fps                | 818      |
| nupdates           | 1488200  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7441000  |
| value_loss         | 0.000206 |
---------------------------------
---------------------------------
| explained_variance | -0.427   |
| fps                | 818      |
| nupdates           | 1488300  |
| policy_entropy     | 2.08     |
| total_timesteps    | 7441500  |
| value_loss         | 7.38e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.995    |
| fps                | 818      |
| nupdates           | 1488400  |
| policy_entropy     | 2.08     |
| total_timesteps    | 7442000  |
| value_loss         | 2.5e-07  |
---------------------------------
---------------------------------
| explained_variance | -0.196   |
| fps                | 818      |
| nupdates           | 1488500  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.745   |
| fps                | 818      |
| nupdates           | 1491200  |
| policy_entropy     | 2.08     |
| total_timesteps    | 7456000  |
| value_loss         | 4.74e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.782    |
| fps                | 818      |
| nupdates           | 1491300  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7456500  |
| value_loss         | 0.000138 |
---------------------------------
---------------------------------
| explained_variance | 0.929    |
| fps                | 818      |
| nupdates           | 1491400  |
| policy_entropy     | 2.08     |
| total_timesteps    | 7457000  |
| value_loss         | 3.89e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.435    |
| fps                | 818      |
| nupdates           | 1491500  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -0.188   |
| fps                | 818      |
| nupdates           | 1494300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7471500  |
| value_loss         | 0.000118 |
---------------------------------
---------------------------------
| explained_variance | 0.304    |
| fps                | 818      |
| nupdates           | 1494400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7472000  |
| value_loss         | 0.000191 |
---------------------------------
---------------------------------
| explained_variance | -0.74    |
| fps                | 818      |
| nupdates           | 1494500  |
| policy_entropy     | 2.08     |
| total_timesteps    | 7472500  |
| value_loss         | 0.000881 |
---------------------------------
---------------------------------
| explained_variance | 0.941    |
| fps                | 819      |
| nupdates           | 1494600  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -0.924   |
| fps                | 818      |
| nupdates           | 1497300  |
| policy_entropy     | 1.97     |
| total_timesteps    | 7486500  |
| value_loss         | 0.00363  |
---------------------------------
---------------------------------
| explained_variance | -7.25    |
| fps                | 818      |
| nupdates           | 1497400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7487000  |
| value_loss         | 0.00082  |
---------------------------------
---------------------------------
| explained_variance | 0.267    |
| fps                | 818      |
| nupdates           | 1497500  |
| policy_entropy     | 2.08     |
| total_timesteps    | 7487500  |
| value_loss         | 0.000138 |
---------------------------------
---------------------------------
| explained_variance | -0.14    |
| fps                | 818      |
| nupdates           | 1497600  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -11.3    |
| fps                | 818      |
| nupdates           | 1500300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7501500  |
| value_loss         | 0.000458 |
---------------------------------
---------------------------------
| explained_variance | -0.251   |
| fps                | 818      |
| nupdates           | 1500400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7502000  |
| value_loss         | 6.04e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.819    |
| fps                | 818      |
| nupdates           | 1500500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7502500  |
| value_loss         | 0.000173 |
---------------------------------
---------------------------------
| explained_variance | -0.919   |
| fps                | 818      |
| nupdates           | 1500600  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -26.3    |
| fps                | 818      |
| nupdates           | 1503400  |
| policy_entropy     | 1.95     |
| total_timesteps    | 7517000  |
| value_loss         | 0.00329  |
---------------------------------
---------------------------------
| explained_variance | -0.198   |
| fps                | 818      |
| nupdates           | 1503500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7517500  |
| value_loss         | 0.000692 |
---------------------------------
---------------------------------
| explained_variance | -0.498   |
| fps                | 818      |
| nupdates           | 1503600  |
| policy_entropy     | 2.03     |
| total_timesteps    | 7518000  |
| value_loss         | 0.000102 |
---------------------------------
---------------------------------
| explained_variance | 0.928    |
| fps                | 818      |
| nupdates           | 1503700  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.451    |
| fps                | 818      |
| nupdates           | 1506400  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7532000  |
| value_loss         | 5.36e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.342    |
| fps                | 818      |
| nupdates           | 1506500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7532500  |
| value_loss         | 0.0007   |
---------------------------------
---------------------------------
| explained_variance | 0.935    |
| fps                | 818      |
| nupdates           | 1506600  |
| policy_entropy     | 2.08     |
| total_timesteps    | 7533000  |
| value_loss         | 8.46e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.316    |
| fps                | 818      |
| nupdates           | 1506700  |
| policy_entropy     | 0.505    |
| total_timest

---------------------------------
| explained_variance | 0.521    |
| fps                | 818      |
| nupdates           | 1509500  |
| policy_entropy     | 2.08     |
| total_timesteps    | 7547500  |
| value_loss         | 3.21e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.1     |
| fps                | 818      |
| nupdates           | 1509600  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7548000  |
| value_loss         | 0.000424 |
---------------------------------
---------------------------------
| explained_variance | 0.366    |
| fps                | 818      |
| nupdates           | 1509700  |
| policy_entropy     | 0.847    |
| total_timesteps    | 7548500  |
| value_loss         | 0.153    |
---------------------------------
---------------------------------
| explained_variance | -87.5    |
| fps                | 818      |
| nupdates           | 1509800  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.9      |
| fps                | 818      |
| nupdates           | 1512500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7562500  |
| value_loss         | 3.07e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.234    |
| fps                | 818      |
| nupdates           | 1512600  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7563000  |
| value_loss         | 0.000129 |
---------------------------------
---------------------------------
| explained_variance | -1.76    |
| fps                | 818      |
| nupdates           | 1512700  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7563500  |
| value_loss         | 0.000196 |
---------------------------------
---------------------------------
| explained_variance | 0.854    |
| fps                | 818      |
| nupdates           | 1512800  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -110     |
| fps                | 818      |
| nupdates           | 1515500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7577500  |
| value_loss         | 0.0164   |
---------------------------------
---------------------------------
| explained_variance | 0.729    |
| fps                | 818      |
| nupdates           | 1515600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7578000  |
| value_loss         | 5.01e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.912    |
| fps                | 818      |
| nupdates           | 1515700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7578500  |
| value_loss         | 4.42e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.981    |
| fps                | 818      |
| nupdates           | 1515800  |
| policy_entropy     | 2.06     |
| total_timest

----------------------------------
| explained_variance | -4.39e+03 |
| fps                | 818       |
| nupdates           | 1518600   |
| policy_entropy     | 2.02      |
| total_timesteps    | 7593000   |
| value_loss         | 0.124     |
----------------------------------
---------------------------------
| explained_variance | -8.3     |
| fps                | 818      |
| nupdates           | 1518700  |
| policy_entropy     | 2.01     |
| total_timesteps    | 7593500  |
| value_loss         | 0.00597  |
---------------------------------
---------------------------------
| explained_variance | 0.901    |
| fps                | 818      |
| nupdates           | 1518800  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7594000  |
| value_loss         | 4.66e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.702    |
| fps                | 818      |
| nupdates           | 1518900  |
| policy_entropy     | 2.05     |
| tota

---------------------------------
| explained_variance | 0.964    |
| fps                | 818      |
| nupdates           | 1521600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7608000  |
| value_loss         | 1.08e-05 |
---------------------------------
---------------------------------
| explained_variance | -19.1    |
| fps                | 818      |
| nupdates           | 1521700  |
| policy_entropy     | 2.04     |
| total_timesteps    | 7608500  |
| value_loss         | 0.0192   |
---------------------------------
---------------------------------
| explained_variance | 0.192    |
| fps                | 818      |
| nupdates           | 1521800  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7609000  |
| value_loss         | 0.000973 |
---------------------------------
---------------------------------
| explained_variance | 0.757    |
| fps                | 818      |
| nupdates           | 1521900  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.856    |
| fps                | 818      |
| nupdates           | 1524700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7623500  |
| value_loss         | 2.76e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.921   |
| fps                | 818      |
| nupdates           | 1524800  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7624000  |
| value_loss         | 0.000251 |
---------------------------------
---------------------------------
| explained_variance | 0.997    |
| fps                | 818      |
| nupdates           | 1524900  |
| policy_entropy     | 2.04     |
| total_timesteps    | 7624500  |
| value_loss         | 9.95e-05 |
---------------------------------
Eval num_timesteps=7625000, episode_reward=-4.90 +/- 0.30
Episode length: 561.40 +/- 93.67
---------------------------------
| explained_variance | 0.984    |
| fps                | 81

---------------------------------
| explained_variance | 0.993    |
| fps                | 818      |
| nupdates           | 1527700  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7638500  |
| value_loss         | 6.99e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.516    |
| fps                | 818      |
| nupdates           | 1527800  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7639000  |
| value_loss         | 6.83e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.996    |
| fps                | 818      |
| nupdates           | 1527900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7639500  |
| value_loss         | 1.04e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.996    |
| fps                | 818      |
| nupdates           | 1528000  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.456    |
| fps                | 818      |
| nupdates           | 1530700  |
| policy_entropy     | 2.04     |
| total_timesteps    | 7653500  |
| value_loss         | 1.89e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.348   |
| fps                | 818      |
| nupdates           | 1530800  |
| policy_entropy     | 2.03     |
| total_timesteps    | 7654000  |
| value_loss         | 0.000232 |
---------------------------------
---------------------------------
| explained_variance | 0.895    |
| fps                | 818      |
| nupdates           | 1530900  |
| policy_entropy     | 2.04     |
| total_timesteps    | 7654500  |
| value_loss         | 5.27e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.0838  |
| fps                | 818      |
| nupdates           | 1531000  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.597    |
| fps                | 818      |
| nupdates           | 1533800  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7669000  |
| value_loss         | 3.15e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.655    |
| fps                | 818      |
| nupdates           | 1533900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7669500  |
| value_loss         | 2.69e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.52    |
| fps                | 818      |
| nupdates           | 1534000  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7670000  |
| value_loss         | 0.000211 |
---------------------------------
---------------------------------
| explained_variance | 0.729    |
| fps                | 818      |
| nupdates           | 1534100  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.0371  |
| fps                | 818      |
| nupdates           | 1536800  |
| policy_entropy     | 2.02     |
| total_timesteps    | 7684000  |
| value_loss         | 0.000206 |
---------------------------------
---------------------------------
| explained_variance | 0.623    |
| fps                | 818      |
| nupdates           | 1536900  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7684500  |
| value_loss         | 3.97e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.508    |
| fps                | 818      |
| nupdates           | 1537000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7685000  |
| value_loss         | 2.78e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.68    |
| fps                | 818      |
| nupdates           | 1537100  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -0.597   |
| fps                | 818      |
| nupdates           | 1539900  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7699500  |
| value_loss         | 0.000325 |
---------------------------------
Eval num_timesteps=7700000, episode_reward=-5.00 +/- 0.00
Episode length: 624.70 +/- 127.42
---------------------------------
| explained_variance | 0.409    |
| fps                | 818      |
| nupdates           | 1540000  |
| policy_entropy     | 1.87     |
| total_timesteps    | 7700000  |
| value_loss         | 0.92     |
---------------------------------
---------------------------------
| explained_variance | 0.103    |
| fps                | 818      |
| nupdates           | 1540100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7700500  |
| value_loss         | 0.000526 |
---------------------------------
---------------------------------
| explained_variance | 0.962    |
| fps                | 8

---------------------------------
| explained_variance | 0.592    |
| fps                | 818      |
| nupdates           | 1542900  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7714500  |
| value_loss         | 1.04e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.117   |
| fps                | 818      |
| nupdates           | 1543000  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7715000  |
| value_loss         | 0.000285 |
---------------------------------
---------------------------------
| explained_variance | 0.0947   |
| fps                | 818      |
| nupdates           | 1543100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7715500  |
| value_loss         | 0.000278 |
---------------------------------
---------------------------------
| explained_variance | 0.987    |
| fps                | 818      |
| nupdates           | 1543200  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -1.55    |
| fps                | 818      |
| nupdates           | 1545900  |
| policy_entropy     | 2.03     |
| total_timesteps    | 7729500  |
| value_loss         | 0.00109  |
---------------------------------
---------------------------------
| explained_variance | -1.3     |
| fps                | 818      |
| nupdates           | 1546000  |
| policy_entropy     | 2.02     |
| total_timesteps    | 7730000  |
| value_loss         | 0.000339 |
---------------------------------
---------------------------------
| explained_variance | 0.801    |
| fps                | 818      |
| nupdates           | 1546100  |
| policy_entropy     | 2.08     |
| total_timesteps    | 7730500  |
| value_loss         | 8.15e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.0123   |
| fps                | 818      |
| nupdates           | 1546200  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.21    |
| fps                | 818      |
| nupdates           | 1549000  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7745000  |
| value_loss         | 0.000276 |
---------------------------------
---------------------------------
| explained_variance | -1.31    |
| fps                | 818      |
| nupdates           | 1549100  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7745500  |
| value_loss         | 0.000573 |
---------------------------------
---------------------------------
| explained_variance | -0.479   |
| fps                | 818      |
| nupdates           | 1549200  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7746000  |
| value_loss         | 4.9e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.985    |
| fps                | 818      |
| nupdates           | 1549300  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.996    |
| fps                | 818      |
| nupdates           | 1552000  |
| policy_entropy     | 2.03     |
| total_timesteps    | 7760000  |
| value_loss         | 4.19e-06 |
---------------------------------
---------------------------------
| explained_variance | -1.51    |
| fps                | 818      |
| nupdates           | 1552100  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7760500  |
| value_loss         | 3.67e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.787    |
| fps                | 818      |
| nupdates           | 1552200  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7761000  |
| value_loss         | 8.53e-05 |
---------------------------------
---------------------------------
| explained_variance | -73.1    |
| fps                | 818      |
| nupdates           | 1552300  |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.684    |
| fps                | 817      |
| nupdates           | 1555100  |
| policy_entropy     | 2.08     |
| total_timesteps    | 7775500  |
| value_loss         | 6.63e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.05    |
| fps                | 817      |
| nupdates           | 1555200  |
| policy_entropy     | 2.02     |
| total_timesteps    | 7776000  |
| value_loss         | 0.00121  |
---------------------------------
---------------------------------
| explained_variance | -0.00257 |
| fps                | 817      |
| nupdates           | 1555300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7776500  |
| value_loss         | 0.00024  |
---------------------------------
---------------------------------
| explained_variance | -94.6    |
| fps                | 817      |
| nupdates           | 1555400  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.521    |
| fps                | 817      |
| nupdates           | 1558200  |
| policy_entropy     | 2.08     |
| total_timesteps    | 7791000  |
| value_loss         | 0.000106 |
---------------------------------
---------------------------------
| explained_variance | 0.675    |
| fps                | 817      |
| nupdates           | 1558300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7791500  |
| value_loss         | 0.000152 |
---------------------------------
---------------------------------
| explained_variance | 0.855    |
| fps                | 817      |
| nupdates           | 1558400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7792000  |
| value_loss         | 8.14e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.81    |
| fps                | 817      |
| nupdates           | 1558500  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.882    |
| fps                | 816      |
| nupdates           | 1561200  |
| policy_entropy     | 2.04     |
| total_timesteps    | 7806000  |
| value_loss         | 8.77e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.667    |
| fps                | 816      |
| nupdates           | 1561300  |
| policy_entropy     | 2.02     |
| total_timesteps    | 7806500  |
| value_loss         | 0.000119 |
---------------------------------
---------------------------------
| explained_variance | -111     |
| fps                | 816      |
| nupdates           | 1561400  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7807000  |
| value_loss         | 0.00391  |
---------------------------------
---------------------------------
| explained_variance | -1.89    |
| fps                | 816      |
| nupdates           | 1561500  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.953    |
| fps                | 816      |
| nupdates           | 1564300  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7821500  |
| value_loss         | 8.71e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.61     |
| fps                | 815      |
| nupdates           | 1564400  |
| policy_entropy     | 2.03     |
| total_timesteps    | 7822000  |
| value_loss         | 0.000183 |
---------------------------------
---------------------------------
| explained_variance | -0.469   |
| fps                | 815      |
| nupdates           | 1564500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7822500  |
| value_loss         | 6.76e-05 |
---------------------------------
---------------------------------
| explained_variance | -11.2    |
| fps                | 815      |
| nupdates           | 1564600  |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.626    |
| fps                | 814      |
| nupdates           | 1567300  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7836500  |
| value_loss         | 0.000594 |
---------------------------------
---------------------------------
| explained_variance | -0.353   |
| fps                | 814      |
| nupdates           | 1567400  |
| policy_entropy     | 2.03     |
| total_timesteps    | 7837000  |
| value_loss         | 0.00122  |
---------------------------------
---------------------------------
| explained_variance | 0.959    |
| fps                | 814      |
| nupdates           | 1567500  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7837500  |
| value_loss         | 5.15e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.99     |
| fps                | 814      |
| nupdates           | 1567600  |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -6.12    |
| fps                | 813      |
| nupdates           | 1570300  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7851500  |
| value_loss         | 0.001    |
---------------------------------
---------------------------------
| explained_variance | -3.87    |
| fps                | 813      |
| nupdates           | 1570400  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7852000  |
| value_loss         | 0.000467 |
---------------------------------
---------------------------------
| explained_variance | -8.38    |
| fps                | 813      |
| nupdates           | 1570500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7852500  |
| value_loss         | 0.00236  |
---------------------------------
---------------------------------
| explained_variance | 0.421    |
| fps                | 813      |
| nupdates           | 1570600  |
| policy_entropy     | 1.26     |
| total_timest

---------------------------------
| explained_variance | 0.347    |
| fps                | 812      |
| nupdates           | 1573400  |
| policy_entropy     | 2.08     |
| total_timesteps    | 7867000  |
| value_loss         | 0.000164 |
---------------------------------
---------------------------------
| explained_variance | 0.8      |
| fps                | 812      |
| nupdates           | 1573500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7867500  |
| value_loss         | 0.000159 |
---------------------------------
---------------------------------
| explained_variance | 0.64     |
| fps                | 812      |
| nupdates           | 1573600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7868000  |
| value_loss         | 1.49e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.947    |
| fps                | 812      |
| nupdates           | 1573700  |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -12.6    |
| fps                | 811      |
| nupdates           | 1576400  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7882000  |
| value_loss         | 0.0103   |
---------------------------------
---------------------------------
| explained_variance | 0.596    |
| fps                | 811      |
| nupdates           | 1576500  |
| policy_entropy     | 2.04     |
| total_timesteps    | 7882500  |
| value_loss         | 5.44e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.79    |
| fps                | 811      |
| nupdates           | 1576600  |
| policy_entropy     | 2.08     |
| total_timesteps    | 7883000  |
| value_loss         | 0.00017  |
---------------------------------
---------------------------------
| explained_variance | -0.211   |
| fps                | 811      |
| nupdates           | 1576700  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.988    |
| fps                | 811      |
| nupdates           | 1579500  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7897500  |
| value_loss         | 1.06e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.983    |
| fps                | 811      |
| nupdates           | 1579600  |
| policy_entropy     | 2.07     |
| total_timesteps    | 7898000  |
| value_loss         | 6.9e-06  |
---------------------------------
---------------------------------
| explained_variance | -301     |
| fps                | 811      |
| nupdates           | 1579700  |
| policy_entropy     | 2.02     |
| total_timesteps    | 7898500  |
| value_loss         | 0.00427  |
---------------------------------
---------------------------------
| explained_variance | 0.134    |
| fps                | 811      |
| nupdates           | 1579800  |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -0.178   |
| fps                | 809      |
| nupdates           | 1582500  |
| policy_entropy     | 2.05     |
| total_timesteps    | 7912500  |
| value_loss         | 3.27e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.667    |
| fps                | 809      |
| nupdates           | 1582600  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7913000  |
| value_loss         | 0.000452 |
---------------------------------
---------------------------------
| explained_variance | -7.6     |
| fps                | 809      |
| nupdates           | 1582700  |
| policy_entropy     | 2.03     |
| total_timesteps    | 7913500  |
| value_loss         | 0.00308  |
---------------------------------
---------------------------------
| explained_variance | -0.489   |
| fps                | 809      |
| nupdates           | 1582800  |
| policy_entropy     | 2        |
| total_timest

---------------------------------
| explained_variance | 0.899    |
| fps                | 808      |
| nupdates           | 1585500  |
| policy_entropy     | 2.06     |
| total_timesteps    | 7927500  |
| value_loss         | 1.15e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.603   |
| fps                | 808      |
| nupdates           | 1585600  |
| policy_entropy     | 1.99     |
| total_timesteps    | 7928000  |
| value_loss         | 0.000149 |
---------------------------------


KeyboardInterrupt: 

In [12]:
# Persist the trained model for the selected algorithm under its own log folder.
model_str = 'a2c'
LOGDIR = "sb-" + model_str
# save() writes directly to the given path, so create the folder first in case
# no earlier cell (e.g. logger setup) has already done so on this kernel.
os.makedirs(LOGDIR, exist_ok=True)
# Look the model up by model_str rather than a second hard-coded key, so the
# saved checkpoint always matches the directory name chosen above.
trained_model[model_str].save(os.path.join(LOGDIR, "final_model"))

In [13]:
# Roll out the trained A2C agent, record the episodes to an mp4, and embed it.
video_filename = 'a2c.mp4'
# Bind the environment to a name so it can be released after recording;
# creating it inline in the call left it (and any render viewer) open.
eval_env = gym.make("SlimeVolley-v0")
try:
    record_game(
        model=trained_model['a2c'],
        env=eval_env,
        num_episodes=5,
        video_filename=video_filename
    )
finally:
    # Always release the environment, even if recording is interrupted.
    eval_env.close()
# Keep this as the cell's last expression so the notebook renders the video.
embed_mp4(video_filename)



score: -5
score: -4
score: -5
score: -5
score: -5
