# Stable-baselines algorithms experiment iteration

Algorithms available in stable-baselines, with a short note on each:
* A2C (no replay memory)
* ACER (no multibinary)
* ACKTR
* DDPG (continuous only)
* DQN (discrete action space only)
* HER (method wrapper for off-policy methods)
* GAIL (no multibinary)
* PPO
* SAC (continuous only)
* TD3 (continuous only)
* TRPO

In [1]:
import base64
import IPython
import imageio

def embed_mp4(filename):
    """Embed an mp4 file in the notebook as an inline HTML5 video.

    The whole file is read into memory, base64-encoded and placed in a
    ``data:video/mp4;base64,...`` URI, so the returned HTML carries the
    video itself rather than a link to it.

    Args:
        filename: Path of the mp4 file to embed.

    Returns:
        An ``IPython.display.HTML`` object wrapping a 640x480 ``<video>`` tag.
    """
    # Use a context manager so the file handle is closed deterministically
    # instead of being left for the garbage collector.
    with open(filename, 'rb') as video_file:
        video = video_file.read()
    b64 = base64.b64encode(video)
    tag = '''
    <video width="640" height="480" controls>
    <source src="data:video/mp4;base64,{0}" type="video/mp4">
    Your browser does not support the video tag.
    </video>'''.format(b64.decode())

    return IPython.display.HTML(tag)

def record_game(model, env, num_episodes=5, video_filename='video.mp4'):
    """Play episodes with ``model`` in ``env`` and record every frame to a video.

    For each episode the environment is reset, then ``model.predict`` picks an
    action for every observation until ``env.step`` reports ``done``. One frame
    is written right after the reset and one after every step. The summed
    reward of each episode is printed when it ends.

    Args:
        model: Object whose ``predict(obs)`` returns a 2-tuple; the first item
            is used as the action.
        env: Environment providing ``reset()``, ``step(action)`` and
            ``render('rgb_array')``.
        num_episodes: Number of episodes to play.
        video_filename: Output path passed to ``imageio.get_writer`` (60 fps).
    """
    with imageio.get_writer(video_filename, fps=60) as writer:

        def grab_frame():
            # Render the current state as an RGB array and append it to the video.
            writer.append_data(env.render('rgb_array'))

        for _episode in range(num_episodes):
            observation = env.reset()
            episode_score = 0
            grab_frame()  # frame of the freshly reset state

            finished = False
            while not finished:
                chosen_action, _ = model.predict(observation)
                observation, step_reward, finished, _info = env.step(chosen_action)
                episode_score += step_reward
                grab_frame()

            print("score:", episode_score)

In [2]:
import os
import gym
import slimevolleygym
from slimevolleygym import SurvivalRewardEnv

from stable_baselines.common.policies import MlpPolicy
from stable_baselines import logger
from stable_baselines.common.callbacks import EvalCallback

from stable_baselines.ppo1 import PPO1
from stable_baselines import A2C, ACER, ACKTR, DQN, HER, GAIL, TRPO

# Registry mapping a short algorithm key to its stable-baselines class.
# experiment() looks the key up here and instantiates the class as
# cls(MlpPolicy, env, verbose=2).
# NOTE(review): per the stable-baselines docs, HER needs a `model_class`
# argument and GAIL needs an expert dataset, and DQN ships its own policy
# classes — these entries probably cannot be built by experiment() as written;
# confirm before running them.
algo = {
    'a2c': A2C,
    'acer': ACER,
    'acktr': ACKTR,
    'dqn': DQN,
    'her': HER,
    'gail': GAIL,
    'ppo': PPO1,  # PPO1 was imported above but previously not selectable by key
    'trpo': TRPO,
}
# Models created by experiment(), keyed by the same algorithm key, so they
# remain reachable from later cells (e.g. after interrupting training).
trained_model = {}

The TensorFlow contrib module will not be included in TensorFlow 2.0.
For more information, please see:
  * https://github.com/tensorflow/community/blob/master/rfcs/20180907-contrib-sunset.md
  * https://github.com/tensorflow/addons
  * https://github.com/tensorflow/io (for I/O related ops)
If you depend on functionality not listed there, please file an issue.



In [8]:
def experiment(model_str, timesteps=15_000_000):
    """Train one registered algorithm on SlimeVolley-v0 with periodic evaluation.

    Args:
        model_str: Key into the module-level ``algo`` registry selecting the
            algorithm class. Also used to name the log directory
            (``"sb-" + model_str``).
        timesteps: Total number of training timesteps; converted with ``int()``.

    Raises:
        KeyError: If ``model_str`` is not a key of ``algo``. Raised before the
            logger is configured or any environment is created.

    Side effects:
        Configures the stable-baselines logger to write into the log directory,
        stores the model in ``trained_model[model_str]`` as soon as it is built
        (so it stays reachable if training is interrupted), lets
        ``EvalCallback`` write its best model and logs into the log directory,
        and saves ``final_model`` there if training runs to completion.
    """
    # Local import: keeps this cell self-contained without touching the import cell.
    from contextlib import closing

    NUM_TIMESTEPS = int(timesteps)
    SEED = 721
    EVAL_FREQ = 25000
    EVAL_EPISODES = 10  # was 1000
    LOGDIR = "sb-" + model_str

    # Validate the key up front so a typo does not leave an empty log directory
    # behind; the exception type stays KeyError, as with a plain dict lookup.
    if model_str not in algo:
        raise KeyError(
            "unknown algorithm %r; available: %s" % (model_str, sorted(algo))
        )
    model_cls = algo[model_str]

    logger.configure(folder=LOGDIR)

    # Training and evaluation use separate env instances: EvalCallback resets
    # and steps the env it is given, which would otherwise disturb the episode
    # the learner is in the middle of collecting.
    # closing() guarantees both envs are closed even when learn() raises or the
    # (very long) run is interrupted from the notebook.
    with closing(gym.make("SlimeVolley-v0")) as env, \
            closing(gym.make("SlimeVolley-v0")) as eval_env:
        env.seed(SEED)
        eval_env.seed(SEED + 1)  # different stream than the training env

        # Seed the model as well as the env.
        # NOTE(review): the stable-baselines docs say fully deterministic runs
        # additionally need n_cpu_tf_sess=1 — confirm if exact repeatability matters.
        model = model_cls(MlpPolicy, env, verbose=2, seed=SEED)
        trained_model[model_str] = model

        eval_callback = EvalCallback(
            eval_env,
            best_model_save_path=LOGDIR,
            log_path=LOGDIR,
            eval_freq=EVAL_FREQ,
            n_eval_episodes=EVAL_EPISODES,
        )
        model.learn(total_timesteps=NUM_TIMESTEPS, callback=eval_callback)
        # Only reached when training runs to completion; with the default
        # timestep budget the run is usually interrupted first.
        model.save(os.path.join(LOGDIR, "final_model"))

In [None]:
experiment('a2c')

Logging to sb-a2c
Wrapping the env in a DummyVecEnv.
----------------------------------
| explained_variance | -5.23e+03 |
| fps                | 33        |
| nupdates           | 1         |
| policy_entropy     | 2.08      |
| total_timesteps    | 5         |
| value_loss         | 0.107     |
----------------------------------
---------------------------------
| explained_variance | -246     |
| fps                | 767      |
| nupdates           | 100      |
| policy_entropy     | 2.08     |
| total_timesteps    | 500      |
| value_loss         | 0.000801 |
---------------------------------
---------------------------------
| explained_variance | -4.9e+03 |
| fps                | 881      |
| nupdates           | 200      |
| policy_entropy     | 2.08     |
| total_timesteps    | 1000     |
| value_loss         | 0.0119   |
---------------------------------
---------------------------------
| explained_variance | -5.79    |
| fps                | 930      |
| nupdates           

---------------------------------
| explained_variance | -12      |
| fps                | 1013     |
| nupdates           | 3000     |
| policy_entropy     | 2.01     |
| total_timesteps    | 15000    |
| value_loss         | 0.000368 |
---------------------------------
---------------------------------
| explained_variance | 0.487    |
| fps                | 1013     |
| nupdates           | 3100     |
| policy_entropy     | 2.05     |
| total_timesteps    | 15500    |
| value_loss         | 0.00196  |
---------------------------------
---------------------------------
| explained_variance | -5.68    |
| fps                | 1012     |
| nupdates           | 3200     |
| policy_entropy     | 2.02     |
| total_timesteps    | 16000    |
| value_loss         | 0.000413 |
---------------------------------
---------------------------------
| explained_variance | -910     |
| fps                | 1012     |
| nupdates           | 3300     |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -3.96    |
| fps                | 919      |
| nupdates           | 6000     |
| policy_entropy     | 2.06     |
| total_timesteps    | 30000    |
| value_loss         | 0.000334 |
---------------------------------
---------------------------------
| explained_variance | 0.977    |
| fps                | 920      |
| nupdates           | 6100     |
| policy_entropy     | 2        |
| total_timesteps    | 30500    |
| value_loss         | 8.73e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.744    |
| fps                | 922      |
| nupdates           | 6200     |
| policy_entropy     | 2.07     |
| total_timesteps    | 31000    |
| value_loss         | 2.59e-05 |
---------------------------------
---------------------------------
| explained_variance | -77.4    |
| fps                | 924      |
| nupdates           | 6300     |
| policy_entropy     | 2.02     |
| total_timest

---------------------------------
| explained_variance | -1.38    |
| fps                | 959      |
| nupdates           | 9100     |
| policy_entropy     | 2.07     |
| total_timesteps    | 45500    |
| value_loss         | 0.00128  |
---------------------------------
---------------------------------
| explained_variance | -3.57    |
| fps                | 960      |
| nupdates           | 9200     |
| policy_entropy     | 2.07     |
| total_timesteps    | 46000    |
| value_loss         | 0.0013   |
---------------------------------
---------------------------------
| explained_variance | -19.5    |
| fps                | 960      |
| nupdates           | 9300     |
| policy_entropy     | 2.05     |
| total_timesteps    | 46500    |
| value_loss         | 0.000282 |
---------------------------------
---------------------------------
| explained_variance | -24.8    |
| fps                | 959      |
| nupdates           | 9400     |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -0.16    |
| fps                | 926      |
| nupdates           | 12100    |
| policy_entropy     | 2.07     |
| total_timesteps    | 60500    |
| value_loss         | 0.00135  |
---------------------------------
---------------------------------
| explained_variance | -24.6    |
| fps                | 927      |
| nupdates           | 12200    |
| policy_entropy     | 2.05     |
| total_timesteps    | 61000    |
| value_loss         | 0.00143  |
---------------------------------
---------------------------------
| explained_variance | -371     |
| fps                | 928      |
| nupdates           | 12300    |
| policy_entropy     | 2.07     |
| total_timesteps    | 61500    |
| value_loss         | 0.0631   |
---------------------------------
---------------------------------
| explained_variance | -0.183   |
| fps                | 929      |
| nupdates           | 12400    |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -2.6     |
| fps                | 906      |
| nupdates           | 15100    |
| policy_entropy     | 2.05     |
| total_timesteps    | 75500    |
| value_loss         | 0.000275 |
---------------------------------
---------------------------------
| explained_variance | -14.6    |
| fps                | 907      |
| nupdates           | 15200    |
| policy_entropy     | 2.07     |
| total_timesteps    | 76000    |
| value_loss         | 0.00079  |
---------------------------------
---------------------------------
| explained_variance | -2.16    |
| fps                | 908      |
| nupdates           | 15300    |
| policy_entropy     | 2.06     |
| total_timesteps    | 76500    |
| value_loss         | 0.00339  |
---------------------------------
---------------------------------
| explained_variance | 0.597    |
| fps                | 909      |
| nupdates           | 15400    |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -2.1     |
| fps                | 930      |
| nupdates           | 18200    |
| policy_entropy     | 2.06     |
| total_timesteps    | 91000    |
| value_loss         | 9.14e-05 |
---------------------------------
----------------------------------
| explained_variance | -2.79e+03 |
| fps                | 930       |
| nupdates           | 18300     |
| policy_entropy     | 2.05      |
| total_timesteps    | 91500     |
| value_loss         | 0.15      |
----------------------------------
---------------------------------
| explained_variance | 0.842    |
| fps                | 931      |
| nupdates           | 18400    |
| policy_entropy     | 2.04     |
| total_timesteps    | 92000    |
| value_loss         | 0.000227 |
---------------------------------
---------------------------------
| explained_variance | 0.708    |
| fps                | 932      |
| nupdates           | 18500    |
| policy_entropy     | 2.06     |
| tota

---------------------------------
| explained_variance | -102     |
| fps                | 917      |
| nupdates           | 21200    |
| policy_entropy     | 2.05     |
| total_timesteps    | 106000   |
| value_loss         | 0.0238   |
---------------------------------
---------------------------------
| explained_variance | -2.23    |
| fps                | 917      |
| nupdates           | 21300    |
| policy_entropy     | 2.08     |
| total_timesteps    | 106500   |
| value_loss         | 0.00012  |
---------------------------------
---------------------------------
| explained_variance | -2.99    |
| fps                | 918      |
| nupdates           | 21400    |
| policy_entropy     | 2.06     |
| total_timesteps    | 107000   |
| value_loss         | 0.000162 |
---------------------------------
---------------------------------
| explained_variance | 0.0693   |
| fps                | 919      |
| nupdates           | 21500    |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -11.8    |
| fps                | 932      |
| nupdates           | 24300    |
| policy_entropy     | 2.05     |
| total_timesteps    | 121500   |
| value_loss         | 0.000675 |
---------------------------------
---------------------------------
| explained_variance | -1.41    |
| fps                | 933      |
| nupdates           | 24400    |
| policy_entropy     | 2.08     |
| total_timesteps    | 122000   |
| value_loss         | 0.00102  |
---------------------------------
---------------------------------
| explained_variance | -2.21    |
| fps                | 933      |
| nupdates           | 24500    |
| policy_entropy     | 2.06     |
| total_timesteps    | 122500   |
| value_loss         | 0.00017  |
---------------------------------
---------------------------------
| explained_variance | -2.72    |
| fps                | 933      |
| nupdates           | 24600    |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.365    |
| fps                | 925      |
| nupdates           | 27300    |
| policy_entropy     | 2.01     |
| total_timesteps    | 136500   |
| value_loss         | 0.0994   |
---------------------------------
---------------------------------
| explained_variance | -1.67    |
| fps                | 925      |
| nupdates           | 27400    |
| policy_entropy     | 2.07     |
| total_timesteps    | 137000   |
| value_loss         | 0.000825 |
---------------------------------
---------------------------------
| explained_variance | 0.919    |
| fps                | 925      |
| nupdates           | 27500    |
| policy_entropy     | 2.06     |
| total_timesteps    | 137500   |
| value_loss         | 5.87e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.613    |
| fps                | 926      |
| nupdates           | 27600    |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -1.74    |
| fps                | 919      |
| nupdates           | 30300    |
| policy_entropy     | 2.07     |
| total_timesteps    | 151500   |
| value_loss         | 0.00117  |
---------------------------------
---------------------------------
| explained_variance | -0.127   |
| fps                | 919      |
| nupdates           | 30400    |
| policy_entropy     | 2.05     |
| total_timesteps    | 152000   |
| value_loss         | 0.00037  |
---------------------------------
---------------------------------
| explained_variance | 0.427    |
| fps                | 920      |
| nupdates           | 30500    |
| policy_entropy     | 2.06     |
| total_timesteps    | 152500   |
| value_loss         | 0.137    |
---------------------------------
---------------------------------
| explained_variance | 0.806    |
| fps                | 920      |
| nupdates           | 30600    |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.213    |
| fps                | 931      |
| nupdates           | 33400    |
| policy_entropy     | 2.03     |
| total_timesteps    | 167000   |
| value_loss         | 0.000471 |
---------------------------------
---------------------------------
| explained_variance | -44.4    |
| fps                | 931      |
| nupdates           | 33500    |
| policy_entropy     | 2.03     |
| total_timesteps    | 167500   |
| value_loss         | 0.000398 |
---------------------------------
---------------------------------
| explained_variance | 0.895    |
| fps                | 932      |
| nupdates           | 33600    |
| policy_entropy     | 2.05     |
| total_timesteps    | 168000   |
| value_loss         | 0.000106 |
---------------------------------
---------------------------------
| explained_variance | -27.9    |
| fps                | 932      |
| nupdates           | 33700    |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.454    |
| fps                | 924      |
| nupdates           | 36400    |
| policy_entropy     | 2.05     |
| total_timesteps    | 182000   |
| value_loss         | 0.000376 |
---------------------------------
---------------------------------
| explained_variance | -2.81    |
| fps                | 924      |
| nupdates           | 36500    |
| policy_entropy     | 2.07     |
| total_timesteps    | 182500   |
| value_loss         | 0.000693 |
---------------------------------
---------------------------------
| explained_variance | 0.581    |
| fps                | 925      |
| nupdates           | 36600    |
| policy_entropy     | 2.05     |
| total_timesteps    | 183000   |
| value_loss         | 4.67e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.08    |
| fps                | 925      |
| nupdates           | 36700    |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -1.6     |
| fps                | 932      |
| nupdates           | 39500    |
| policy_entropy     | 2.04     |
| total_timesteps    | 197500   |
| value_loss         | 0.000267 |
---------------------------------
---------------------------------
| explained_variance | 0.592    |
| fps                | 933      |
| nupdates           | 39600    |
| policy_entropy     | 2.06     |
| total_timesteps    | 198000   |
| value_loss         | 0.000262 |
---------------------------------
---------------------------------
| explained_variance | 0.777    |
| fps                | 933      |
| nupdates           | 39700    |
| policy_entropy     | 2.01     |
| total_timesteps    | 198500   |
| value_loss         | 3.13e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.702    |
| fps                | 933      |
| nupdates           | 39800    |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -0.504   |
| fps                | 925      |
| nupdates           | 42500    |
| policy_entropy     | 2.06     |
| total_timesteps    | 212500   |
| value_loss         | 0.000888 |
---------------------------------
---------------------------------
| explained_variance | -4.35    |
| fps                | 925      |
| nupdates           | 42600    |
| policy_entropy     | 2.06     |
| total_timesteps    | 213000   |
| value_loss         | 0.002    |
---------------------------------
---------------------------------
| explained_variance | 0.379    |
| fps                | 925      |
| nupdates           | 42700    |
| policy_entropy     | 2.06     |
| total_timesteps    | 213500   |
| value_loss         | 0.000107 |
---------------------------------
---------------------------------
| explained_variance | -1.27    |
| fps                | 925      |
| nupdates           | 42800    |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -2.57    |
| fps                | 920      |
| nupdates           | 45500    |
| policy_entropy     | 2.07     |
| total_timesteps    | 227500   |
| value_loss         | 0.000511 |
---------------------------------
---------------------------------
| explained_variance | -11.5    |
| fps                | 920      |
| nupdates           | 45600    |
| policy_entropy     | 2.06     |
| total_timesteps    | 228000   |
| value_loss         | 0.000448 |
---------------------------------
---------------------------------
| explained_variance | -0.524   |
| fps                | 920      |
| nupdates           | 45700    |
| policy_entropy     | 2.06     |
| total_timesteps    | 228500   |
| value_loss         | 0.000425 |
---------------------------------
---------------------------------
| explained_variance | -0.467   |
| fps                | 920      |
| nupdates           | 45800    |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -2.48    |
| fps                | 927      |
| nupdates           | 48600    |
| policy_entropy     | 2.05     |
| total_timesteps    | 243000   |
| value_loss         | 0.000225 |
---------------------------------
---------------------------------
| explained_variance | 0.131    |
| fps                | 928      |
| nupdates           | 48700    |
| policy_entropy     | 2.06     |
| total_timesteps    | 243500   |
| value_loss         | 0.000393 |
---------------------------------
---------------------------------
| explained_variance | 0.201    |
| fps                | 928      |
| nupdates           | 48800    |
| policy_entropy     | 2.06     |
| total_timesteps    | 244000   |
| value_loss         | 0.000777 |
---------------------------------
---------------------------------
| explained_variance | -0.838   |
| fps                | 928      |
| nupdates           | 48900    |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.0581   |
| fps                | 924      |
| nupdates           | 51600    |
| policy_entropy     | 2.01     |
| total_timesteps    | 258000   |
| value_loss         | 0.000165 |
---------------------------------
---------------------------------
| explained_variance | 0.774    |
| fps                | 924      |
| nupdates           | 51700    |
| policy_entropy     | 2.04     |
| total_timesteps    | 258500   |
| value_loss         | 0.000242 |
---------------------------------
---------------------------------
| explained_variance | -0.326   |
| fps                | 924      |
| nupdates           | 51800    |
| policy_entropy     | 2.07     |
| total_timesteps    | 259000   |
| value_loss         | 0.000393 |
---------------------------------
---------------------------------
| explained_variance | -0.835   |
| fps                | 924      |
| nupdates           | 51900    |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.464    |
| fps                | 930      |
| nupdates           | 54700    |
| policy_entropy     | 2.06     |
| total_timesteps    | 273500   |
| value_loss         | 0.000244 |
---------------------------------
----------------------------------
| explained_variance | -1.28e+04 |
| fps                | 930       |
| nupdates           | 54800     |
| policy_entropy     | 2.07      |
| total_timesteps    | 274000    |
| value_loss         | 0.146     |
----------------------------------
---------------------------------
| explained_variance | 0.997    |
| fps                | 930      |
| nupdates           | 54900    |
| policy_entropy     | 2.06     |
| total_timesteps    | 274500   |
| value_loss         | 0.000122 |
---------------------------------
Eval num_timesteps=275000, episode_reward=-4.70 +/- 0.46
Episode length: 564.20 +/- 80.02
---------------------------------
| explained_variance | -16.8    |
| fps             

---------------------------------
| explained_variance | 0.849    |
| fps                | 925      |
| nupdates           | 57700    |
| policy_entropy     | 2.02     |
| total_timesteps    | 288500   |
| value_loss         | 0.000467 |
---------------------------------
---------------------------------
| explained_variance | 0.077    |
| fps                | 925      |
| nupdates           | 57800    |
| policy_entropy     | 2        |
| total_timesteps    | 289000   |
| value_loss         | 0.000703 |
---------------------------------
---------------------------------
| explained_variance | -3.25    |
| fps                | 925      |
| nupdates           | 57900    |
| policy_entropy     | 2.07     |
| total_timesteps    | 289500   |
| value_loss         | 8.88e-05 |
---------------------------------
---------------------------------
| explained_variance | -84.9    |
| fps                | 925      |
| nupdates           | 58000    |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.683    |
| fps                | 921      |
| nupdates           | 60700    |
| policy_entropy     | 2.06     |
| total_timesteps    | 303500   |
| value_loss         | 2.7e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.0626   |
| fps                | 921      |
| nupdates           | 60800    |
| policy_entropy     | 2.06     |
| total_timesteps    | 304000   |
| value_loss         | 4.64e-05 |
---------------------------------
---------------------------------
| explained_variance | -3.04    |
| fps                | 922      |
| nupdates           | 60900    |
| policy_entropy     | 2.05     |
| total_timesteps    | 304500   |
| value_loss         | 0.000892 |
---------------------------------
---------------------------------
| explained_variance | -12      |
| fps                | 922      |
| nupdates           | 61000    |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.0609   |
| fps                | 927      |
| nupdates           | 63800    |
| policy_entropy     | 2.07     |
| total_timesteps    | 319000   |
| value_loss         | 0.000254 |
---------------------------------
---------------------------------
| explained_variance | -1.98    |
| fps                | 927      |
| nupdates           | 63900    |
| policy_entropy     | 2.07     |
| total_timesteps    | 319500   |
| value_loss         | 0.000549 |
---------------------------------
---------------------------------
| explained_variance | -0.457   |
| fps                | 927      |
| nupdates           | 64000    |
| policy_entropy     | 2.06     |
| total_timesteps    | 320000   |
| value_loss         | 0.000401 |
---------------------------------
---------------------------------
| explained_variance | 0.85     |
| fps                | 927      |
| nupdates           | 64100    |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -3.93    |
| fps                | 923      |
| nupdates           | 66800    |
| policy_entropy     | 2.07     |
| total_timesteps    | 334000   |
| value_loss         | 0.000107 |
---------------------------------
---------------------------------
| explained_variance | -4.17    |
| fps                | 923      |
| nupdates           | 66900    |
| policy_entropy     | 2.07     |
| total_timesteps    | 334500   |
| value_loss         | 0.000976 |
---------------------------------
---------------------------------
| explained_variance | -4.2     |
| fps                | 923      |
| nupdates           | 67000    |
| policy_entropy     | 2.06     |
| total_timesteps    | 335000   |
| value_loss         | 0.000426 |
---------------------------------
---------------------------------
| explained_variance | 0.903    |
| fps                | 923      |
| nupdates           | 67100    |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.685    |
| fps                | 929      |
| nupdates           | 69900    |
| policy_entropy     | 2.05     |
| total_timesteps    | 349500   |
| value_loss         | 0.942    |
---------------------------------
Eval num_timesteps=350000, episode_reward=-4.90 +/- 0.30
Episode length: 553.30 +/- 133.57
---------------------------------
| explained_variance | -7.39    |
| fps                | 921      |
| nupdates           | 70000    |
| policy_entropy     | 2.05     |
| total_timesteps    | 350000   |
| value_loss         | 0.000524 |
---------------------------------
---------------------------------
| explained_variance | 0.746    |
| fps                | 921      |
| nupdates           | 70100    |
| policy_entropy     | 2.06     |
| total_timesteps    | 350500   |
| value_loss         | 6.13e-06 |
---------------------------------
---------------------------------
| explained_variance | -724     |
| fps                | 92

---------------------------------
| explained_variance | -13.1    |
| fps                | 926      |
| nupdates           | 72900    |
| policy_entropy     | 2.04     |
| total_timesteps    | 364500   |
| value_loss         | 0.00059  |
---------------------------------
---------------------------------
| explained_variance | -1.2     |
| fps                | 926      |
| nupdates           | 73000    |
| policy_entropy     | 2.03     |
| total_timesteps    | 365000   |
| value_loss         | 0.00183  |
---------------------------------
---------------------------------
| explained_variance | -15      |
| fps                | 926      |
| nupdates           | 73100    |
| policy_entropy     | 2.07     |
| total_timesteps    | 365500   |
| value_loss         | 0.000623 |
---------------------------------
---------------------------------
| explained_variance | 0.757    |
| fps                | 926      |
| nupdates           | 73200    |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.165    |
| fps                | 921      |
| nupdates           | 75900    |
| policy_entropy     | 2.07     |
| total_timesteps    | 379500   |
| value_loss         | 6.16e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.23    |
| fps                | 921      |
| nupdates           | 76000    |
| policy_entropy     | 2.04     |
| total_timesteps    | 380000   |
| value_loss         | 0.000495 |
---------------------------------
---------------------------------
| explained_variance | 0.355    |
| fps                | 922      |
| nupdates           | 76100    |
| policy_entropy     | 2.01     |
| total_timesteps    | 380500   |
| value_loss         | 0.1      |
---------------------------------
---------------------------------
| explained_variance | -0.608   |
| fps                | 922      |
| nupdates           | 76200    |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.0188  |
| fps                | 925      |
| nupdates           | 79000    |
| policy_entropy     | 2.06     |
| total_timesteps    | 395000   |
| value_loss         | 0.201    |
---------------------------------
---------------------------------
| explained_variance | 0.85     |
| fps                | 926      |
| nupdates           | 79100    |
| policy_entropy     | 2.06     |
| total_timesteps    | 395500   |
| value_loss         | 3.21e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.855    |
| fps                | 926      |
| nupdates           | 79200    |
| policy_entropy     | 2.07     |
| total_timesteps    | 396000   |
| value_loss         | 8.08e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.759    |
| fps                | 926      |
| nupdates           | 79300    |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.783    |
| fps                | 924      |
| nupdates           | 82000    |
| policy_entropy     | 2.07     |
| total_timesteps    | 410000   |
| value_loss         | 9.34e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.586    |
| fps                | 924      |
| nupdates           | 82100    |
| policy_entropy     | 2.06     |
| total_timesteps    | 410500   |
| value_loss         | 7.69e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.987   |
| fps                | 924      |
| nupdates           | 82200    |
| policy_entropy     | 2.07     |
| total_timesteps    | 411000   |
| value_loss         | 0.000174 |
---------------------------------
---------------------------------
| explained_variance | -0.644   |
| fps                | 924      |
| nupdates           | 82300    |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.36     |
| fps                | 922      |
| nupdates           | 85100    |
| policy_entropy     | 2.07     |
| total_timesteps    | 425500   |
| value_loss         | 8.99e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.09    |
| fps                | 922      |
| nupdates           | 85200    |
| policy_entropy     | 2.07     |
| total_timesteps    | 426000   |
| value_loss         | 0.000987 |
---------------------------------
---------------------------------
| explained_variance | 0.994    |
| fps                | 922      |
| nupdates           | 85300    |
| policy_entropy     | 2.07     |
| total_timesteps    | 426500   |
| value_loss         | 0.000855 |
---------------------------------
---------------------------------
| explained_variance | -4.65    |
| fps                | 922      |
| nupdates           | 85400    |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.801    |
| fps                | 926      |
| nupdates           | 88200    |
| policy_entropy     | 2.07     |
| total_timesteps    | 441000   |
| value_loss         | 0.00097  |
---------------------------------
---------------------------------
| explained_variance | -0.766   |
| fps                | 926      |
| nupdates           | 88300    |
| policy_entropy     | 2.06     |
| total_timesteps    | 441500   |
| value_loss         | 0.000331 |
---------------------------------
---------------------------------
| explained_variance | 0.746    |
| fps                | 926      |
| nupdates           | 88400    |
| policy_entropy     | 2.06     |
| total_timesteps    | 442000   |
| value_loss         | 0.000154 |
---------------------------------
---------------------------------
| explained_variance | 0.66     |
| fps                | 926      |
| nupdates           | 88500    |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.495    |
| fps                | 923      |
| nupdates           | 91200    |
| policy_entropy     | 2.06     |
| total_timesteps    | 456000   |
| value_loss         | 5.25e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.9     |
| fps                | 923      |
| nupdates           | 91300    |
| policy_entropy     | 2.06     |
| total_timesteps    | 456500   |
| value_loss         | 0.00145  |
---------------------------------
---------------------------------
| explained_variance | 0.386    |
| fps                | 923      |
| nupdates           | 91400    |
| policy_entropy     | 2.07     |
| total_timesteps    | 457000   |
| value_loss         | 0.146    |
---------------------------------
---------------------------------
| explained_variance | 0.897    |
| fps                | 924      |
| nupdates           | 91500    |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.674    |
| fps                | 928      |
| nupdates           | 94300    |
| policy_entropy     | 2.07     |
| total_timesteps    | 471500   |
| value_loss         | 4.8e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.998    |
| fps                | 928      |
| nupdates           | 94400    |
| policy_entropy     | 2.07     |
| total_timesteps    | 472000   |
| value_loss         | 0.00328  |
---------------------------------
---------------------------------
| explained_variance | 0.529    |
| fps                | 928      |
| nupdates           | 94500    |
| policy_entropy     | 2.06     |
| total_timesteps    | 472500   |
| value_loss         | 0.000105 |
---------------------------------
---------------------------------
| explained_variance | 0.709    |
| fps                | 928      |
| nupdates           | 94600    |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -0.542   |
| fps                | 927      |
| nupdates           | 97300    |
| policy_entropy     | 2.06     |
| total_timesteps    | 486500   |
| value_loss         | 0.00061  |
---------------------------------
---------------------------------
| explained_variance | -0.908   |
| fps                | 927      |
| nupdates           | 97400    |
| policy_entropy     | 2.03     |
| total_timesteps    | 487000   |
| value_loss         | 0.00126  |
---------------------------------
---------------------------------
| explained_variance | -10.5    |
| fps                | 927      |
| nupdates           | 97500    |
| policy_entropy     | 2.08     |
| total_timesteps    | 487500   |
| value_loss         | 0.000101 |
---------------------------------
---------------------------------
| explained_variance | 0.783    |
| fps                | 927      |
| nupdates           | 97600    |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -4.02    |
| fps                | 924      |
| nupdates           | 100300   |
| policy_entropy     | 2.08     |
| total_timesteps    | 501500   |
| value_loss         | 0.000113 |
---------------------------------
---------------------------------
| explained_variance | -3.05    |
| fps                | 925      |
| nupdates           | 100400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 502000   |
| value_loss         | 0.00105  |
---------------------------------
---------------------------------
| explained_variance | -4.82    |
| fps                | 925      |
| nupdates           | 100500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 502500   |
| value_loss         | 0.000367 |
---------------------------------
---------------------------------
| explained_variance | 0.00749  |
| fps                | 925      |
| nupdates           | 100600   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -0.799   |
| fps                | 929      |
| nupdates           | 103400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 517000   |
| value_loss         | 5.28e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.307   |
| fps                | 929      |
| nupdates           | 103500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 517500   |
| value_loss         | 0.000357 |
---------------------------------
---------------------------------
| explained_variance | 0.355    |
| fps                | 929      |
| nupdates           | 103600   |
| policy_entropy     | 2.08     |
| total_timesteps    | 518000   |
| value_loss         | 0.000154 |
---------------------------------
---------------------------------
| explained_variance | 0.512    |
| fps                | 929      |
| nupdates           | 103700   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -50.9    |
| fps                | 927      |
| nupdates           | 106400   |
| policy_entropy     | 2.08     |
| total_timesteps    | 532000   |
| value_loss         | 0.00585  |
---------------------------------
---------------------------------
| explained_variance | -1.8     |
| fps                | 927      |
| nupdates           | 106500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 532500   |
| value_loss         | 0.000106 |
---------------------------------
---------------------------------
| explained_variance | 0.328    |
| fps                | 927      |
| nupdates           | 106600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 533000   |
| value_loss         | 0.195    |
---------------------------------
---------------------------------
| explained_variance | 0.297    |
| fps                | 928      |
| nupdates           | 106700   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.0981   |
| fps                | 931      |
| nupdates           | 109500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 547500   |
| value_loss         | 0.000131 |
---------------------------------
---------------------------------
| explained_variance | 0.652    |
| fps                | 931      |
| nupdates           | 109600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 548000   |
| value_loss         | 0.000221 |
---------------------------------
---------------------------------
| explained_variance | 0.92     |
| fps                | 931      |
| nupdates           | 109700   |
| policy_entropy     | 2.08     |
| total_timesteps    | 548500   |
| value_loss         | 0.00017  |
---------------------------------
---------------------------------
| explained_variance | -2.69    |
| fps                | 931      |
| nupdates           | 109800   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.603    |
| fps                | 930      |
| nupdates           | 112500   |
| policy_entropy     | 2.08     |
| total_timesteps    | 562500   |
| value_loss         | 9.56e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.23     |
| fps                | 930      |
| nupdates           | 112600   |
| policy_entropy     | 2.08     |
| total_timesteps    | 563000   |
| value_loss         | 0.000321 |
---------------------------------
---------------------------------
| explained_variance | 0.433    |
| fps                | 930      |
| nupdates           | 112700   |
| policy_entropy     | 2.08     |
| total_timesteps    | 563500   |
| value_loss         | 7.08e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.657    |
| fps                | 930      |
| nupdates           | 112800   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.851    |
| fps                | 928      |
| nupdates           | 115500   |
| policy_entropy     | 2.08     |
| total_timesteps    | 577500   |
| value_loss         | 1.3e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.0894   |
| fps                | 928      |
| nupdates           | 115600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 578000   |
| value_loss         | 0.000365 |
---------------------------------
---------------------------------
| explained_variance | 0.846    |
| fps                | 928      |
| nupdates           | 115700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 578500   |
| value_loss         | 5.2e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.644    |
| fps                | 928      |
| nupdates           | 115800   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.889    |
| fps                | 931      |
| nupdates           | 118600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 593000   |
| value_loss         | 8.15e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.6      |
| fps                | 931      |
| nupdates           | 118700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 593500   |
| value_loss         | 0.00017  |
---------------------------------
---------------------------------
| explained_variance | -4.66    |
| fps                | 931      |
| nupdates           | 118800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 594000   |
| value_loss         | 8.19e-05 |
---------------------------------
---------------------------------
| explained_variance | -3.07    |
| fps                | 931      |
| nupdates           | 118900   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.756   |
| fps                | 929      |
| nupdates           | 121600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 608000   |
| value_loss         | 0.000774 |
---------------------------------
---------------------------------
| explained_variance | -2.53    |
| fps                | 929      |
| nupdates           | 121700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 608500   |
| value_loss         | 4.64e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.822   |
| fps                | 929      |
| nupdates           | 121800   |
| policy_entropy     | 2.08     |
| total_timesteps    | 609000   |
| value_loss         | 0.00107  |
---------------------------------
---------------------------------
| explained_variance | 0.606    |
| fps                | 929      |
| nupdates           | 121900   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.992    |
| fps                | 933      |
| nupdates           | 124700   |
| policy_entropy     | 2.08     |
| total_timesteps    | 623500   |
| value_loss         | 1.76e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.592    |
| fps                | 933      |
| nupdates           | 124800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 624000   |
| value_loss         | 3.27e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.216    |
| fps                | 933      |
| nupdates           | 124900   |
| policy_entropy     | 2.08     |
| total_timesteps    | 624500   |
| value_loss         | 0.000246 |
---------------------------------
Eval num_timesteps=625000, episode_reward=-4.90 +/- 0.30
Episode length: 629.70 +/- 85.29
---------------------------------
| explained_variance | 0.554    |
| fps                | 928

---------------------------------
| explained_variance | -9.32    |
| fps                | 931      |
| nupdates           | 127700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 638500   |
| value_loss         | 0.000209 |
---------------------------------
---------------------------------
| explained_variance | 0.0542   |
| fps                | 931      |
| nupdates           | 127800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 639000   |
| value_loss         | 0.000349 |
---------------------------------
---------------------------------
| explained_variance | -0.319   |
| fps                | 931      |
| nupdates           | 127900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 639500   |
| value_loss         | 0.000509 |
---------------------------------
---------------------------------
| explained_variance | 0.0419   |
| fps                | 931      |
| nupdates           | 128000   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -3.19    |
| fps                | 929      |
| nupdates           | 130700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 653500   |
| value_loss         | 0.000305 |
---------------------------------
---------------------------------
| explained_variance | 0.89     |
| fps                | 929      |
| nupdates           | 130800   |
| policy_entropy     | 2.05     |
| total_timesteps    | 654000   |
| value_loss         | 3.47e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.571    |
| fps                | 929      |
| nupdates           | 130900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 654500   |
| value_loss         | 0.000152 |
---------------------------------
---------------------------------
| explained_variance | -2.35    |
| fps                | 929      |
| nupdates           | 131000   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -31      |
| fps                | 932      |
| nupdates           | 133800   |
| policy_entropy     | 2.04     |
| total_timesteps    | 669000   |
| value_loss         | 0.00197  |
---------------------------------
---------------------------------
| explained_variance | 0.95     |
| fps                | 932      |
| nupdates           | 133900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 669500   |
| value_loss         | 1.01e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.948    |
| fps                | 932      |
| nupdates           | 134000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 670000   |
| value_loss         | 5.22e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.987    |
| fps                | 932      |
| nupdates           | 134100   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -1.91    |
| fps                | 930      |
| nupdates           | 136800   |
| policy_entropy     | 2.05     |
| total_timesteps    | 684000   |
| value_loss         | 0.000186 |
---------------------------------
---------------------------------
| explained_variance | 0.771    |
| fps                | 930      |
| nupdates           | 136900   |
| policy_entropy     | 2.02     |
| total_timesteps    | 684500   |
| value_loss         | 0.00193  |
---------------------------------
---------------------------------
| explained_variance | 0.949    |
| fps                | 931      |
| nupdates           | 137000   |
| policy_entropy     | 1.99     |
| total_timesteps    | 685000   |
| value_loss         | 2.08e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.333   |
| fps                | 931      |
| nupdates           | 137100   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -0.766   |
| fps                | 933      |
| nupdates           | 139900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 699500   |
| value_loss         | 0.00018  |
---------------------------------
Eval num_timesteps=700000, episode_reward=-4.90 +/- 0.30
Episode length: 598.00 +/- 111.90
---------------------------------
| explained_variance | 0.201    |
| fps                | 929      |
| nupdates           | 140000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 700000   |
| value_loss         | 0.000495 |
---------------------------------
---------------------------------
| explained_variance | -0.147   |
| fps                | 929      |
| nupdates           | 140100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 700500   |
| value_loss         | 0.000215 |
---------------------------------
---------------------------------
| explained_variance | 0.917    |
| fps                | 92

---------------------------------
| explained_variance | -5.24    |
| fps                | 932      |
| nupdates           | 142900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 714500   |
| value_loss         | 0.0012   |
---------------------------------
---------------------------------
| explained_variance | 0.477    |
| fps                | 932      |
| nupdates           | 143000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 715000   |
| value_loss         | 9.27e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.0367   |
| fps                | 932      |
| nupdates           | 143100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 715500   |
| value_loss         | 0.000181 |
---------------------------------
---------------------------------
| explained_variance | -1.22    |
| fps                | 932      |
| nupdates           | 143200   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -11.4    |
| fps                | 931      |
| nupdates           | 145900   |
| policy_entropy     | 2.04     |
| total_timesteps    | 729500   |
| value_loss         | 0.00115  |
---------------------------------
---------------------------------
| explained_variance | -1.93    |
| fps                | 931      |
| nupdates           | 146000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 730000   |
| value_loss         | 1.36e-05 |
---------------------------------
---------------------------------
| explained_variance | -14.6    |
| fps                | 932      |
| nupdates           | 146100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 730500   |
| value_loss         | 0.000198 |
---------------------------------
---------------------------------
| explained_variance | 0.0294   |
| fps                | 932      |
| nupdates           | 146200   |
| policy_entropy     | 1.98     |
| total_timest

---------------------------------
| explained_variance | -7.02    |
| fps                | 934      |
| nupdates           | 149000   |
| policy_entropy     | 2.08     |
| total_timesteps    | 745000   |
| value_loss         | 0.00117  |
---------------------------------
---------------------------------
| explained_variance | -1.52    |
| fps                | 934      |
| nupdates           | 149100   |
| policy_entropy     | 2.05     |
| total_timesteps    | 745500   |
| value_loss         | 0.00181  |
---------------------------------
---------------------------------
| explained_variance | 0.0541   |
| fps                | 934      |
| nupdates           | 149200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 746000   |
| value_loss         | 0.000116 |
---------------------------------
---------------------------------
| explained_variance | 0.437    |
| fps                | 934      |
| nupdates           | 149300   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.623    |
| fps                | 932      |
| nupdates           | 152000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 760000   |
| value_loss         | 9.88e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.0183  |
| fps                | 933      |
| nupdates           | 152100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 760500   |
| value_loss         | 0.0001   |
---------------------------------
---------------------------------
| explained_variance | 0.437    |
| fps                | 933      |
| nupdates           | 152200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 761000   |
| value_loss         | 0.000137 |
---------------------------------
---------------------------------
| explained_variance | 0.889    |
| fps                | 933      |
| nupdates           | 152300   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.613    |
| fps                | 931      |
| nupdates           | 155100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 775500   |
| value_loss         | 1e-05    |
---------------------------------
---------------------------------
| explained_variance | -2.41    |
| fps                | 932      |
| nupdates           | 155200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 776000   |
| value_loss         | 0.000113 |
---------------------------------
---------------------------------
| explained_variance | 0.24     |
| fps                | 932      |
| nupdates           | 155300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 776500   |
| value_loss         | 5.74e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.993    |
| fps                | 932      |
| nupdates           | 155400   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.678    |
| fps                | 934      |
| nupdates           | 158200   |
| policy_entropy     | 2.08     |
| total_timesteps    | 791000   |
| value_loss         | 0.000864 |
---------------------------------
---------------------------------
| explained_variance | -11      |
| fps                | 934      |
| nupdates           | 158300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 791500   |
| value_loss         | 0.000432 |
---------------------------------
---------------------------------
| explained_variance | 0.845    |
| fps                | 934      |
| nupdates           | 158400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 792000   |
| value_loss         | 3.02e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.29    |
| fps                | 934      |
| nupdates           | 158500   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.921    |
| fps                | 933      |
| nupdates           | 161200   |
| policy_entropy     | 1.73     |
| total_timesteps    | 806000   |
| value_loss         | 0.955    |
---------------------------------
---------------------------------
| explained_variance | -1.56    |
| fps                | 933      |
| nupdates           | 161300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 806500   |
| value_loss         | 9.01e-05 |
---------------------------------
---------------------------------
| explained_variance | -6.23    |
| fps                | 934      |
| nupdates           | 161400   |
| policy_entropy     | 2.03     |
| total_timesteps    | 807000   |
| value_loss         | 0.0158   |
---------------------------------
---------------------------------
| explained_variance | 0.822    |
| fps                | 934      |
| nupdates           | 161500   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.698    |
| fps                | 936      |
| nupdates           | 164300   |
| policy_entropy     | 2.03     |
| total_timesteps    | 821500   |
| value_loss         | 0.000154 |
---------------------------------
----------------------------------
| explained_variance | -2.59e+03 |
| fps                | 936       |
| nupdates           | 164400    |
| policy_entropy     | 2.06      |
| total_timesteps    | 822000    |
| value_loss         | 0.0843    |
----------------------------------
---------------------------------
| explained_variance | 0.35     |
| fps                | 936      |
| nupdates           | 164500   |
| policy_entropy     | 2.08     |
| total_timesteps    | 822500   |
| value_loss         | 0.000285 |
---------------------------------
---------------------------------
| explained_variance | -0.867   |
| fps                | 936      |
| nupdates           | 164600   |
| policy_entropy     | 2.07     |
| tota

---------------------------------
| explained_variance | -0.104   |
| fps                | 934      |
| nupdates           | 167300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 836500   |
| value_loss         | 0.000349 |
---------------------------------
---------------------------------
| explained_variance | 0.793    |
| fps                | 934      |
| nupdates           | 167400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 837000   |
| value_loss         | 7.56e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.289   |
| fps                | 934      |
| nupdates           | 167500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 837500   |
| value_loss         | 0.000172 |
---------------------------------
---------------------------------
| explained_variance | 0.142    |
| fps                | 934      |
| nupdates           | 167600   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -1.35    |
| fps                | 933      |
| nupdates           | 170300   |
| policy_entropy     | 2.04     |
| total_timesteps    | 851500   |
| value_loss         | 0.00151  |
---------------------------------
---------------------------------
| explained_variance | -2.48    |
| fps                | 933      |
| nupdates           | 170400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 852000   |
| value_loss         | 0.000118 |
---------------------------------
---------------------------------
| explained_variance | 0.0887   |
| fps                | 933      |
| nupdates           | 170500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 852500   |
| value_loss         | 0.000282 |
---------------------------------
---------------------------------
| explained_variance | -0.169   |
| fps                | 933      |
| nupdates           | 170600   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -0.523   |
| fps                | 935      |
| nupdates           | 173400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 867000   |
| value_loss         | 4.34e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.37    |
| fps                | 935      |
| nupdates           | 173500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 867500   |
| value_loss         | 0.00184  |
---------------------------------
---------------------------------
| explained_variance | -2.14    |
| fps                | 935      |
| nupdates           | 173600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 868000   |
| value_loss         | 0.000771 |
---------------------------------
---------------------------------
| explained_variance | 0.163    |
| fps                | 935      |
| nupdates           | 173700   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -6.36    |
| fps                | 933      |
| nupdates           | 176400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 882000   |
| value_loss         | 0.00108  |
---------------------------------
---------------------------------
| explained_variance | 0.939    |
| fps                | 933      |
| nupdates           | 176500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 882500   |
| value_loss         | 2.46e-05 |
---------------------------------
---------------------------------
| explained_variance | -34.2    |
| fps                | 934      |
| nupdates           | 176600   |
| policy_entropy     | 2.05     |
| total_timesteps    | 883000   |
| value_loss         | 0.00155  |
---------------------------------
---------------------------------
| explained_variance | -0.0322  |
| fps                | 934      |
| nupdates           | 176700   |
| policy_entropy     | 2.02     |
| total_timest

---------------------------------
| explained_variance | -6.48    |
| fps                | 936      |
| nupdates           | 179500   |
| policy_entropy     | 2.04     |
| total_timesteps    | 897500   |
| value_loss         | 8.4e-05  |
---------------------------------
---------------------------------
| explained_variance | -11.8    |
| fps                | 936      |
| nupdates           | 179600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 898000   |
| value_loss         | 0.000193 |
---------------------------------
---------------------------------
| explained_variance | 0.392    |
| fps                | 936      |
| nupdates           | 179700   |
| policy_entropy     | 1.98     |
| total_timesteps    | 898500   |
| value_loss         | 0.157    |
---------------------------------
---------------------------------
| explained_variance | 0.592    |
| fps                | 936      |
| nupdates           | 179800   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.606    |
| fps                | 935      |
| nupdates           | 182500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 912500   |
| value_loss         | 7.7e-05  |
---------------------------------
---------------------------------
| explained_variance | -1.46    |
| fps                | 935      |
| nupdates           | 182600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 913000   |
| value_loss         | 0.000197 |
---------------------------------
---------------------------------
| explained_variance | -2.23    |
| fps                | 935      |
| nupdates           | 182700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 913500   |
| value_loss         | 0.000165 |
---------------------------------
---------------------------------
| explained_variance | 0.354    |
| fps                | 935      |
| nupdates           | 182800   |
| policy_entropy     | 1.98     |
| total_timest

---------------------------------
| explained_variance | 0.786    |
| fps                | 934      |
| nupdates           | 185500   |
| policy_entropy     | 2.05     |
| total_timesteps    | 927500   |
| value_loss         | 0.000101 |
---------------------------------
---------------------------------
| explained_variance | -0.0837  |
| fps                | 934      |
| nupdates           | 185600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 928000   |
| value_loss         | 0.000448 |
---------------------------------
---------------------------------
| explained_variance | 0.44     |
| fps                | 934      |
| nupdates           | 185700   |
| policy_entropy     | 2.05     |
| total_timesteps    | 928500   |
| value_loss         | 0.00055  |
---------------------------------
---------------------------------
| explained_variance | -2.62    |
| fps                | 934      |
| nupdates           | 185800   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.819    |
| fps                | 936      |
| nupdates           | 188600   |
| policy_entropy     | 2        |
| total_timesteps    | 943000   |
| value_loss         | 6.79e-05 |
---------------------------------
---------------------------------
| explained_variance | -1e+03   |
| fps                | 936      |
| nupdates           | 188700   |
| policy_entropy     | 2.05     |
| total_timesteps    | 943500   |
| value_loss         | 0.0754   |
---------------------------------
---------------------------------
| explained_variance | 0.748    |
| fps                | 936      |
| nupdates           | 188800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 944000   |
| value_loss         | 0.000683 |
---------------------------------
---------------------------------
| explained_variance | -0.406   |
| fps                | 936      |
| nupdates           | 188900   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -1.18    |
| fps                | 935      |
| nupdates           | 191600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 958000   |
| value_loss         | 0.000568 |
---------------------------------
---------------------------------
| explained_variance | 0.326    |
| fps                | 935      |
| nupdates           | 191700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 958500   |
| value_loss         | 7.46e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.02    |
| fps                | 935      |
| nupdates           | 191800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 959000   |
| value_loss         | 7.48e-05 |
---------------------------------
---------------------------------
| explained_variance | -969     |
| fps                | 935      |
| nupdates           | 191900   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.696    |
| fps                | 937      |
| nupdates           | 194700   |
| policy_entropy     | 2.08     |
| total_timesteps    | 973500   |
| value_loss         | 7.55e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.313    |
| fps                | 937      |
| nupdates           | 194800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 974000   |
| value_loss         | 2.36e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.196    |
| fps                | 937      |
| nupdates           | 194900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 974500   |
| value_loss         | 0.000476 |
---------------------------------
Eval num_timesteps=975000, episode_reward=-4.70 +/- 0.46
Episode length: 607.30 +/- 154.23
---------------------------------
| explained_variance | 0.605    |
| fps                | 93

---------------------------------
| explained_variance | -0.156   |
| fps                | 936      |
| nupdates           | 197700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 988500   |
| value_loss         | 0.000267 |
---------------------------------
---------------------------------
| explained_variance | -2.58    |
| fps                | 936      |
| nupdates           | 197800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 989000   |
| value_loss         | 0.000616 |
---------------------------------
---------------------------------
| explained_variance | -1.13    |
| fps                | 936      |
| nupdates           | 197900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 989500   |
| value_loss         | 0.000134 |
---------------------------------
---------------------------------
| explained_variance | -0.436   |
| fps                | 937      |
| nupdates           | 198000   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -32.8    |
| fps                | 936      |
| nupdates           | 200700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1003500  |
| value_loss         | 0.00131  |
---------------------------------
---------------------------------
| explained_variance | 0.66     |
| fps                | 936      |
| nupdates           | 200800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1004000  |
| value_loss         | 8e-05    |
---------------------------------
---------------------------------
| explained_variance | 0.907    |
| fps                | 936      |
| nupdates           | 200900   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1004500  |
| value_loss         | 1.42e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.339    |
| fps                | 936      |
| nupdates           | 201000   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -0.156   |
| fps                | 938      |
| nupdates           | 203800   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1019000  |
| value_loss         | 8.07e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.278    |
| fps                | 938      |
| nupdates           | 203900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1019500  |
| value_loss         | 6.34e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.55    |
| fps                | 938      |
| nupdates           | 204000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1020000  |
| value_loss         | 0.000319 |
---------------------------------
---------------------------------
| explained_variance | 0.737    |
| fps                | 938      |
| nupdates           | 204100   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -4.09    |
| fps                | 937      |
| nupdates           | 206800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1034000  |
| value_loss         | 0.00222  |
---------------------------------
---------------------------------
| explained_variance | -0.842   |
| fps                | 937      |
| nupdates           | 206900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1034500  |
| value_loss         | 0.000264 |
---------------------------------
---------------------------------
| explained_variance | 0.586    |
| fps                | 937      |
| nupdates           | 207000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1035000  |
| value_loss         | 3.47e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.345    |
| fps                | 937      |
| nupdates           | 207100   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.159    |
| fps                | 939      |
| nupdates           | 209900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1049500  |
| value_loss         | 0.000762 |
---------------------------------
Eval num_timesteps=1050000, episode_reward=-4.60 +/- 0.66
Episode length: 612.20 +/- 67.48
---------------------------------
| explained_variance | 0.799    |
| fps                | 936      |
| nupdates           | 210000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1050000  |
| value_loss         | 3.39e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.774    |
| fps                | 936      |
| nupdates           | 210100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1050500  |
| value_loss         | 0.000111 |
---------------------------------
---------------------------------
| explained_variance | -20.9    |
| fps                | 93

---------------------------------
| explained_variance | 0.982    |
| fps                | 937      |
| nupdates           | 212900   |
| policy_entropy     | 2        |
| total_timesteps    | 1064500  |
| value_loss         | 3.49e-05 |
---------------------------------
---------------------------------
| explained_variance | -208     |
| fps                | 937      |
| nupdates           | 213000   |
| policy_entropy     | 2.03     |
| total_timesteps    | 1065000  |
| value_loss         | 0.0442   |
---------------------------------
---------------------------------
| explained_variance | -1.33    |
| fps                | 937      |
| nupdates           | 213100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1065500  |
| value_loss         | 4.12e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.274    |
| fps                | 937      |
| nupdates           | 213200   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -3.19    |
| fps                | 934      |
| nupdates           | 215900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1079500  |
| value_loss         | 0.00156  |
---------------------------------
---------------------------------
| explained_variance | -19      |
| fps                | 934      |
| nupdates           | 216000   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1080000  |
| value_loss         | 0.00106  |
---------------------------------
---------------------------------
| explained_variance | -0.247   |
| fps                | 934      |
| nupdates           | 216100   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1080500  |
| value_loss         | 0.000374 |
---------------------------------
---------------------------------
| explained_variance | 0.766    |
| fps                | 934      |
| nupdates           | 216200   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -196     |
| fps                | 935      |
| nupdates           | 219000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1095000  |
| value_loss         | 0.00499  |
---------------------------------
---------------------------------
| explained_variance | -2.79    |
| fps                | 935      |
| nupdates           | 219100   |
| policy_entropy     | 2.02     |
| total_timesteps    | 1095500  |
| value_loss         | 0.00189  |
---------------------------------
---------------------------------
| explained_variance | -10.7    |
| fps                | 935      |
| nupdates           | 219200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1096000  |
| value_loss         | 0.00025  |
---------------------------------
---------------------------------
| explained_variance | 0.988    |
| fps                | 935      |
| nupdates           | 219300   |
| policy_entropy     | 2.02     |
| total_timest

---------------------------------
| explained_variance | -3.91    |
| fps                | 932      |
| nupdates           | 222000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1110000  |
| value_loss         | 7.25e-05 |
---------------------------------
---------------------------------
| explained_variance | -7.46    |
| fps                | 932      |
| nupdates           | 222100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1110500  |
| value_loss         | 0.000765 |
---------------------------------
---------------------------------
| explained_variance | 0.653    |
| fps                | 932      |
| nupdates           | 222200   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1111000  |
| value_loss         | 0.000221 |
---------------------------------
---------------------------------
| explained_variance | 0.653    |
| fps                | 932      |
| nupdates           | 222300   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -3.66    |
| fps                | 930      |
| nupdates           | 225100   |
| policy_entropy     | 2.02     |
| total_timesteps    | 1125500  |
| value_loss         | 0.00127  |
---------------------------------
---------------------------------
| explained_variance | -7.26    |
| fps                | 931      |
| nupdates           | 225200   |
| policy_entropy     | 1.99     |
| total_timesteps    | 1126000  |
| value_loss         | 0.00296  |
---------------------------------
---------------------------------
| explained_variance | 0.168    |
| fps                | 931      |
| nupdates           | 225300   |
| policy_entropy     | 2.02     |
| total_timesteps    | 1126500  |
| value_loss         | 0.000412 |
---------------------------------
---------------------------------
| explained_variance | -5.08    |
| fps                | 931      |
| nupdates           | 225400   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.984    |
| fps                | 932      |
| nupdates           | 228200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1141000  |
| value_loss         | 1.56e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.99    |
| fps                | 932      |
| nupdates           | 228300   |
| policy_entropy     | 2.03     |
| total_timesteps    | 1141500  |
| value_loss         | 0.000123 |
---------------------------------
---------------------------------
| explained_variance | 0.735    |
| fps                | 932      |
| nupdates           | 228400   |
| policy_entropy     | 1.88     |
| total_timesteps    | 1142000  |
| value_loss         | 0.000288 |
---------------------------------
---------------------------------
| explained_variance | 0.264    |
| fps                | 932      |
| nupdates           | 228500   |
| policy_entropy     | 1.95     |
| total_timest

---------------------------------
| explained_variance | 0.691    |
| fps                | 929      |
| nupdates           | 231200   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1156000  |
| value_loss         | 4.72e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.67    |
| fps                | 930      |
| nupdates           | 231300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1156500  |
| value_loss         | 0.000137 |
---------------------------------
---------------------------------
| explained_variance | -2.65    |
| fps                | 930      |
| nupdates           | 231400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1157000  |
| value_loss         | 0.000332 |
---------------------------------
---------------------------------
| explained_variance | -2.67    |
| fps                | 930      |
| nupdates           | 231500   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.567    |
| fps                | 930      |
| nupdates           | 234300   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1171500  |
| value_loss         | 2.77e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.773   |
| fps                | 930      |
| nupdates           | 234400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1172000  |
| value_loss         | 6.05e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.417    |
| fps                | 930      |
| nupdates           | 234500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1172500  |
| value_loss         | 2.38e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.58    |
| fps                | 930      |
| nupdates           | 234600   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.505    |
| fps                | 928      |
| nupdates           | 237300   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1186500  |
| value_loss         | 0.000105 |
---------------------------------
---------------------------------
| explained_variance | 0.849    |
| fps                | 928      |
| nupdates           | 237400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1187000  |
| value_loss         | 0.000522 |
---------------------------------
---------------------------------
| explained_variance | 0.274    |
| fps                | 928      |
| nupdates           | 237500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1187500  |
| value_loss         | 0.000108 |
---------------------------------
---------------------------------
| explained_variance | 0.536    |
| fps                | 928      |
| nupdates           | 237600   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.0312  |
| fps                | 926      |
| nupdates           | 240300   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1201500  |
| value_loss         | 0.000536 |
---------------------------------
---------------------------------
| explained_variance | -2.17    |
| fps                | 926      |
| nupdates           | 240400   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1202000  |
| value_loss         | 5.47e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.39    |
| fps                | 926      |
| nupdates           | 240500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1202500  |
| value_loss         | 0.000667 |
---------------------------------
---------------------------------
| explained_variance | 0.742    |
| fps                | 926      |
| nupdates           | 240600   |
| policy_entropy     | 1.99     |
| total_timest

---------------------------------
| explained_variance | -2.61    |
| fps                | 927      |
| nupdates           | 243400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1217000  |
| value_loss         | 0.000616 |
---------------------------------
---------------------------------
| explained_variance | 0.809    |
| fps                | 927      |
| nupdates           | 243500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1217500  |
| value_loss         | 0.000193 |
---------------------------------
---------------------------------
| explained_variance | -1.47    |
| fps                | 927      |
| nupdates           | 243600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1218000  |
| value_loss         | 0.000158 |
---------------------------------
---------------------------------
| explained_variance | -0.0178  |
| fps                | 927      |
| nupdates           | 243700   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -1.52    |
| fps                | 926      |
| nupdates           | 246400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1232000  |
| value_loss         | 0.000901 |
---------------------------------
---------------------------------
| explained_variance | -0.649   |
| fps                | 926      |
| nupdates           | 246500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1232500  |
| value_loss         | 0.000112 |
---------------------------------
---------------------------------
| explained_variance | 0.159    |
| fps                | 926      |
| nupdates           | 246600   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1233000  |
| value_loss         | 0.00121  |
---------------------------------
---------------------------------
| explained_variance | 0.527    |
| fps                | 926      |
| nupdates           | 246700   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -5.06    |
| fps                | 927      |
| nupdates           | 249500   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1247500  |
| value_loss         | 0.00112  |
---------------------------------
---------------------------------
| explained_variance | 0.336    |
| fps                | 927      |
| nupdates           | 249600   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1248000  |
| value_loss         | 0.104    |
---------------------------------
---------------------------------
| explained_variance | 0.913    |
| fps                | 927      |
| nupdates           | 249700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1248500  |
| value_loss         | 5.83e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.0762   |
| fps                | 927      |
| nupdates           | 249800   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.305   |
| fps                | 926      |
| nupdates           | 252500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1262500  |
| value_loss         | 7.48e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.388    |
| fps                | 927      |
| nupdates           | 252600   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1263000  |
| value_loss         | 0.000118 |
---------------------------------
---------------------------------
| explained_variance | -0.595   |
| fps                | 927      |
| nupdates           | 252700   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1263500  |
| value_loss         | 9.75e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.898    |
| fps                | 927      |
| nupdates           | 252800   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.426    |
| fps                | 925      |
| nupdates           | 255500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1277500  |
| value_loss         | 0.000729 |
---------------------------------
---------------------------------
| explained_variance | 0.0752   |
| fps                | 925      |
| nupdates           | 255600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1278000  |
| value_loss         | 0.000285 |
---------------------------------
---------------------------------
| explained_variance | 0.98     |
| fps                | 925      |
| nupdates           | 255700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1278500  |
| value_loss         | 0.000167 |
---------------------------------
---------------------------------
| explained_variance | 0.428    |
| fps                | 925      |
| nupdates           | 255800   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.0388   |
| fps                | 926      |
| nupdates           | 258600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1293000  |
| value_loss         | 3.55e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.919    |
| fps                | 926      |
| nupdates           | 258700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1293500  |
| value_loss         | 5.44e-05 |
---------------------------------
---------------------------------
| explained_variance | -20.1    |
| fps                | 926      |
| nupdates           | 258800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1294000  |
| value_loss         | 0.000113 |
---------------------------------
---------------------------------
| explained_variance | -24.4    |
| fps                | 926      |
| nupdates           | 258900   |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | 0.462    |
| fps                | 925      |
| nupdates           | 261600   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1308000  |
| value_loss         | 0.000323 |
---------------------------------
---------------------------------
| explained_variance | -0.803   |
| fps                | 925      |
| nupdates           | 261700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1308500  |
| value_loss         | 0.000372 |
---------------------------------
---------------------------------
| explained_variance | 0.546    |
| fps                | 925      |
| nupdates           | 261800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1309000  |
| value_loss         | 6.67e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.72    |
| fps                | 925      |
| nupdates           | 261900   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.92     |
| fps                | 925      |
| nupdates           | 264700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1323500  |
| value_loss         | 0.000174 |
---------------------------------
---------------------------------
| explained_variance | -0.0631  |
| fps                | 925      |
| nupdates           | 264800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1324000  |
| value_loss         | 2.56e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.41    |
| fps                | 925      |
| nupdates           | 264900   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1324500  |
| value_loss         | 6.39e-05 |
---------------------------------
Eval num_timesteps=1325000, episode_reward=-5.00 +/- 0.00
Episode length: 536.50 +/- 80.40
---------------------------------
| explained_variance | 0.967    |
| fps                | 92

---------------------------------
| explained_variance | 0.657    |
| fps                | 924      |
| nupdates           | 267700   |
| policy_entropy     | 2.03     |
| total_timesteps    | 1338500  |
| value_loss         | 0.000941 |
---------------------------------
---------------------------------
| explained_variance | -0.194   |
| fps                | 924      |
| nupdates           | 267800   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1339000  |
| value_loss         | 0.000258 |
---------------------------------
---------------------------------
| explained_variance | -4.09    |
| fps                | 924      |
| nupdates           | 267900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1339500  |
| value_loss         | 0.000147 |
---------------------------------
---------------------------------
| explained_variance | -0.743   |
| fps                | 924      |
| nupdates           | 268000   |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | 0.909    |
| fps                | 923      |
| nupdates           | 270700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1353500  |
| value_loss         | 2.38e-06 |
---------------------------------
---------------------------------
| explained_variance | -10.4    |
| fps                | 923      |
| nupdates           | 270800   |
| policy_entropy     | 2.01     |
| total_timesteps    | 1354000  |
| value_loss         | 0.00084  |
---------------------------------
---------------------------------
| explained_variance | 0.803    |
| fps                | 923      |
| nupdates           | 270900   |
| policy_entropy     | 2.02     |
| total_timesteps    | 1354500  |
| value_loss         | 0.000455 |
---------------------------------
---------------------------------
| explained_variance | 0.189    |
| fps                | 923      |
| nupdates           | 271000   |
| policy_entropy     | 2.02     |
| total_timest

---------------------------------
| explained_variance | 0.895    |
| fps                | 924      |
| nupdates           | 273800   |
| policy_entropy     | 2.03     |
| total_timesteps    | 1369000  |
| value_loss         | 0.000532 |
---------------------------------
---------------------------------
| explained_variance | 0.989    |
| fps                | 924      |
| nupdates           | 273900   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1369500  |
| value_loss         | 5.75e-05 |
---------------------------------
---------------------------------
| explained_variance | -4.65    |
| fps                | 924      |
| nupdates           | 274000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1370000  |
| value_loss         | 0.00162  |
---------------------------------
---------------------------------
| explained_variance | 0.353    |
| fps                | 924      |
| nupdates           | 274100   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -3.94    |
| fps                | 924      |
| nupdates           | 276800   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1384000  |
| value_loss         | 3e-05    |
---------------------------------
---------------------------------
| explained_variance | 0.439    |
| fps                | 924      |
| nupdates           | 276900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1384500  |
| value_loss         | 0.000136 |
---------------------------------
---------------------------------
| explained_variance | -0.406   |
| fps                | 924      |
| nupdates           | 277000   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1385000  |
| value_loss         | 0.000195 |
---------------------------------
---------------------------------
| explained_variance | -3.38    |
| fps                | 924      |
| nupdates           | 277100   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -0.414   |
| fps                | 925      |
| nupdates           | 279900   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1399500  |
| value_loss         | 0.000433 |
---------------------------------
Eval num_timesteps=1400000, episode_reward=-4.90 +/- 0.30
Episode length: 555.80 +/- 88.60
---------------------------------
| explained_variance | -1.09    |
| fps                | 923      |
| nupdates           | 280000   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1400000  |
| value_loss         | 0.000682 |
---------------------------------
---------------------------------
| explained_variance | 0.964    |
| fps                | 923      |
| nupdates           | 280100   |
| policy_entropy     | 2.02     |
| total_timesteps    | 1400500  |
| value_loss         | 8.36e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.702    |
| fps                | 92

---------------------------------
| explained_variance | -5.06    |
| fps                | 924      |
| nupdates           | 282900   |
| policy_entropy     | 1.82     |
| total_timesteps    | 1414500  |
| value_loss         | 0.00243  |
---------------------------------
---------------------------------
| explained_variance | 0.239    |
| fps                | 924      |
| nupdates           | 283000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1415000  |
| value_loss         | 0.145    |
---------------------------------
---------------------------------
| explained_variance | -0.391   |
| fps                | 924      |
| nupdates           | 283100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1415500  |
| value_loss         | 0.000599 |
---------------------------------
---------------------------------
| explained_variance | 0.997    |
| fps                | 924      |
| nupdates           | 283200   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.975    |
| fps                | 923      |
| nupdates           | 285900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1429500  |
| value_loss         | 1.98e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.887    |
| fps                | 923      |
| nupdates           | 286000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1430000  |
| value_loss         | 0.000111 |
---------------------------------
---------------------------------
| explained_variance | 0.661    |
| fps                | 923      |
| nupdates           | 286100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1430500  |
| value_loss         | 0.000183 |
---------------------------------
---------------------------------
| explained_variance | 0.618    |
| fps                | 923      |
| nupdates           | 286200   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -1.9e+04 |
| fps                | 924      |
| nupdates           | 289000   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1445000  |
| value_loss         | 0.179    |
---------------------------------
---------------------------------
| explained_variance | 0.974    |
| fps                | 924      |
| nupdates           | 289100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1445500  |
| value_loss         | 9.76e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.23    |
| fps                | 924      |
| nupdates           | 289200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1446000  |
| value_loss         | 0.0142   |
---------------------------------
---------------------------------
| explained_variance | 0.359    |
| fps                | 924      |
| nupdates           | 289300   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.0956   |
| fps                | 922      |
| nupdates           | 292000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1460000  |
| value_loss         | 0.000973 |
---------------------------------
---------------------------------
| explained_variance | 0.161    |
| fps                | 922      |
| nupdates           | 292100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1460500  |
| value_loss         | 7.37e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.0343   |
| fps                | 922      |
| nupdates           | 292200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1461000  |
| value_loss         | 3.15e-05 |
---------------------------------
---------------------------------
| explained_variance | -7.98    |
| fps                | 922      |
| nupdates           | 292300   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.39     |
| fps                | 920      |
| nupdates           | 295100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1475500  |
| value_loss         | 8.57e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.752    |
| fps                | 920      |
| nupdates           | 295200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1476000  |
| value_loss         | 5.39e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.915    |
| fps                | 920      |
| nupdates           | 295300   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1476500  |
| value_loss         | 5.56e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.34     |
| fps                | 920      |
| nupdates           | 295400   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.945    |
| fps                | 920      |
| nupdates           | 298200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1491000  |
| value_loss         | 0.000112 |
---------------------------------
---------------------------------
| explained_variance | 0.669    |
| fps                | 920      |
| nupdates           | 298300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1491500  |
| value_loss         | 0.000887 |
---------------------------------
---------------------------------
| explained_variance | 0.519    |
| fps                | 920      |
| nupdates           | 298400   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1492000  |
| value_loss         | 0.000179 |
---------------------------------
---------------------------------
| explained_variance | 0.37     |
| fps                | 920      |
| nupdates           | 298500   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | -1.26    |
| fps                | 918      |
| nupdates           | 301200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1506000  |
| value_loss         | 0.000267 |
---------------------------------
---------------------------------
| explained_variance | -3.07    |
| fps                | 918      |
| nupdates           | 301300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1506500  |
| value_loss         | 8.14e-05 |
---------------------------------
---------------------------------
| explained_variance | -9.89    |
| fps                | 918      |
| nupdates           | 301400   |
| policy_entropy     | 2.03     |
| total_timesteps    | 1507000  |
| value_loss         | 0.00106  |
---------------------------------
---------------------------------
| explained_variance | 0.952    |
| fps                | 918      |
| nupdates           | 301500   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.0291  |
| fps                | 917      |
| nupdates           | 304300   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1521500  |
| value_loss         | 4.58e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.334    |
| fps                | 917      |
| nupdates           | 304400   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1522000  |
| value_loss         | 1.69e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.5      |
| fps                | 917      |
| nupdates           | 304500   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1522500  |
| value_loss         | 4.01e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.619    |
| fps                | 917      |
| nupdates           | 304600   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.174    |
| fps                | 916      |
| nupdates           | 307300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1536500  |
| value_loss         | 2.23e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.794    |
| fps                | 916      |
| nupdates           | 307400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1537000  |
| value_loss         | 3.57e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.65    |
| fps                | 916      |
| nupdates           | 307500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1537500  |
| value_loss         | 7.53e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.455    |
| fps                | 916      |
| nupdates           | 307600   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.442   |
| fps                | 915      |
| nupdates           | 310300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1551500  |
| value_loss         | 0.000281 |
---------------------------------
---------------------------------
| explained_variance | 0.28     |
| fps                | 915      |
| nupdates           | 310400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1552000  |
| value_loss         | 8.89e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.986    |
| fps                | 915      |
| nupdates           | 310500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1552500  |
| value_loss         | 1.51e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.995    |
| fps                | 915      |
| nupdates           | 310600   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.367    |
| fps                | 916      |
| nupdates           | 313400   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1567000  |
| value_loss         | 7.02e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.43     |
| fps                | 916      |
| nupdates           | 313500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1567500  |
| value_loss         | 1.9e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.828    |
| fps                | 916      |
| nupdates           | 313600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1568000  |
| value_loss         | 5.18e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.75    |
| fps                | 916      |
| nupdates           | 313700   |
| policy_entropy     | 1.93     |
| total_timest

---------------------------------
| explained_variance | -5.42    |
| fps                | 915      |
| nupdates           | 316400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1582000  |
| value_loss         | 0.00107  |
---------------------------------
---------------------------------
| explained_variance | -17.2    |
| fps                | 915      |
| nupdates           | 316500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1582500  |
| value_loss         | 0.000887 |
---------------------------------
---------------------------------
| explained_variance | 0.508    |
| fps                | 915      |
| nupdates           | 316600   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1583000  |
| value_loss         | 3.94e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.986    |
| fps                | 915      |
| nupdates           | 316700   |
| policy_entropy     | 2.03     |
| total_timest

---------------------------------
| explained_variance | -0.504   |
| fps                | 916      |
| nupdates           | 319500   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1597500  |
| value_loss         | 0.000482 |
---------------------------------
---------------------------------
| explained_variance | 0.474    |
| fps                | 917      |
| nupdates           | 319600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1598000  |
| value_loss         | 0.000187 |
---------------------------------
---------------------------------
| explained_variance | 0.435    |
| fps                | 917      |
| nupdates           | 319700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1598500  |
| value_loss         | 0.000412 |
---------------------------------
---------------------------------
| explained_variance | -0.324   |
| fps                | 917      |
| nupdates           | 319800   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.89     |
| fps                | 915      |
| nupdates           | 322500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1612500  |
| value_loss         | 6.12e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.502   |
| fps                | 915      |
| nupdates           | 322600   |
| policy_entropy     | 1.98     |
| total_timesteps    | 1613000  |
| value_loss         | 0.000289 |
---------------------------------
---------------------------------
| explained_variance | 0.0471   |
| fps                | 915      |
| nupdates           | 322700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1613500  |
| value_loss         | 2.64e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.09    |
| fps                | 915      |
| nupdates           | 322800   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.759    |
| fps                | 914      |
| nupdates           | 325500   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1627500  |
| value_loss         | 0.000158 |
---------------------------------
---------------------------------
| explained_variance | -2.38    |
| fps                | 914      |
| nupdates           | 325600   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1628000  |
| value_loss         | 0.000339 |
---------------------------------
---------------------------------
| explained_variance | 0.123    |
| fps                | 914      |
| nupdates           | 325700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1628500  |
| value_loss         | 0.000105 |
---------------------------------
---------------------------------
| explained_variance | 0.997    |
| fps                | 914      |
| nupdates           | 325800   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.592    |
| fps                | 915      |
| nupdates           | 328600   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1643000  |
| value_loss         | 0.000143 |
---------------------------------
---------------------------------
| explained_variance | -0.148   |
| fps                | 915      |
| nupdates           | 328700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1643500  |
| value_loss         | 0.00115  |
---------------------------------
---------------------------------
| explained_variance | -0.22    |
| fps                | 915      |
| nupdates           | 328800   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1644000  |
| value_loss         | 1.64e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.317    |
| fps                | 915      |
| nupdates           | 328900   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | 0.924    |
| fps                | 914      |
| nupdates           | 331600   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1658000  |
| value_loss         | 0.000187 |
---------------------------------
---------------------------------
| explained_variance | 0.887    |
| fps                | 914      |
| nupdates           | 331700   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1658500  |
| value_loss         | 4.11e-05 |
---------------------------------
---------------------------------
| explained_variance | -81.1    |
| fps                | 914      |
| nupdates           | 331800   |
| policy_entropy     | 2.01     |
| total_timesteps    | 1659000  |
| value_loss         | 0.00424  |
---------------------------------
---------------------------------
| explained_variance | -1.27    |
| fps                | 914      |
| nupdates           | 331900   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -0.137   |
| fps                | 915      |
| nupdates           | 334700   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1673500  |
| value_loss         | 0.000316 |
---------------------------------
---------------------------------
| explained_variance | -56.7    |
| fps                | 915      |
| nupdates           | 334800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1674000  |
| value_loss         | 0.00102  |
---------------------------------
---------------------------------
| explained_variance | 0.0658   |
| fps                | 915      |
| nupdates           | 334900   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1674500  |
| value_loss         | 0.000297 |
---------------------------------
Eval num_timesteps=1675000, episode_reward=-4.80 +/- 0.40
Episode length: 625.80 +/- 104.17
---------------------------------
| explained_variance | 0.832    |
| fps                | 9

---------------------------------
| explained_variance | 0.204    |
| fps                | 914      |
| nupdates           | 337700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1688500  |
| value_loss         | 0.000151 |
---------------------------------
---------------------------------
| explained_variance | 0.862    |
| fps                | 914      |
| nupdates           | 337800   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1689000  |
| value_loss         | 0.000189 |
---------------------------------
---------------------------------
| explained_variance | 0.997    |
| fps                | 914      |
| nupdates           | 337900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1689500  |
| value_loss         | 9.59e-07 |
---------------------------------
---------------------------------
| explained_variance | -2.03    |
| fps                | 914      |
| nupdates           | 338000   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -1.2     |
| fps                | 913      |
| nupdates           | 340700   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1703500  |
| value_loss         | 9.43e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.177   |
| fps                | 913      |
| nupdates           | 340800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1704000  |
| value_loss         | 0.000205 |
---------------------------------
---------------------------------
| explained_variance | 0.91     |
| fps                | 913      |
| nupdates           | 340900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1704500  |
| value_loss         | 1.06e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.424    |
| fps                | 913      |
| nupdates           | 341000   |
| policy_entropy     | 1.95     |
| total_timest

---------------------------------
| explained_variance | -1.77    |
| fps                | 914      |
| nupdates           | 343800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1719000  |
| value_loss         | 0.000594 |
---------------------------------
---------------------------------
| explained_variance | -4.12    |
| fps                | 914      |
| nupdates           | 343900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1719500  |
| value_loss         | 0.00196  |
---------------------------------
---------------------------------
| explained_variance | -18.9    |
| fps                | 914      |
| nupdates           | 344000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1720000  |
| value_loss         | 0.00403  |
---------------------------------
---------------------------------
| explained_variance | -40.5    |
| fps                | 914      |
| nupdates           | 344100   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | -0.151   |
| fps                | 913      |
| nupdates           | 346800   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1734000  |
| value_loss         | 4.21e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.867   |
| fps                | 913      |
| nupdates           | 346900   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1734500  |
| value_loss         | 0.00133  |
---------------------------------
---------------------------------
| explained_variance | 0.845    |
| fps                | 914      |
| nupdates           | 347000   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1735000  |
| value_loss         | 0.000105 |
---------------------------------
---------------------------------
| explained_variance | 0.706    |
| fps                | 914      |
| nupdates           | 347100   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -2.78    |
| fps                | 915      |
| nupdates           | 349900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1749500  |
| value_loss         | 0.00168  |
---------------------------------
Eval num_timesteps=1750000, episode_reward=-4.80 +/- 0.40
Episode length: 542.90 +/- 37.28
---------------------------------
| explained_variance | 0.131    |
| fps                | 913      |
| nupdates           | 350000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1750000  |
| value_loss         | 0.000171 |
---------------------------------
---------------------------------
| explained_variance | -0.103   |
| fps                | 913      |
| nupdates           | 350100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1750500  |
| value_loss         | 0.000443 |
---------------------------------
---------------------------------
| explained_variance | 0.203    |
| fps                | 91

---------------------------------
| explained_variance | -1.51    |
| fps                | 914      |
| nupdates           | 352900   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1764500  |
| value_loss         | 0.000226 |
---------------------------------
---------------------------------
| explained_variance | -0.0181  |
| fps                | 914      |
| nupdates           | 353000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1765000  |
| value_loss         | 0.16     |
---------------------------------
---------------------------------
| explained_variance | 0.0372   |
| fps                | 914      |
| nupdates           | 353100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1765500  |
| value_loss         | 0.000257 |
---------------------------------
---------------------------------
| explained_variance | -58.9    |
| fps                | 914      |
| nupdates           | 353200   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.133   |
| fps                | 914      |
| nupdates           | 355900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1779500  |
| value_loss         | 1.42e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.751    |
| fps                | 914      |
| nupdates           | 356000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1780000  |
| value_loss         | 4.72e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.644    |
| fps                | 914      |
| nupdates           | 356100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1780500  |
| value_loss         | 8.18e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.583   |
| fps                | 914      |
| nupdates           | 356200   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -9.84    |
| fps                | 915      |
| nupdates           | 359000   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1795000  |
| value_loss         | 0.000116 |
---------------------------------
---------------------------------
| explained_variance | 0.666    |
| fps                | 915      |
| nupdates           | 359100   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1795500  |
| value_loss         | 5.52e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.0564   |
| fps                | 915      |
| nupdates           | 359200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1796000  |
| value_loss         | 0.000318 |
---------------------------------
---------------------------------
| explained_variance | -8.03    |
| fps                | 915      |
| nupdates           | 359300   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.318    |
| fps                | 915      |
| nupdates           | 362000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1810000  |
| value_loss         | 0.00011  |
---------------------------------
---------------------------------
| explained_variance | 0.991    |
| fps                | 915      |
| nupdates           | 362100   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1810500  |
| value_loss         | 0.000584 |
---------------------------------
---------------------------------
| explained_variance | -0.503   |
| fps                | 915      |
| nupdates           | 362200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1811000  |
| value_loss         | 0.00013  |
---------------------------------
---------------------------------
| explained_variance | 0.472    |
| fps                | 915      |
| nupdates           | 362300   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -33.4    |
| fps                | 913      |
| nupdates           | 365100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1825500  |
| value_loss         | 0.000687 |
---------------------------------
---------------------------------
| explained_variance | -1.56    |
| fps                | 913      |
| nupdates           | 365200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1826000  |
| value_loss         | 0.000147 |
---------------------------------
---------------------------------
| explained_variance | -1.69    |
| fps                | 913      |
| nupdates           | 365300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1826500  |
| value_loss         | 0.000259 |
---------------------------------
---------------------------------
| explained_variance | 0.257    |
| fps                | 914      |
| nupdates           | 365400   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.232   |
| fps                | 915      |
| nupdates           | 368200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1841000  |
| value_loss         | 3.07e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.622    |
| fps                | 915      |
| nupdates           | 368300   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1841500  |
| value_loss         | 0.000532 |
---------------------------------
---------------------------------
| explained_variance | 0.645    |
| fps                | 915      |
| nupdates           | 368400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1842000  |
| value_loss         | 0.000214 |
---------------------------------
---------------------------------
| explained_variance | 0.00337  |
| fps                | 914      |
| nupdates           | 368500   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.941    |
| fps                | 913      |
| nupdates           | 371200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1856000  |
| value_loss         | 2.56e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.307    |
| fps                | 913      |
| nupdates           | 371300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1856500  |
| value_loss         | 0.000206 |
---------------------------------
---------------------------------
| explained_variance | -1.82    |
| fps                | 913      |
| nupdates           | 371400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1857000  |
| value_loss         | 0.000769 |
---------------------------------
---------------------------------
| explained_variance | 0.883    |
| fps                | 913      |
| nupdates           | 371500   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.37     |
| fps                | 914      |
| nupdates           | 374300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1871500  |
| value_loss         | 0.147    |
---------------------------------
---------------------------------
| explained_variance | 0.937    |
| fps                | 914      |
| nupdates           | 374400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1872000  |
| value_loss         | 8.36e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.559    |
| fps                | 914      |
| nupdates           | 374500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1872500  |
| value_loss         | 0.000176 |
---------------------------------
---------------------------------
| explained_variance | 0.903    |
| fps                | 914      |
| nupdates           | 374600   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -0.727   |
| fps                | 913      |
| nupdates           | 377300   |
| policy_entropy     | 2.08     |
| total_timesteps    | 1886500  |
| value_loss         | 6.18e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.928    |
| fps                | 913      |
| nupdates           | 377400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1887000  |
| value_loss         | 9.27e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.991    |
| fps                | 913      |
| nupdates           | 377500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1887500  |
| value_loss         | 2.57e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.563    |
| fps                | 913      |
| nupdates           | 377600   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.667    |
| fps                | 913      |
| nupdates           | 380300   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1901500  |
| value_loss         | 5.31e-05 |
---------------------------------
---------------------------------
| explained_variance | -4.65    |
| fps                | 913      |
| nupdates           | 380400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1902000  |
| value_loss         | 0.00269  |
---------------------------------
---------------------------------
| explained_variance | -0.317   |
| fps                | 913      |
| nupdates           | 380500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1902500  |
| value_loss         | 6.14e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.944    |
| fps                | 913      |
| nupdates           | 380600   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.64     |
| fps                | 914      |
| nupdates           | 383400   |
| policy_entropy     | 2.02     |
| total_timesteps    | 1917000  |
| value_loss         | 9.3e-05  |
---------------------------------
---------------------------------
| explained_variance | -1.28    |
| fps                | 914      |
| nupdates           | 383500   |
| policy_entropy     | 1.98     |
| total_timesteps    | 1917500  |
| value_loss         | 0.000392 |
---------------------------------
---------------------------------
| explained_variance | -1.35    |
| fps                | 914      |
| nupdates           | 383600   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1918000  |
| value_loss         | 0.000157 |
---------------------------------
---------------------------------
| explained_variance | -2.2     |
| fps                | 914      |
| nupdates           | 383700   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.838    |
| fps                | 913      |
| nupdates           | 386400   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1932000  |
| value_loss         | 2.44e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.701    |
| fps                | 913      |
| nupdates           | 386500   |
| policy_entropy     | 2.05     |
| total_timesteps    | 1932500  |
| value_loss         | 3.99e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.643    |
| fps                | 913      |
| nupdates           | 386600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1933000  |
| value_loss         | 0.000564 |
---------------------------------
---------------------------------
| explained_variance | 0.998    |
| fps                | 913      |
| nupdates           | 386700   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -7.22    |
| fps                | 914      |
| nupdates           | 389500   |
| policy_entropy     | 2.03     |
| total_timesteps    | 1947500  |
| value_loss         | 0.00329  |
---------------------------------
---------------------------------
| explained_variance | -0.214   |
| fps                | 914      |
| nupdates           | 389600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1948000  |
| value_loss         | 0.000191 |
---------------------------------
---------------------------------
| explained_variance | -1.63    |
| fps                | 914      |
| nupdates           | 389700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1948500  |
| value_loss         | 0.00337  |
---------------------------------
---------------------------------
| explained_variance | -4.39    |
| fps                | 914      |
| nupdates           | 389800   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.955    |
| fps                | 913      |
| nupdates           | 392500   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1962500  |
| value_loss         | 3.66e-05 |
---------------------------------
----------------------------------
| explained_variance | -7.49e+03 |
| fps                | 913       |
| nupdates           | 392600    |
| policy_entropy     | 2.05      |
| total_timesteps    | 1963000   |
| value_loss         | 0.136     |
----------------------------------
---------------------------------
| explained_variance | 0.951    |
| fps                | 913      |
| nupdates           | 392700   |
| policy_entropy     | 2.04     |
| total_timesteps    | 1963500  |
| value_loss         | 0.000103 |
---------------------------------
---------------------------------
| explained_variance | -0.746   |
| fps                | 914      |
| nupdates           | 392800   |
| policy_entropy     | 2.06     |
| tota

---------------------------------
| explained_variance | 0.902    |
| fps                | 912      |
| nupdates           | 395500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1977500  |
| value_loss         | 9.96e-05 |
---------------------------------
---------------------------------
| explained_variance | -13.5    |
| fps                | 912      |
| nupdates           | 395600   |
| policy_entropy     | 1.98     |
| total_timesteps    | 1978000  |
| value_loss         | 0.00471  |
---------------------------------
---------------------------------
| explained_variance | -17.2    |
| fps                | 912      |
| nupdates           | 395700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 1978500  |
| value_loss         | 0.00415  |
---------------------------------
---------------------------------
| explained_variance | 0.996    |
| fps                | 912      |
| nupdates           | 395800   |
| policy_entropy     | 1.97     |
| total_timest

---------------------------------
| explained_variance | 0.999    |
| fps                | 913      |
| nupdates           | 398600   |
| policy_entropy     | 1.97     |
| total_timesteps    | 1993000  |
| value_loss         | 3.85e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.132    |
| fps                | 913      |
| nupdates           | 398700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1993500  |
| value_loss         | 6.82e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.321   |
| fps                | 913      |
| nupdates           | 398800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 1994000  |
| value_loss         | 0.000132 |
---------------------------------
---------------------------------
| explained_variance | 0.877    |
| fps                | 913      |
| nupdates           | 398900   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.912    |
| fps                | 912      |
| nupdates           | 401600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2008000  |
| value_loss         | 2.99e-06 |
---------------------------------
---------------------------------
| explained_variance | -0.611   |
| fps                | 912      |
| nupdates           | 401700   |
| policy_entropy     | 2.02     |
| total_timesteps    | 2008500  |
| value_loss         | 0.00093  |
---------------------------------
---------------------------------
| explained_variance | 0.593    |
| fps                | 912      |
| nupdates           | 401800   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2009000  |
| value_loss         | 2.96e-05 |
---------------------------------
---------------------------------
| explained_variance | -3.78    |
| fps                | 912      |
| nupdates           | 401900   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.043    |
| fps                | 913      |
| nupdates           | 404700   |
| policy_entropy     | 2.02     |
| total_timesteps    | 2023500  |
| value_loss         | 0.00152  |
---------------------------------
---------------------------------
| explained_variance | 0.0236   |
| fps                | 913      |
| nupdates           | 404800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2024000  |
| value_loss         | 1.01e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.0964   |
| fps                | 913      |
| nupdates           | 404900   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2024500  |
| value_loss         | 8.21e-05 |
---------------------------------
Eval num_timesteps=2025000, episode_reward=-4.90 +/- 0.30
Episode length: 627.10 +/- 154.50
---------------------------------
| explained_variance | -0.254   |
| fps                | 9

---------------------------------
| explained_variance | -1.09    |
| fps                | 911      |
| nupdates           | 407700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2038500  |
| value_loss         | 4.06e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.475    |
| fps                | 911      |
| nupdates           | 407800   |
| policy_entropy     | 2        |
| total_timesteps    | 2039000  |
| value_loss         | 0.000116 |
---------------------------------
---------------------------------
| explained_variance | 0.279    |
| fps                | 911      |
| nupdates           | 407900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2039500  |
| value_loss         | 0.000357 |
---------------------------------
---------------------------------
| explained_variance | -1.06    |
| fps                | 911      |
| nupdates           | 408000   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.83     |
| fps                | 909      |
| nupdates           | 410700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2053500  |
| value_loss         | 0.00023  |
---------------------------------
---------------------------------
| explained_variance | -0.715   |
| fps                | 909      |
| nupdates           | 410800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2054000  |
| value_loss         | 0.000374 |
---------------------------------
---------------------------------
| explained_variance | -6.97    |
| fps                | 909      |
| nupdates           | 410900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2054500  |
| value_loss         | 0.000625 |
---------------------------------
---------------------------------
| explained_variance | -892     |
| fps                | 909      |
| nupdates           | 411000   |
| policy_entropy     | 1.89     |
| total_timest

---------------------------------
| explained_variance | 0.236    |
| fps                | 909      |
| nupdates           | 413800   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2069000  |
| value_loss         | 8.19e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.993    |
| fps                | 909      |
| nupdates           | 413900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2069500  |
| value_loss         | 2.29e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.868    |
| fps                | 909      |
| nupdates           | 414000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2070000  |
| value_loss         | 9.19e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.0195  |
| fps                | 909      |
| nupdates           | 414100   |
| policy_entropy     | 1.93     |
| total_timest

---------------------------------
| explained_variance | -22.1    |
| fps                | 907      |
| nupdates           | 416800   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2084000  |
| value_loss         | 0.000611 |
---------------------------------
---------------------------------
| explained_variance | -0.409   |
| fps                | 907      |
| nupdates           | 416900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2084500  |
| value_loss         | 0.000238 |
---------------------------------
---------------------------------
| explained_variance | 0.661    |
| fps                | 907      |
| nupdates           | 417000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2085000  |
| value_loss         | 3.6e-05  |
---------------------------------
---------------------------------
| explained_variance | 0.862    |
| fps                | 907      |
| nupdates           | 417100   |
| policy_entropy     | 1.96     |
| total_timest

---------------------------------
| explained_variance | 0.654    |
| fps                | 907      |
| nupdates           | 419900   |
| policy_entropy     | 2.03     |
| total_timesteps    | 2099500  |
| value_loss         | 2.09e-05 |
---------------------------------
Eval num_timesteps=2100000, episode_reward=-4.80 +/- 0.40
Episode length: 629.90 +/- 98.77
---------------------------------
| explained_variance | 0.627    |
| fps                | 906      |
| nupdates           | 420000   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2100000  |
| value_loss         | 3.68e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.92    |
| fps                | 906      |
| nupdates           | 420100   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2100500  |
| value_loss         | 2.77e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.15    |
| fps                | 90

---------------------------------
| explained_variance | -2.42    |
| fps                | 906      |
| nupdates           | 422900   |
| policy_entropy     | 2.04     |
| total_timesteps    | 2114500  |
| value_loss         | 0.000398 |
---------------------------------
---------------------------------
| explained_variance | -3.85    |
| fps                | 906      |
| nupdates           | 423000   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2115000  |
| value_loss         | 0.000779 |
---------------------------------
---------------------------------
| explained_variance | 0.452    |
| fps                | 905      |
| nupdates           | 423100   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2115500  |
| value_loss         | 0.000248 |
---------------------------------
---------------------------------
| explained_variance | -0.593   |
| fps                | 905      |
| nupdates           | 423200   |
| policy_entropy     | 2.04     |
| total_timest

---------------------------------
| explained_variance | 0.312    |
| fps                | 903      |
| nupdates           | 425900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2129500  |
| value_loss         | 0.000116 |
---------------------------------
---------------------------------
| explained_variance | 0.881    |
| fps                | 903      |
| nupdates           | 426000   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2130000  |
| value_loss         | 9.04e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.021   |
| fps                | 903      |
| nupdates           | 426100   |
| policy_entropy     | 1.8      |
| total_timesteps    | 2130500  |
| value_loss         | 0.403    |
---------------------------------
---------------------------------
| explained_variance | 0.612    |
| fps                | 903      |
| nupdates           | 426200   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.662    |
| fps                | 903      |
| nupdates           | 429000   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2145000  |
| value_loss         | 2.88e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.983    |
| fps                | 903      |
| nupdates           | 429100   |
| policy_entropy     | 2.04     |
| total_timesteps    | 2145500  |
| value_loss         | 2.25e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.377    |
| fps                | 903      |
| nupdates           | 429200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2146000  |
| value_loss         | 3.32e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.983    |
| fps                | 903      |
| nupdates           | 429300   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -6.62    |
| fps                | 902      |
| nupdates           | 432000   |
| policy_entropy     | 2.03     |
| total_timesteps    | 2160000  |
| value_loss         | 0.000327 |
---------------------------------
---------------------------------
| explained_variance | -3.41    |
| fps                | 902      |
| nupdates           | 432100   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2160500  |
| value_loss         | 0.00113  |
---------------------------------
---------------------------------
| explained_variance | -2.78    |
| fps                | 902      |
| nupdates           | 432200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2161000  |
| value_loss         | 0.00023  |
---------------------------------
---------------------------------
| explained_variance | 0.667    |
| fps                | 902      |
| nupdates           | 432300   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.736    |
| fps                | 900      |
| nupdates           | 435100   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2175500  |
| value_loss         | 6.76e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.795    |
| fps                | 900      |
| nupdates           | 435200   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2176000  |
| value_loss         | 4.8e-05  |
---------------------------------
---------------------------------
| explained_variance | -0.295   |
| fps                | 900      |
| nupdates           | 435300   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2176500  |
| value_loss         | 0.000432 |
---------------------------------
---------------------------------
| explained_variance | -0.00521 |
| fps                | 900      |
| nupdates           | 435400   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.706    |
| fps                | 900      |
| nupdates           | 438200   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2191000  |
| value_loss         | 6.01e-06 |
---------------------------------
---------------------------------
| explained_variance | -5.61    |
| fps                | 900      |
| nupdates           | 438300   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2191500  |
| value_loss         | 0.000236 |
---------------------------------
---------------------------------
| explained_variance | 0.966    |
| fps                | 900      |
| nupdates           | 438400   |
| policy_entropy     | 2.03     |
| total_timesteps    | 2192000  |
| value_loss         | 1.09e-05 |
---------------------------------
---------------------------------
| explained_variance | -2.95    |
| fps                | 900      |
| nupdates           | 438500   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -4.34    |
| fps                | 899      |
| nupdates           | 441200   |
| policy_entropy     | 2.04     |
| total_timesteps    | 2206000  |
| value_loss         | 0.000107 |
---------------------------------
---------------------------------
| explained_variance | 0.466    |
| fps                | 899      |
| nupdates           | 441300   |
| policy_entropy     | 2.04     |
| total_timesteps    | 2206500  |
| value_loss         | 4.95e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.239   |
| fps                | 899      |
| nupdates           | 441400   |
| policy_entropy     | 2.04     |
| total_timesteps    | 2207000  |
| value_loss         | 0.000226 |
---------------------------------
---------------------------------
| explained_variance | 0.629    |
| fps                | 899      |
| nupdates           | 441500   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.677    |
| fps                | 899      |
| nupdates           | 444300   |
| policy_entropy     | 2.02     |
| total_timesteps    | 2221500  |
| value_loss         | 6.95e-05 |
---------------------------------
---------------------------------
| explained_variance | -3.02    |
| fps                | 899      |
| nupdates           | 444400   |
| policy_entropy     | 2.03     |
| total_timesteps    | 2222000  |
| value_loss         | 0.00195  |
---------------------------------
---------------------------------
| explained_variance | 0.618    |
| fps                | 899      |
| nupdates           | 444500   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2222500  |
| value_loss         | 0.000161 |
---------------------------------
---------------------------------
| explained_variance | 0.671    |
| fps                | 899      |
| nupdates           | 444600   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.63     |
| fps                | 897      |
| nupdates           | 447300   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2236500  |
| value_loss         | 8.04e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.572    |
| fps                | 897      |
| nupdates           | 447400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2237000  |
| value_loss         | 0.000108 |
---------------------------------
---------------------------------
| explained_variance | 0.589    |
| fps                | 897      |
| nupdates           | 447500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2237500  |
| value_loss         | 0.000222 |
---------------------------------
---------------------------------
| explained_variance | -1.41    |
| fps                | 897      |
| nupdates           | 447600   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | -11.3    |
| fps                | 895      |
| nupdates           | 450300   |
| policy_entropy     | 2.05     |
| total_timesteps    | 2251500  |
| value_loss         | 0.00259  |
---------------------------------
---------------------------------
| explained_variance | 0.943    |
| fps                | 895      |
| nupdates           | 450400   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2252000  |
| value_loss         | 5.85e-06 |
---------------------------------
---------------------------------
| explained_variance | 0.0768   |
| fps                | 895      |
| nupdates           | 450500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2252500  |
| value_loss         | 5.96e-05 |
---------------------------------
---------------------------------
| explained_variance | -0.173   |
| fps                | 895      |
| nupdates           | 450600   |
| policy_entropy     | 1.95     |
| total_timest

---------------------------------
| explained_variance | 0.298    |
| fps                | 895      |
| nupdates           | 453400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2267000  |
| value_loss         | 1.87e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.855    |
| fps                | 895      |
| nupdates           | 453500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2267500  |
| value_loss         | 1.76e-05 |
---------------------------------
---------------------------------
| explained_variance | -1.14    |
| fps                | 895      |
| nupdates           | 453600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2268000  |
| value_loss         | 0.000435 |
---------------------------------
---------------------------------
| explained_variance | 0.678    |
| fps                | 895      |
| nupdates           | 453700   |
| policy_entropy     | 2.08     |
| total_timest

---------------------------------
| explained_variance | 0.807    |
| fps                | 894      |
| nupdates           | 456400   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2282000  |
| value_loss         | 0.000116 |
---------------------------------
---------------------------------
| explained_variance | -1       |
| fps                | 894      |
| nupdates           | 456500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2282500  |
| value_loss         | 0.000586 |
---------------------------------
---------------------------------
| explained_variance | -0.157   |
| fps                | 894      |
| nupdates           | 456600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2283000  |
| value_loss         | 0.000199 |
---------------------------------
---------------------------------
| explained_variance | -30.7    |
| fps                | 894      |
| nupdates           | 456700   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.569    |
| fps                | 894      |
| nupdates           | 459500   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2297500  |
| value_loss         | 6.43e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.898    |
| fps                | 894      |
| nupdates           | 459600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2298000  |
| value_loss         | 8.46e-05 |
---------------------------------
---------------------------------
| explained_variance | 0.343    |
| fps                | 894      |
| nupdates           | 459700   |
| policy_entropy     | 2.08     |
| total_timesteps    | 2298500  |
| value_loss         | 0.000168 |
---------------------------------
---------------------------------
| explained_variance | 0.269    |
| fps                | 894      |
| nupdates           | 459800   |
| policy_entropy     | 2.07     |
| total_timest

---------------------------------
| explained_variance | 0.862    |
| fps                | 893      |
| nupdates           | 462500   |
| policy_entropy     | 2        |
| total_timesteps    | 2312500  |
| value_loss         | 3.89e-05 |
---------------------------------
---------------------------------
| explained_variance | -28.4    |
| fps                | 893      |
| nupdates           | 462600   |
| policy_entropy     | 2        |
| total_timesteps    | 2313000  |
| value_loss         | 0.00129  |
---------------------------------
---------------------------------
| explained_variance | -10.9    |
| fps                | 893      |
| nupdates           | 462700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2313500  |
| value_loss         | 0.0033   |
---------------------------------
---------------------------------
| explained_variance | 0.615    |
| fps                | 893      |
| nupdates           | 462800   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | -0.267   |
| fps                | 892      |
| nupdates           | 465500   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2327500  |
| value_loss         | 0.00012  |
---------------------------------
---------------------------------
| explained_variance | -8.96    |
| fps                | 892      |
| nupdates           | 465600   |
| policy_entropy     | 1.92     |
| total_timesteps    | 2328000  |
| value_loss         | 0.00762  |
---------------------------------
---------------------------------
| explained_variance | -7.64    |
| fps                | 892      |
| nupdates           | 465700   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2328500  |
| value_loss         | 0.0042   |
---------------------------------
---------------------------------
| explained_variance | -0.28    |
| fps                | 892      |
| nupdates           | 465800   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -0.0165  |
| fps                | 892      |
| nupdates           | 468600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2343000  |
| value_loss         | 0.000153 |
---------------------------------
---------------------------------
| explained_variance | -2.3     |
| fps                | 892      |
| nupdates           | 468700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2343500  |
| value_loss         | 0.000141 |
---------------------------------
---------------------------------
| explained_variance | 0.866    |
| fps                | 892      |
| nupdates           | 468800   |
| policy_entropy     | 2.04     |
| total_timesteps    | 2344000  |
| value_loss         | 2.8e-05  |
---------------------------------
---------------------------------
| explained_variance | -3.19    |
| fps                | 892      |
| nupdates           | 468900   |
| policy_entropy     | 2.06     |
| total_timest

---------------------------------
| explained_variance | 0.926    |
| fps                | 890      |
| nupdates           | 471600   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2358000  |
| value_loss         | 6.07e-05 |
---------------------------------
---------------------------------
| explained_variance | -15.5    |
| fps                | 890      |
| nupdates           | 471700   |
| policy_entropy     | 2.02     |
| total_timesteps    | 2358500  |
| value_loss         | 0.00489  |
---------------------------------
---------------------------------
| explained_variance | -0.137   |
| fps                | 890      |
| nupdates           | 471800   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2359000  |
| value_loss         | 0.000327 |
---------------------------------
---------------------------------
| explained_variance | -0.122   |
| fps                | 890      |
| nupdates           | 471900   |
| policy_entropy     | 2.05     |
| total_timest

---------------------------------
| explained_variance | -7.58    |
| fps                | 890      |
| nupdates           | 474700   |
| policy_entropy     | 2.06     |
| total_timesteps    | 2373500  |
| value_loss         | 0.00191  |
---------------------------------
---------------------------------
| explained_variance | -3.63    |
| fps                | 890      |
| nupdates           | 474800   |
| policy_entropy     | 2.03     |
| total_timesteps    | 2374000  |
| value_loss         | 0.00484  |
---------------------------------
---------------------------------
| explained_variance | -2.19    |
| fps                | 890      |
| nupdates           | 474900   |
| policy_entropy     | 2.07     |
| total_timesteps    | 2374500  |
| value_loss         | 0.000453 |
---------------------------------
Eval num_timesteps=2375000, episode_reward=-4.80 +/- 0.40
Episode length: 660.70 +/- 151.90
---------------------------------
| explained_variance | -2.83    |
| fps                | 8

In [None]:
# Record five episodes of the A2C agent on SlimeVolley-v0 and embed the video.
# NOTE(review): assumes an earlier cell has stored a model under
# trained_model['a2c'] — confirm before running on a fresh kernel.
video_filename = 'a2c.mp4'
record_env = gym.make("SlimeVolley-v0")
try:
    record_game(
        model=trained_model['a2c'],
        env=record_env,
        num_episodes=5,
        video_filename=video_filename
    )
finally:
    # Close the environment even if recording fails, so it is not left
    # open in the kernel after this cell finishes.
    record_env.close()
# Keep this as the last expression so the notebook displays the video.
embed_mp4(video_filename)

In [None]:
# Run the experiment helper for the 'acer' entry of the `algo` table (ACER).
# NOTE(review): `experiment` is defined in an earlier cell; presumably it trains
# the model and stores it in trained_model['acer'] — confirm against its definition.
experiment('acer')