# Environment Check

In [None]:
import gymnasium as gym
from twsbr_env.envs import TwsbrEnv
from stable_baselines3 import SAC
from stable_baselines3.common.env_util import make_vec_env
from stable_baselines3.common.vec_env import DummyVecEnv
from stable_baselines3.common.callbacks import CheckpointCallback

# ================================
# Training with a vectorized environment
# ================================

# Number of parallel environment copies. Kept in one place because the
# checkpoint frequency below has to be scaled by it.
N_ENVS = 8

# Full set of SAC hyperparameters.
# NOTE(review): this dict is currently NOT passed to SAC (the `**sac_params`
# argument below is commented out), so the run uses the library defaults --
# the training log reports learning_rate 0.0003, not the 5e-4 set here.
# Re-enable the argument deliberately; batch_size in particular is very large.
sac_params = {
    "learning_rate": 5e-4,      # Optimizer learning rate
    "buffer_size": 1000000,     # Replay buffer capacity
    "batch_size": 40960,        # Minibatch size for each gradient update
    "tau": 0.005,               # Soft-update coefficient for the target network
    "gamma": 0.99,              # Discount factor
    "ent_coef": "auto",         # Automatic entropy coefficient tuning
    "policy_kwargs": dict(net_arch=[672, 128]),  # Network architecture
    "use_sde": True,            # Use State-Dependent Exploration (SDE)
    "sde_sample_freq": 32,      # Resample the SDE noise every 32 steps
}

# Callback that saves the model periodically (every 10,000 timesteps).
# save_freq is counted in calls to the vectorized env's step(), and each call
# advances N_ENVS timesteps, so the target is divided by N_ENVS.
checkpoint_callback = CheckpointCallback(
    save_freq=max(10_000 // N_ENVS, 1),
    save_path="./sac_twsbr/",
    name_prefix="sac_twsbr",
)

# Create the vectorized TwsbrEnv-v0 environment (N_ENVS parallel copies).
env_train = make_vec_env("TwsbrEnv-v0", n_envs=N_ENVS, vec_env_cls=DummyVecEnv)

try:
    # Create the SAC model with TensorBoard logging.
    model = SAC(
        "MlpPolicy",
        env_train,
        device="cuda",  # Use the GPU if available
        verbose=1,
        tensorboard_log="./sac_twsbr_tensorboard/",
        # **sac_params,
    )

    # Train the model for 2,000,000 timesteps with a progress bar.
    model.learn(
        total_timesteps=2000000,
        progress_bar=True,
        callback=checkpoint_callback,
    )

    # Save the final model.
    model.save("sac_twsbr_final")
    print("Model telah disimpan sebagai sac_twsbr_final.zip")
finally:
    # Always close the training environment, even if training fails or is
    # interrupted from the notebook.
    env_train.close()

# ================================
# Evaluasi Model dalam Mode Human
# ================================



Using cuda device
Logging to ./sac_twsbr_tensorboard/SAC_5


Output()

---------------------------------
| rollout/           |          |
|    ep_len_mean     | 4.75     |
|    ep_rew_mean     | 530      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 4        |
|    fps             | 2        |
|    time_elapsed    | 13       |
|    total_timesteps | 40       |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 8.62     |
|    ep_rew_mean     | 561      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 8        |
|    fps             | 7        |
|    time_elapsed    | 20       |
|    total_timesteps | 152      |
| train/             |          |
|    actor_loss      | -1.51    |
|    critic_loss     | 1.48e+04 |
|    ent_coef        | 0.999    |
|    ent_coef_loss   | -0.00503 |
|    learning_rate   | 0.0003   |
|    n_updates       | 6        |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 12.3     |
|    ep_rew_mean     | 589      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 12       |
|    fps             | 7        |
|    time_elapsed    | 25       |
|    total_timesteps | 200      |
| train/             |          |
|    actor_loss      | -1.67    |
|    critic_loss     | 1.38e+04 |
|    ent_coef        | 0.997    |
|    ent_coef_loss   | -0.011   |
|    learning_rate   | 0.0003   |
|    n_updates       | 12       |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 12.2     |
|    ep_rew_mean     | 584      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 16       |
|    fps             | 7        |
|    time_elapsed    | 31       |
|    total_timesteps | 240      |
| train/             |          |
|    actor_loss      | -1.87    |
|    critic_loss     | 1.27e+04 |
|    ent_coef        | 0.995    |
|    ent_coef_loss   | -0.0162  |
|    learning_rate   | 0.0003   |
|    n_updates       | 17       |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 12.1     |
|    ep_rew_mean     | 583      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 20       |
|    fps             | 8        |
|    time_elapsed    | 36       |
|    total_timesteps | 304      |
| train/             |          |
|    actor_loss      | -2.2     |
|    critic_loss     | 1.65e+04 |
|    ent_coef        | 0.993    |
|    ent_coef_loss   | -0.0245  |
|    learning_rate   | 0.0003   |
|    n_updates       | 25       |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 12.3     |
|    ep_rew_mean     | 584      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 24       |
|    fps             | 8        |
|    time_elapsed    | 42       |
|    total_timesteps | 344      |
| train/             |          |
|    actor_loss      | -2.41    |
|    critic_loss     | 2.24e+04 |
|    ent_coef        | 0.991    |
|    ent_coef_loss   | -0.0293  |
|    learning_rate   | 0.0003   |
|    n_updates       | 30       |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 12.1     |
|    ep_rew_mean     | 584      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 28       |
|    fps             | 7        |
|    time_elapsed    | 47       |
|    total_timesteps | 376      |
| train/             |          |
|    actor_loss      | -2.64    |
|    critic_loss     | 2.04e+04 |
|    ent_coef        | 0.99     |
|    ent_coef_loss   | -0.0333  |
|    learning_rate   | 0.0003   |
|    n_updates       | 34       |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 11.7     |
|    ep_rew_mean     | 581      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 32       |
|    fps             | 8        |
|    time_elapsed    | 52       |
|    total_timesteps | 424      |
| train/             |          |
|    actor_loss      | -3.03    |
|    critic_loss     | 1.27e+04 |
|    ent_coef        | 0.988    |
|    ent_coef_loss   | -0.0394  |
|    learning_rate   | 0.0003   |
|    n_updates       | 40       |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 11.9     |
|    ep_rew_mean     | 581      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 36       |
|    fps             | 8        |
|    time_elapsed    | 57       |
|    total_timesteps | 472      |
| train/             |          |
|    actor_loss      | -3.49    |
|    critic_loss     | 1.54e+04 |
|    ent_coef        | 0.987    |
|    ent_coef_loss   | -0.0454  |
|    learning_rate   | 0.0003   |
|    n_updates       | 46       |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 11.6     |
|    ep_rew_mean     | 578      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 40       |
|    fps             | 8        |
|    time_elapsed    | 64       |
|    total_timesteps | 528      |
| train/             |          |
|    actor_loss      | -4.13    |
|    critic_loss     | 1.92e+04 |
|    ent_coef        | 0.985    |
|    ent_coef_loss   | -0.0526  |
|    learning_rate   | 0.0003   |
|    n_updates       | 53       |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 11.6     |
|    ep_rew_mean     | 578      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 44       |
|    fps             | 8        |
|    time_elapsed    | 68       |
|    total_timesteps | 568      |
| train/             |          |
|    actor_loss      | -4.63    |
|    critic_loss     | 1.55e+04 |
|    ent_coef        | 0.983    |
|    ent_coef_loss   | -0.0575  |
|    learning_rate   | 0.0003   |
|    n_updates       | 58       |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 11.3     |
|    ep_rew_mean     | 576      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 48       |
|    fps             | 8        |
|    time_elapsed    | 75       |
|    total_timesteps | 648      |
| train/             |          |
|    actor_loss      | -5.87    |
|    critic_loss     | 1.71e+04 |
|    ent_coef        | 0.98     |
|    ent_coef_loss   | -0.0682  |
|    learning_rate   | 0.0003   |
|    n_updates       | 68       |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 11.6     |
|    ep_rew_mean     | 579      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 52       |
|    fps             | 8        |
|    time_elapsed    | 79       |
|    total_timesteps | 672      |
| train/             |          |
|    actor_loss      | -6.19    |
|    critic_loss     | 1.82e+04 |
|    ent_coef        | 0.979    |
|    ent_coef_loss   | -0.069   |
|    learning_rate   | 0.0003   |
|    n_updates       | 71       |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 12.2     |
|    ep_rew_mean     | 582      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 56       |
|    fps             | 8        |
|    time_elapsed    | 84       |
|    total_timesteps | 712      |
| train/             |          |
|    actor_loss      | -7.03    |
|    critic_loss     | 1.05e+04 |
|    ent_coef        | 0.978    |
|    ent_coef_loss   | -0.0743  |
|    learning_rate   | 0.0003   |
|    n_updates       | 76       |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 11.9     |
|    ep_rew_mean     | 580      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 60       |
|    fps             | 8        |
|    time_elapsed    | 90       |
|    total_timesteps | 760      |
| train/             |          |
|    actor_loss      | -8.08    |
|    critic_loss     | 2.36e+04 |
|    ent_coef        | 0.976    |
|    ent_coef_loss   | -0.0804  |
|    learning_rate   | 0.0003   |
|    n_updates       | 82       |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 11.7     |
|    ep_rew_mean     | 579      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 64       |
|    fps             | 8        |
|    time_elapsed    | 95       |
|    total_timesteps | 800      |
| train/             |          |
|    actor_loss      | -8.91    |
|    critic_loss     | 2.75e+04 |
|    ent_coef        | 0.975    |
|    ent_coef_loss   | -0.0845  |
|    learning_rate   | 0.0003   |
|    n_updates       | 87       |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 11.7     |
|    ep_rew_mean     | 579      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 68       |
|    fps             | 8        |
|    time_elapsed    | 101      |
|    total_timesteps | 832      |
| train/             |          |
|    actor_loss      | -9.93    |
|    critic_loss     | 1.5e+04  |
|    ent_coef        | 0.973    |
|    ent_coef_loss   | -0.0871  |
|    learning_rate   | 0.0003   |
|    n_updates       | 91       |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 11.6     |
|    ep_rew_mean     | 579      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 72       |
|    fps             | 8        |
|    time_elapsed    | 105      |
|    total_timesteps | 864      |
| train/             |          |
|    actor_loss      | -11      |
|    critic_loss     | 1.4e+04  |
|    ent_coef        | 0.972    |
|    ent_coef_loss   | -0.0914  |
|    learning_rate   | 0.0003   |
|    n_updates       | 95       |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 11.4     |
|    ep_rew_mean     | 578      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 76       |
|    fps             | 8        |
|    time_elapsed    | 110      |
|    total_timesteps | 896      |
| train/             |          |
|    actor_loss      | -11.9    |
|    critic_loss     | 1.68e+04 |
|    ent_coef        | 0.971    |
|    ent_coef_loss   | -0.0909  |
|    learning_rate   | 0.0003   |
|    n_updates       | 99       |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 11.3     |
|    ep_rew_mean     | 578      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 80       |
|    fps             | 8        |
|    time_elapsed    | 115      |
|    total_timesteps | 944      |
| train/             |          |
|    actor_loss      | -13.7    |
|    critic_loss     | 1.57e+04 |
|    ent_coef        | 0.969    |
|    ent_coef_loss   | -0.0925  |
|    learning_rate   | 0.0003   |
|    n_updates       | 105      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 11.2     |
|    ep_rew_mean     | 577      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 84       |
|    fps             | 8        |
|    time_elapsed    | 122      |
|    total_timesteps | 1000     |
| train/             |          |
|    actor_loss      | -16.5    |
|    critic_loss     | 1.82e+04 |
|    ent_coef        | 0.968    |
|    ent_coef_loss   | -0.0936  |
|    learning_rate   | 0.0003   |
|    n_updates       | 112      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 11.1     |
|    ep_rew_mean     | 577      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 88       |
|    fps             | 8        |
|    time_elapsed    | 125      |
|    total_timesteps | 1016     |
| train/             |          |
|    actor_loss      | -17      |
|    critic_loss     | 2.38e+04 |
|    ent_coef        | 0.967    |
|    ent_coef_loss   | -0.0919  |
|    learning_rate   | 0.0003   |
|    n_updates       | 114      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 11       |
|    ep_rew_mean     | 576      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 92       |
|    fps             | 7        |
|    time_elapsed    | 133      |
|    total_timesteps | 1040     |
| train/             |          |
|    actor_loss      | -17.9    |
|    critic_loss     | 2.71e+04 |
|    ent_coef        | 0.966    |
|    ent_coef_loss   | -0.0884  |
|    learning_rate   | 0.0003   |
|    n_updates       | 117      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 10.8     |
|    ep_rew_mean     | 574      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 96       |
|    fps             | 7        |
|    time_elapsed    | 139      |
|    total_timesteps | 1048     |
| train/             |          |
|    actor_loss      | -18.7    |
|    critic_loss     | 2.07e+04 |
|    ent_coef        | 0.966    |
|    ent_coef_loss   | -0.0867  |
|    learning_rate   | 0.0003   |
|    n_updates       | 118      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 10.5     |
|    ep_rew_mean     | 572      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 100      |
|    fps             | 7        |
|    time_elapsed    | 147      |
|    total_timesteps | 1072     |
| train/             |          |
|    actor_loss      | -19.5    |
|    critic_loss     | 1.62e+04 |
|    ent_coef        | 0.965    |
|    ent_coef_loss   | -0.0874  |
|    learning_rate   | 0.0003   |
|    n_updates       | 121      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 10.5     |
|    ep_rew_mean     | 571      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 104      |
|    fps             | 7        |
|    time_elapsed    | 154      |
|    total_timesteps | 1088     |
| train/             |          |
|    actor_loss      | -21.6    |
|    critic_loss     | 3.02e+04 |
|    ent_coef        | 0.965    |
|    ent_coef_loss   | -0.0783  |
|    learning_rate   | 0.0003   |
|    n_updates       | 123      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 10.2     |
|    ep_rew_mean     | 569      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 108      |
|    fps             | 6        |
|    time_elapsed    | 158      |
|    total_timesteps | 1104     |
| train/             |          |
|    actor_loss      | -22      |
|    critic_loss     | 2.29e+04 |
|    ent_coef        | 0.964    |
|    ent_coef_loss   | -0.0759  |
|    learning_rate   | 0.0003   |
|    n_updates       | 125      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 9.32     |
|    ep_rew_mean     | 563      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 112      |
|    fps             | 6        |
|    time_elapsed    | 167      |
|    total_timesteps | 1136     |
| train/             |          |
|    actor_loss      | -24.8    |
|    critic_loss     | 2.47e+04 |
|    ent_coef        | 0.963    |
|    ent_coef_loss   | -0.065   |
|    learning_rate   | 0.0003   |
|    n_updates       | 129      |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 9.32     |
|    ep_rew_mean     | 563      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 116      |
|    fps             | 6        |
|    time_elapsed    | 167      |
|    total_timesteps | 1136     |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 9.02     |
|    ep_rew_mean     | 561      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 120      |
|    fps             | 6        |
|    time_elapsed    | 172      |
|    total_timesteps | 1160     |
| train/             |          |
|    actor_loss      | -26.1    |
|    critic_loss     | 2.34e+04 |
|    ent_coef        | 0.963    |
|    ent_coef_loss   | -0.054   |
|    learning_rate   | 0.0003   |
|    n_updates       | 132      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 8.54     |
|    ep_rew_mean     | 557      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 124      |
|    fps             | 6        |
|    time_elapsed    | 178      |
|    total_timesteps | 1176     |
| train/             |          |
|    actor_loss      | -29      |
|    critic_loss     | 2.49e+04 |
|    ent_coef        | 0.962    |
|    ent_coef_loss   | -0.045   |
|    learning_rate   | 0.0003   |
|    n_updates       | 134      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 8.4      |
|    ep_rew_mean     | 556      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 128      |
|    fps             | 6        |
|    time_elapsed    | 182      |
|    total_timesteps | 1192     |
| train/             |          |
|    actor_loss      | -29.3    |
|    critic_loss     | 1.3e+04  |
|    ent_coef        | 0.962    |
|    ent_coef_loss   | -0.0476  |
|    learning_rate   | 0.0003   |
|    n_updates       | 136      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 8.06     |
|    ep_rew_mean     | 554      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 132      |
|    fps             | 6        |
|    time_elapsed    | 187      |
|    total_timesteps | 1208     |
| train/             |          |
|    actor_loss      | -31.4    |
|    critic_loss     | 2.48e+04 |
|    ent_coef        | 0.962    |
|    ent_coef_loss   | -0.0384  |
|    learning_rate   | 0.0003   |
|    n_updates       | 138      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 7.74     |
|    ep_rew_mean     | 552      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 136      |
|    fps             | 6        |
|    time_elapsed    | 192      |
|    total_timesteps | 1224     |
| train/             |          |
|    actor_loss      | -33.5    |
|    critic_loss     | 2.88e+04 |
|    ent_coef        | 0.961    |
|    ent_coef_loss   | -0.0229  |
|    learning_rate   | 0.0003   |
|    n_updates       | 140      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 7.59     |
|    ep_rew_mean     | 551      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 140      |
|    fps             | 6        |
|    time_elapsed    | 195      |
|    total_timesteps | 1232     |
| train/             |          |
|    actor_loss      | -33.7    |
|    critic_loss     | 2.64e+04 |
|    ent_coef        | 0.961    |
|    ent_coef_loss   | -0.0297  |
|    learning_rate   | 0.0003   |
|    n_updates       | 141      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 7.15     |
|    ep_rew_mean     | 547      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 144      |
|    fps             | 6        |
|    time_elapsed    | 203      |
|    total_timesteps | 1256     |
| train/             |          |
|    actor_loss      | -36.3    |
|    critic_loss     | 2.46e+04 |
|    ent_coef        | 0.961    |
|    ent_coef_loss   | -0.0139  |
|    learning_rate   | 0.0003   |
|    n_updates       | 144      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 7.14     |
|    ep_rew_mean     | 547      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 148      |
|    fps             | 6        |
|    time_elapsed    | 205      |
|    total_timesteps | 1264     |
| train/             |          |
|    actor_loss      | -37.1    |
|    critic_loss     | 2.53e+04 |
|    ent_coef        | 0.961    |
|    ent_coef_loss   | -0.00914 |
|    learning_rate   | 0.0003   |
|    n_updates       | 145      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 6.29     |
|    ep_rew_mean     | 541      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 152      |
|    fps             | 6        |
|    time_elapsed    | 213      |
|    total_timesteps | 1280     |
| train/             |          |
|    actor_loss      | -38.6    |
|    critic_loss     | 1.68e+04 |
|    ent_coef        | 0.961    |
|    ent_coef_loss   | -0.00773 |
|    learning_rate   | 0.0003   |
|    n_updates       | 147      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 5.95     |
|    ep_rew_mean     | 538      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 156      |
|    fps             | 6        |
|    time_elapsed    | 214      |
|    total_timesteps | 1288     |
| train/             |          |
|    actor_loss      | -40      |
|    critic_loss     | 1.89e+04 |
|    ent_coef        | 0.961    |
|    ent_coef_loss   | -0.00675 |
|    learning_rate   | 0.0003   |
|    n_updates       | 148      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 5.56     |
|    ep_rew_mean     | 535      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 160      |
|    fps             | 5        |
|    time_elapsed    | 222      |
|    total_timesteps | 1304     |
| train/             |          |
|    actor_loss      | -42.3    |
|    critic_loss     | 2.66e+04 |
|    ent_coef        | 0.96     |
|    ent_coef_loss   | 0.00164  |
|    learning_rate   | 0.0003   |
|    n_updates       | 150      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 5.52     |
|    ep_rew_mean     | 535      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 164      |
|    fps             | 5        |
|    time_elapsed    | 223      |
|    total_timesteps | 1312     |
| train/             |          |
|    actor_loss      | -40.2    |
|    critic_loss     | 2.3e+04  |
|    ent_coef        | 0.96     |
|    ent_coef_loss   | 0.00451  |
|    learning_rate   | 0.0003   |
|    n_updates       | 151      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 5.14     |
|    ep_rew_mean     | 532      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 168      |
|    fps             | 5        |
|    time_elapsed    | 229      |
|    total_timesteps | 1328     |
| train/             |          |
|    actor_loss      | -44.2    |
|    critic_loss     | 2.36e+04 |
|    ent_coef        | 0.96     |
|    ent_coef_loss   | 0.00977  |
|    learning_rate   | 0.0003   |
|    n_updates       | 153      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 4.97     |
|    ep_rew_mean     | 530      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 172      |
|    fps             | 5        |
|    time_elapsed    | 233      |
|    total_timesteps | 1336     |
| train/             |          |
|    actor_loss      | -45.6    |
|    critic_loss     | 1.78e+04 |
|    ent_coef        | 0.96     |
|    ent_coef_loss   | 0.0108   |
|    learning_rate   | 0.0003   |
|    n_updates       | 154      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 4.66     |
|    ep_rew_mean     | 527      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 176      |
|    fps             | 5        |
|    time_elapsed    | 238      |
|    total_timesteps | 1352     |
| train/             |          |
|    actor_loss      | -48.1    |
|    critic_loss     | 2.6e+04  |
|    ent_coef        | 0.96     |
|    ent_coef_loss   | 0.00715  |
|    learning_rate   | 0.0003   |
|    n_updates       | 156      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 4.46     |
|    ep_rew_mean     | 525      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 180      |
|    fps             | 5        |
|    time_elapsed    | 242      |
|    total_timesteps | 1360     |
| train/             |          |
|    actor_loss      | -47.7    |
|    critic_loss     | 2.64e+04 |
|    ent_coef        | 0.96     |
|    ent_coef_loss   | 0.0193   |
|    learning_rate   | 0.0003   |
|    n_updates       | 157      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 4.24     |
|    ep_rew_mean     | 523      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 184      |
|    fps             | 5        |
|    time_elapsed    | 247      |
|    total_timesteps | 1376     |
| train/             |          |
|    actor_loss      | -50.9    |
|    critic_loss     | 2.29e+04 |
|    ent_coef        | 0.96     |
|    ent_coef_loss   | 0.0243   |
|    learning_rate   | 0.0003   |
|    n_updates       | 159      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.98     |
|    ep_rew_mean     | 521      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 188      |
|    fps             | 5        |
|    time_elapsed    | 251      |
|    total_timesteps | 1384     |
| train/             |          |
|    actor_loss      | -53.6    |
|    critic_loss     | 3.01e+04 |
|    ent_coef        | 0.96     |
|    ent_coef_loss   | 0.0293   |
|    learning_rate   | 0.0003   |
|    n_updates       | 160      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.73     |
|    ep_rew_mean     | 519      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 192      |
|    fps             | 5        |
|    time_elapsed    | 256      |
|    total_timesteps | 1400     |
| train/             |          |
|    actor_loss      | -56.2    |
|    critic_loss     | 2.26e+04 |
|    ent_coef        | 0.96     |
|    ent_coef_loss   | 0.0376   |
|    learning_rate   | 0.0003   |
|    n_updates       | 162      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.7      |
|    ep_rew_mean     | 519      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 196      |
|    fps             | 5        |
|    time_elapsed    | 261      |
|    total_timesteps | 1408     |
| train/             |          |
|    actor_loss      | -56.5    |
|    critic_loss     | 2.22e+04 |
|    ent_coef        | 0.96     |
|    ent_coef_loss   | 0.0327   |
|    learning_rate   | 0.0003   |
|    n_updates       | 163      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.66     |
|    ep_rew_mean     | 518      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 200      |
|    fps             | 5        |
|    time_elapsed    | 265      |
|    total_timesteps | 1424     |
| train/             |          |
|    actor_loss      | -61.2    |
|    critic_loss     | 2.02e+04 |
|    ent_coef        | 0.96     |
|    ent_coef_loss   | 0.0346   |
|    learning_rate   | 0.0003   |
|    n_updates       | 165      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.51     |
|    ep_rew_mean     | 517      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 204      |
|    fps             | 5        |
|    time_elapsed    | 270      |
|    total_timesteps | 1432     |
| train/             |          |
|    actor_loss      | -60.7    |
|    critic_loss     | 2.64e+04 |
|    ent_coef        | 0.96     |
|    ent_coef_loss   | 0.0393   |
|    learning_rate   | 0.0003   |
|    n_updates       | 166      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.47     |
|    ep_rew_mean     | 517      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 208      |
|    fps             | 5        |
|    time_elapsed    | 275      |
|    total_timesteps | 1448     |
| train/             |          |
|    actor_loss      | -65.7    |
|    critic_loss     | 2.41e+04 |
|    ent_coef        | 0.96     |
|    ent_coef_loss   | 0.0451   |
|    learning_rate   | 0.0003   |
|    n_updates       | 168      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.4      |
|    ep_rew_mean     | 516      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 212      |
|    fps             | 5        |
|    time_elapsed    | 279      |
|    total_timesteps | 1456     |
| train/             |          |
|    actor_loss      | -64.1    |
|    critic_loss     | 2.38e+04 |
|    ent_coef        | 0.96     |
|    ent_coef_loss   | 0.0443   |
|    learning_rate   | 0.0003   |
|    n_updates       | 169      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.34     |
|    ep_rew_mean     | 516      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 216      |
|    fps             | 5        |
|    time_elapsed    | 284      |
|    total_timesteps | 1472     |
| train/             |          |
|    actor_loss      | -68.7    |
|    critic_loss     | 2.72e+04 |
|    ent_coef        | 0.961    |
|    ent_coef_loss   | 0.0554   |
|    learning_rate   | 0.0003   |
|    n_updates       | 171      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.3      |
|    ep_rew_mean     | 515      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 220      |
|    fps             | 5        |
|    time_elapsed    | 289      |
|    total_timesteps | 1480     |
| train/             |          |
|    actor_loss      | -68.5    |
|    critic_loss     | 3.15e+04 |
|    ent_coef        | 0.961    |
|    ent_coef_loss   | 0.0548   |
|    learning_rate   | 0.0003   |
|    n_updates       | 172      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.25     |
|    ep_rew_mean     | 515      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 224      |
|    fps             | 5        |
|    time_elapsed    | 293      |
|    total_timesteps | 1496     |
| train/             |          |
|    actor_loss      | -70.3    |
|    critic_loss     | 2.17e+04 |
|    ent_coef        | 0.961    |
|    ent_coef_loss   | 0.053    |
|    learning_rate   | 0.0003   |
|    n_updates       | 174      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.2      |
|    ep_rew_mean     | 514      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 228      |
|    fps             | 5        |
|    time_elapsed    | 298      |
|    total_timesteps | 1504     |
| train/             |          |
|    actor_loss      | -72.8    |
|    critic_loss     | 2.34e+04 |
|    ent_coef        | 0.961    |
|    ent_coef_loss   | 0.0554   |
|    learning_rate   | 0.0003   |
|    n_updates       | 175      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.17     |
|    ep_rew_mean     | 513      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 232      |
|    fps             | 5        |
|    time_elapsed    | 303      |
|    total_timesteps | 1520     |
| train/             |          |
|    actor_loss      | -79.4    |
|    critic_loss     | 3.09e+04 |
|    ent_coef        | 0.961    |
|    ent_coef_loss   | 0.066    |
|    learning_rate   | 0.0003   |
|    n_updates       | 177      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.11     |
|    ep_rew_mean     | 513      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 236      |
|    fps             | 4        |
|    time_elapsed    | 307      |
|    total_timesteps | 1528     |
| train/             |          |
|    actor_loss      | -78.3    |
|    critic_loss     | 2.65e+04 |
|    ent_coef        | 0.961    |
|    ent_coef_loss   | 0.062    |
|    learning_rate   | 0.0003   |
|    n_updates       | 178      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.09     |
|    ep_rew_mean     | 513      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 240      |
|    fps             | 4        |
|    time_elapsed    | 312      |
|    total_timesteps | 1544     |
| train/             |          |
|    actor_loss      | -82.5    |
|    critic_loss     | 2.56e+04 |
|    ent_coef        | 0.961    |
|    ent_coef_loss   | 0.0665   |
|    learning_rate   | 0.0003   |
|    n_updates       | 180      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.08     |
|    ep_rew_mean     | 513      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 244      |
|    fps             | 4        |
|    time_elapsed    | 316      |
|    total_timesteps | 1552     |
| train/             |          |
|    actor_loss      | -87.2    |
|    critic_loss     | 2.26e+04 |
|    ent_coef        | 0.962    |
|    ent_coef_loss   | 0.0651   |
|    learning_rate   | 0.0003   |
|    n_updates       | 181      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.05     |
|    ep_rew_mean     | 512      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 248      |
|    fps             | 4        |
|    time_elapsed    | 321      |
|    total_timesteps | 1568     |
| train/             |          |
|    actor_loss      | -88.4    |
|    critic_loss     | 2.8e+04  |
|    ent_coef        | 0.962    |
|    ent_coef_loss   | 0.0763   |
|    learning_rate   | 0.0003   |
|    n_updates       | 183      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.04     |
|    ep_rew_mean     | 512      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 252      |
|    fps             | 4        |
|    time_elapsed    | 326      |
|    total_timesteps | 1576     |
| train/             |          |
|    actor_loss      | -93.3    |
|    critic_loss     | 3.21e+04 |
|    ent_coef        | 0.962    |
|    ent_coef_loss   | 0.0698   |
|    learning_rate   | 0.0003   |
|    n_updates       | 184      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.04     |
|    ep_rew_mean     | 512      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 256      |
|    fps             | 4        |
|    time_elapsed    | 331      |
|    total_timesteps | 1592     |
| train/             |          |
|    actor_loss      | -93      |
|    critic_loss     | 2.51e+04 |
|    ent_coef        | 0.962    |
|    ent_coef_loss   | 0.0764   |
|    learning_rate   | 0.0003   |
|    n_updates       | 186      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.04     |
|    ep_rew_mean     | 512      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 260      |
|    fps             | 4        |
|    time_elapsed    | 335      |
|    total_timesteps | 1600     |
| train/             |          |
|    actor_loss      | -94.3    |
|    critic_loss     | 2.51e+04 |
|    ent_coef        | 0.963    |
|    ent_coef_loss   | 0.078    |
|    learning_rate   | 0.0003   |
|    n_updates       | 187      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.03     |
|    ep_rew_mean     | 512      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 264      |
|    fps             | 4        |
|    time_elapsed    | 340      |
|    total_timesteps | 1616     |
| train/             |          |
|    actor_loss      | -97      |
|    critic_loss     | 1.97e+04 |
|    ent_coef        | 0.963    |
|    ent_coef_loss   | 0.0793   |
|    learning_rate   | 0.0003   |
|    n_updates       | 189      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.03     |
|    ep_rew_mean     | 512      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 268      |
|    fps             | 4        |
|    time_elapsed    | 344      |
|    total_timesteps | 1624     |
| train/             |          |
|    actor_loss      | -97.5    |
|    critic_loss     | 2.49e+04 |
|    ent_coef        | 0.963    |
|    ent_coef_loss   | 0.0679   |
|    learning_rate   | 0.0003   |
|    n_updates       | 190      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 512      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 272      |
|    fps             | 4        |
|    time_elapsed    | 349      |
|    total_timesteps | 1640     |
| train/             |          |
|    actor_loss      | -104     |
|    critic_loss     | 2.4e+04  |
|    ent_coef        | 0.963    |
|    ent_coef_loss   | 0.0799   |
|    learning_rate   | 0.0003   |
|    n_updates       | 192      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 512      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 276      |
|    fps             | 4        |
|    time_elapsed    | 354      |
|    total_timesteps | 1648     |
| train/             |          |
|    actor_loss      | -108     |
|    critic_loss     | 2.48e+04 |
|    ent_coef        | 0.964    |
|    ent_coef_loss   | 0.0736   |
|    learning_rate   | 0.0003   |
|    n_updates       | 193      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 280      |
|    fps             | 4        |
|    time_elapsed    | 359      |
|    total_timesteps | 1664     |
| train/             |          |
|    actor_loss      | -110     |
|    critic_loss     | 2.81e+04 |
|    ent_coef        | 0.964    |
|    ent_coef_loss   | 0.0884   |
|    learning_rate   | 0.0003   |
|    n_updates       | 195      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 284      |
|    fps             | 4        |
|    time_elapsed    | 363      |
|    total_timesteps | 1672     |
| train/             |          |
|    actor_loss      | -112     |
|    critic_loss     | 2.64e+04 |
|    ent_coef        | 0.964    |
|    ent_coef_loss   | 0.0811   |
|    learning_rate   | 0.0003   |
|    n_updates       | 196      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 288      |
|    fps             | 4        |
|    time_elapsed    | 368      |
|    total_timesteps | 1688     |
| train/             |          |
|    actor_loss      | -118     |
|    critic_loss     | 2.63e+04 |
|    ent_coef        | 0.965    |
|    ent_coef_loss   | 0.084    |
|    learning_rate   | 0.0003   |
|    n_updates       | 198      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 292      |
|    fps             | 4        |
|    time_elapsed    | 372      |
|    total_timesteps | 1696     |
| train/             |          |
|    actor_loss      | -121     |
|    critic_loss     | 2.72e+04 |
|    ent_coef        | 0.965    |
|    ent_coef_loss   | 0.0843   |
|    learning_rate   | 0.0003   |
|    n_updates       | 199      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 296      |
|    fps             | 4        |
|    time_elapsed    | 377      |
|    total_timesteps | 1712     |
| train/             |          |
|    actor_loss      | -123     |
|    critic_loss     | 2.52e+04 |
|    ent_coef        | 0.965    |
|    ent_coef_loss   | 0.0928   |
|    learning_rate   | 0.0003   |
|    n_updates       | 201      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 300      |
|    fps             | 4        |
|    time_elapsed    | 382      |
|    total_timesteps | 1720     |
| train/             |          |
|    actor_loss      | -124     |
|    critic_loss     | 2.61e+04 |
|    ent_coef        | 0.966    |
|    ent_coef_loss   | 0.0764   |
|    learning_rate   | 0.0003   |
|    n_updates       | 202      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 304      |
|    fps             | 4        |
|    time_elapsed    | 386      |
|    total_timesteps | 1736     |
| train/             |          |
|    actor_loss      | -124     |
|    critic_loss     | 2.19e+04 |
|    ent_coef        | 0.966    |
|    ent_coef_loss   | 0.0959   |
|    learning_rate   | 0.0003   |
|    n_updates       | 204      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 308      |
|    fps             | 4        |
|    time_elapsed    | 391      |
|    total_timesteps | 1744     |
| train/             |          |
|    actor_loss      | -127     |
|    critic_loss     | 2.11e+04 |
|    ent_coef        | 0.966    |
|    ent_coef_loss   | 0.0863   |
|    learning_rate   | 0.0003   |
|    n_updates       | 205      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 312      |
|    fps             | 4        |
|    time_elapsed    | 396      |
|    total_timesteps | 1760     |
| train/             |          |
|    actor_loss      | -125     |
|    critic_loss     | 1.77e+04 |
|    ent_coef        | 0.967    |
|    ent_coef_loss   | 0.0796   |
|    learning_rate   | 0.0003   |
|    n_updates       | 207      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 316      |
|    fps             | 4        |
|    time_elapsed    | 400      |
|    total_timesteps | 1768     |
| train/             |          |
|    actor_loss      | -124     |
|    critic_loss     | 2.27e+04 |
|    ent_coef        | 0.967    |
|    ent_coef_loss   | 0.0911   |
|    learning_rate   | 0.0003   |
|    n_updates       | 208      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 320      |
|    fps             | 4        |
|    time_elapsed    | 405      |
|    total_timesteps | 1784     |
| train/             |          |
|    actor_loss      | -127     |
|    critic_loss     | 1.72e+04 |
|    ent_coef        | 0.968    |
|    ent_coef_loss   | 0.0899   |
|    learning_rate   | 0.0003   |
|    n_updates       | 210      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 324      |
|    fps             | 4        |
|    time_elapsed    | 410      |
|    total_timesteps | 1792     |
| train/             |          |
|    actor_loss      | -133     |
|    critic_loss     | 2.31e+04 |
|    ent_coef        | 0.968    |
|    ent_coef_loss   | 0.09     |
|    learning_rate   | 0.0003   |
|    n_updates       | 211      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 328      |
|    fps             | 4        |
|    time_elapsed    | 414      |
|    total_timesteps | 1808     |
| train/             |          |
|    actor_loss      | -131     |
|    critic_loss     | 1.89e+04 |
|    ent_coef        | 0.968    |
|    ent_coef_loss   | 0.0868   |
|    learning_rate   | 0.0003   |
|    n_updates       | 213      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 332      |
|    fps             | 4        |
|    time_elapsed    | 419      |
|    total_timesteps | 1816     |
| train/             |          |
|    actor_loss      | -139     |
|    critic_loss     | 2.14e+04 |
|    ent_coef        | 0.969    |
|    ent_coef_loss   | 0.0803   |
|    learning_rate   | 0.0003   |
|    n_updates       | 214      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 336      |
|    fps             | 4        |
|    time_elapsed    | 428      |
|    total_timesteps | 1840     |
| train/             |          |
|    actor_loss      | -137     |
|    critic_loss     | 2.1e+04  |
|    ent_coef        | 0.969    |
|    ent_coef_loss   | 0.0732   |
|    learning_rate   | 0.0003   |
|    n_updates       | 217      |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 340      |
|    fps             | 4        |
|    time_elapsed    | 428      |
|    total_timesteps | 1840     |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 344      |
|    fps             | 4        |
|    time_elapsed    | 438      |
|    total_timesteps | 1864     |
| train/             |          |
|    actor_loss      | -135     |
|    critic_loss     | 2.39e+04 |
|    ent_coef        | 0.97     |
|    ent_coef_loss   | 0.0831   |
|    learning_rate   | 0.0003   |
|    n_updates       | 220      |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 348      |
|    fps             | 4        |
|    time_elapsed    | 438      |
|    total_timesteps | 1864     |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 352      |
|    fps             | 4        |
|    time_elapsed    | 447      |
|    total_timesteps | 1888     |
| train/             |          |
|    actor_loss      | -137     |
|    critic_loss     | 2.04e+04 |
|    ent_coef        | 0.971    |
|    ent_coef_loss   | 0.0768   |
|    learning_rate   | 0.0003   |
|    n_updates       | 223      |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 356      |
|    fps             | 4        |
|    time_elapsed    | 447      |
|    total_timesteps | 1888     |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 360      |
|    fps             | 4        |
|    time_elapsed    | 456      |
|    total_timesteps | 1912     |
| train/             |          |
|    actor_loss      | -131     |
|    critic_loss     | 2.39e+04 |
|    ent_coef        | 0.972    |
|    ent_coef_loss   | 0.0653   |
|    learning_rate   | 0.0003   |
|    n_updates       | 226      |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 364      |
|    fps             | 4        |
|    time_elapsed    | 456      |
|    total_timesteps | 1912     |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 368      |
|    fps             | 4        |
|    time_elapsed    | 465      |
|    total_timesteps | 1936     |
| train/             |          |
|    actor_loss      | -137     |
|    critic_loss     | 1.71e+04 |
|    ent_coef        | 0.973    |
|    ent_coef_loss   | 0.0677   |
|    learning_rate   | 0.0003   |
|    n_updates       | 229      |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 372      |
|    fps             | 4        |
|    time_elapsed    | 465      |
|    total_timesteps | 1936     |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 376      |
|    fps             | 4        |
|    time_elapsed    | 475      |
|    total_timesteps | 1960     |
| train/             |          |
|    actor_loss      | -142     |
|    critic_loss     | 2.06e+04 |
|    ent_coef        | 0.974    |
|    ent_coef_loss   | 0.0752   |
|    learning_rate   | 0.0003   |
|    n_updates       | 232      |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 380      |
|    fps             | 4        |
|    time_elapsed    | 475      |
|    total_timesteps | 1960     |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 384      |
|    fps             | 4        |
|    time_elapsed    | 484      |
|    total_timesteps | 1984     |
| train/             |          |
|    actor_loss      | -142     |
|    critic_loss     | 1.96e+04 |
|    ent_coef        | 0.975    |
|    ent_coef_loss   | 0.0652   |
|    learning_rate   | 0.0003   |
|    n_updates       | 235      |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 388      |
|    fps             | 4        |
|    time_elapsed    | 484      |
|    total_timesteps | 1984     |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 392      |
|    fps             | 4        |
|    time_elapsed    | 493      |
|    total_timesteps | 2008     |
| train/             |          |
|    actor_loss      | -138     |
|    critic_loss     | 1.78e+04 |
|    ent_coef        | 0.975    |
|    ent_coef_loss   | 0.0617   |
|    learning_rate   | 0.0003   |
|    n_updates       | 238      |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 396      |
|    fps             | 4        |
|    time_elapsed    | 493      |
|    total_timesteps | 2008     |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 400      |
|    fps             | 4        |
|    time_elapsed    | 502      |
|    total_timesteps | 2032     |
| train/             |          |
|    actor_loss      | -152     |
|    critic_loss     | 1.96e+04 |
|    ent_coef        | 0.976    |
|    ent_coef_loss   | 0.0625   |
|    learning_rate   | 0.0003   |
|    n_updates       | 241      |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 404      |
|    fps             | 4        |
|    time_elapsed    | 502      |
|    total_timesteps | 2032     |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 408      |
|    fps             | 4        |
|    time_elapsed    | 512      |
|    total_timesteps | 2056     |
| train/             |          |
|    actor_loss      | -151     |
|    critic_loss     | 1.9e+04  |
|    ent_coef        | 0.977    |
|    ent_coef_loss   | 0.0624   |
|    learning_rate   | 0.0003   |
|    n_updates       | 244      |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 412      |
|    fps             | 4        |
|    time_elapsed    | 512      |
|    total_timesteps | 2056     |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 416      |
|    fps             | 3        |
|    time_elapsed    | 521      |
|    total_timesteps | 2080     |
| train/             |          |
|    actor_loss      | -148     |
|    critic_loss     | 2.04e+04 |
|    ent_coef        | 0.978    |
|    ent_coef_loss   | 0.0598   |
|    learning_rate   | 0.0003   |
|    n_updates       | 247      |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 420      |
|    fps             | 3        |
|    time_elapsed    | 521      |
|    total_timesteps | 2080     |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 424      |
|    fps             | 3        |
|    time_elapsed    | 530      |
|    total_timesteps | 2104     |
| train/             |          |
|    actor_loss      | -152     |
|    critic_loss     | 1.93e+04 |
|    ent_coef        | 0.979    |
|    ent_coef_loss   | 0.0552   |
|    learning_rate   | 0.0003   |
|    n_updates       | 250      |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 428      |
|    fps             | 3        |
|    time_elapsed    | 530      |
|    total_timesteps | 2104     |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 432      |
|    fps             | 3        |
|    time_elapsed    | 540      |
|    total_timesteps | 2128     |
| train/             |          |
|    actor_loss      | -140     |
|    critic_loss     | 1.44e+04 |
|    ent_coef        | 0.98     |
|    ent_coef_loss   | 0.0522   |
|    learning_rate   | 0.0003   |
|    n_updates       | 253      |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 436      |
|    fps             | 3        |
|    time_elapsed    | 540      |
|    total_timesteps | 2128     |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 440      |
|    fps             | 3        |
|    time_elapsed    | 549      |
|    total_timesteps | 2152     |
| train/             |          |
|    actor_loss      | -161     |
|    critic_loss     | 1.91e+04 |
|    ent_coef        | 0.981    |
|    ent_coef_loss   | 0.0476   |
|    learning_rate   | 0.0003   |
|    n_updates       | 256      |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 444      |
|    fps             | 3        |
|    time_elapsed    | 549      |
|    total_timesteps | 2152     |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 448      |
|    fps             | 3        |
|    time_elapsed    | 559      |
|    total_timesteps | 2176     |
| train/             |          |
|    actor_loss      | -162     |
|    critic_loss     | 1.61e+04 |
|    ent_coef        | 0.981    |
|    ent_coef_loss   | 0.0507   |
|    learning_rate   | 0.0003   |
|    n_updates       | 259      |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 452      |
|    fps             | 3        |
|    time_elapsed    | 559      |
|    total_timesteps | 2176     |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 456      |
|    fps             | 3        |
|    time_elapsed    | 568      |
|    total_timesteps | 2200     |
| train/             |          |
|    actor_loss      | -155     |
|    critic_loss     | 1.58e+04 |
|    ent_coef        | 0.982    |
|    ent_coef_loss   | 0.0478   |
|    learning_rate   | 0.0003   |
|    n_updates       | 262      |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 460      |
|    fps             | 3        |
|    time_elapsed    | 568      |
|    total_timesteps | 2200     |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 464      |
|    fps             | 3        |
|    time_elapsed    | 578      |
|    total_timesteps | 2224     |
| train/             |          |
|    actor_loss      | -144     |
|    critic_loss     | 1.45e+04 |
|    ent_coef        | 0.983    |
|    ent_coef_loss   | 0.0437   |
|    learning_rate   | 0.0003   |
|    n_updates       | 265      |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 468      |
|    fps             | 3        |
|    time_elapsed    | 578      |
|    total_timesteps | 2224     |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 472      |
|    fps             | 3        |
|    time_elapsed    | 587      |
|    total_timesteps | 2248     |
| train/             |          |
|    actor_loss      | -149     |
|    critic_loss     | 2.26e+04 |
|    ent_coef        | 0.984    |
|    ent_coef_loss   | 0.0372   |
|    learning_rate   | 0.0003   |
|    n_updates       | 268      |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 476      |
|    fps             | 3        |
|    time_elapsed    | 587      |
|    total_timesteps | 2248     |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 480      |
|    fps             | 3        |
|    time_elapsed    | 597      |
|    total_timesteps | 2272     |
| train/             |          |
|    actor_loss      | -159     |
|    critic_loss     | 1.87e+04 |
|    ent_coef        | 0.985    |
|    ent_coef_loss   | 0.0332   |
|    learning_rate   | 0.0003   |
|    n_updates       | 271      |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 484      |
|    fps             | 3        |
|    time_elapsed    | 597      |
|    total_timesteps | 2272     |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 488      |
|    fps             | 3        |
|    time_elapsed    | 606      |
|    total_timesteps | 2296     |
| train/             |          |
|    actor_loss      | -162     |
|    critic_loss     | 1.48e+04 |
|    ent_coef        | 0.986    |
|    ent_coef_loss   | 0.0366   |
|    learning_rate   | 0.0003   |
|    n_updates       | 274      |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 492      |
|    fps             | 3        |
|    time_elapsed    | 606      |
|    total_timesteps | 2296     |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 496      |
|    fps             | 3        |
|    time_elapsed    | 616      |
|    total_timesteps | 2320     |
| train/             |          |
|    actor_loss      | -156     |
|    critic_loss     | 1.67e+04 |
|    ent_coef        | 0.987    |
|    ent_coef_loss   | 0.0364   |
|    learning_rate   | 0.0003   |
|    n_updates       | 277      |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 500      |
|    fps             | 3        |
|    time_elapsed    | 616      |
|    total_timesteps | 2320     |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 504      |
|    fps             | 3        |
|    time_elapsed    | 625      |
|    total_timesteps | 2344     |
| train/             |          |
|    actor_loss      | -148     |
|    critic_loss     | 1.49e+04 |
|    ent_coef        | 0.987    |
|    ent_coef_loss   | 0.0313   |
|    learning_rate   | 0.0003   |
|    n_updates       | 280      |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 508      |
|    fps             | 3        |
|    time_elapsed    | 625      |
|    total_timesteps | 2344     |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 512      |
|    fps             | 3        |
|    time_elapsed    | 635      |
|    total_timesteps | 2368     |
| train/             |          |
|    actor_loss      | -168     |
|    critic_loss     | 1.87e+04 |
|    ent_coef        | 0.988    |
|    ent_coef_loss   | 0.023    |
|    learning_rate   | 0.0003   |
|    n_updates       | 283      |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 516      |
|    fps             | 3        |
|    time_elapsed    | 635      |
|    total_timesteps | 2368     |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 520      |
|    fps             | 3        |
|    time_elapsed    | 644      |
|    total_timesteps | 2392     |
| train/             |          |
|    actor_loss      | -175     |
|    critic_loss     | 1.75e+04 |
|    ent_coef        | 0.989    |
|    ent_coef_loss   | 0.0268   |
|    learning_rate   | 0.0003   |
|    n_updates       | 286      |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 524      |
|    fps             | 3        |
|    time_elapsed    | 644      |
|    total_timesteps | 2392     |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 528      |
|    fps             | 3        |
|    time_elapsed    | 653      |
|    total_timesteps | 2416     |
| train/             |          |
|    actor_loss      | -183     |
|    critic_loss     | 1.61e+04 |
|    ent_coef        | 0.99     |
|    ent_coef_loss   | 0.0267   |
|    learning_rate   | 0.0003   |
|    n_updates       | 289      |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 532      |
|    fps             | 3        |
|    time_elapsed    | 654      |
|    total_timesteps | 2416     |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 536      |
|    fps             | 3        |
|    time_elapsed    | 663      |
|    total_timesteps | 2440     |
| train/             |          |
|    actor_loss      | -170     |
|    critic_loss     | 1.31e+04 |
|    ent_coef        | 0.991    |
|    ent_coef_loss   | 0.0245   |
|    learning_rate   | 0.0003   |
|    n_updates       | 292      |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 540      |
|    fps             | 3        |
|    time_elapsed    | 663      |
|    total_timesteps | 2440     |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 544      |
|    fps             | 3        |
|    time_elapsed    | 672      |
|    total_timesteps | 2464     |
| train/             |          |
|    actor_loss      | -168     |
|    critic_loss     | 1.44e+04 |
|    ent_coef        | 0.992    |
|    ent_coef_loss   | 0.0192   |
|    learning_rate   | 0.0003   |
|    n_updates       | 295      |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 548      |
|    fps             | 3        |
|    time_elapsed    | 672      |
|    total_timesteps | 2464     |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 552      |
|    fps             | 3        |
|    time_elapsed    | 682      |
|    total_timesteps | 2488     |
| train/             |          |
|    actor_loss      | -165     |
|    critic_loss     | 1.22e+04 |
|    ent_coef        | 0.992    |
|    ent_coef_loss   | 0.0181   |
|    learning_rate   | 0.0003   |
|    n_updates       | 298      |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 556      |
|    fps             | 3        |
|    time_elapsed    | 682      |
|    total_timesteps | 2488     |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 560      |
|    fps             | 3        |
|    time_elapsed    | 692      |
|    total_timesteps | 2512     |
| train/             |          |
|    actor_loss      | -174     |
|    critic_loss     | 1.27e+04 |
|    ent_coef        | 0.993    |
|    ent_coef_loss   | 0.0167   |
|    learning_rate   | 0.0003   |
|    n_updates       | 301      |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 564      |
|    fps             | 3        |
|    time_elapsed    | 692      |
|    total_timesteps | 2512     |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 568      |
|    fps             | 3        |
|    time_elapsed    | 702      |
|    total_timesteps | 2536     |
| train/             |          |
|    actor_loss      | -168     |
|    critic_loss     | 1.49e+04 |
|    ent_coef        | 0.994    |
|    ent_coef_loss   | 0.0147   |
|    learning_rate   | 0.0003   |
|    n_updates       | 304      |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 572      |
|    fps             | 3        |
|    time_elapsed    | 702      |
|    total_timesteps | 2536     |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 576      |
|    fps             | 3        |
|    time_elapsed    | 712      |
|    total_timesteps | 2560     |
| train/             |          |
|    actor_loss      | -165     |
|    critic_loss     | 1.24e+04 |
|    ent_coef        | 0.995    |
|    ent_coef_loss   | 0.0135   |
|    learning_rate   | 0.0003   |
|    n_updates       | 307      |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 580      |
|    fps             | 3        |
|    time_elapsed    | 712      |
|    total_timesteps | 2560     |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 584      |
|    fps             | 3        |
|    time_elapsed    | 723      |
|    total_timesteps | 2584     |
| train/             |          |
|    actor_loss      | -173     |
|    critic_loss     | 1.32e+04 |
|    ent_coef        | 0.996    |
|    ent_coef_loss   | 0.00986  |
|    learning_rate   | 0.0003   |
|    n_updates       | 310      |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 588      |
|    fps             | 3        |
|    time_elapsed    | 723      |
|    total_timesteps | 2584     |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 592      |
|    fps             | 3        |
|    time_elapsed    | 732      |
|    total_timesteps | 2608     |
| train/             |          |
|    actor_loss      | -172     |
|    critic_loss     | 1.13e+04 |
|    ent_coef        | 0.996    |
|    ent_coef_loss   | 0.0078   |
|    learning_rate   | 0.0003   |
|    n_updates       | 313      |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 596      |
|    fps             | 3        |
|    time_elapsed    | 732      |
|    total_timesteps | 2608     |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 600      |
|    fps             | 3        |
|    time_elapsed    | 742      |
|    total_timesteps | 2632     |
| train/             |          |
|    actor_loss      | -160     |
|    critic_loss     | 1.03e+04 |
|    ent_coef        | 0.997    |
|    ent_coef_loss   | 0.00656  |
|    learning_rate   | 0.0003   |
|    n_updates       | 316      |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 604      |
|    fps             | 3        |
|    time_elapsed    | 742      |
|    total_timesteps | 2632     |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 608      |
|    fps             | 3        |
|    time_elapsed    | 752      |
|    total_timesteps | 2656     |
| train/             |          |
|    actor_loss      | -187     |
|    critic_loss     | 1.23e+04 |
|    ent_coef        | 0.998    |
|    ent_coef_loss   | 0.00508  |
|    learning_rate   | 0.0003   |
|    n_updates       | 319      |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 612      |
|    fps             | 3        |
|    time_elapsed    | 752      |
|    total_timesteps | 2656     |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 616      |
|    fps             | 3        |
|    time_elapsed    | 762      |
|    total_timesteps | 2680     |
| train/             |          |
|    actor_loss      | -176     |
|    critic_loss     | 1.09e+04 |
|    ent_coef        | 0.999    |
|    ent_coef_loss   | 0.00242  |
|    learning_rate   | 0.0003   |
|    n_updates       | 322      |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 620      |
|    fps             | 3        |
|    time_elapsed    | 762      |
|    total_timesteps | 2680     |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 624      |
|    fps             | 3        |
|    time_elapsed    | 770      |
|    total_timesteps | 2704     |
| train/             |          |
|    actor_loss      | -183     |
|    critic_loss     | 1.22e+04 |
|    ent_coef        | 1        |
|    ent_coef_loss   | 0.000815 |
|    learning_rate   | 0.0003   |
|    n_updates       | 325      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 628      |
|    fps             | 3        |
|    time_elapsed    | 774      |
|    total_timesteps | 2712     |
| train/             |          |
|    actor_loss      | -174     |
|    critic_loss     | 1.18e+04 |
|    ent_coef        | 1        |
|    ent_coef_loss   | 0.000186 |
|    learning_rate   | 0.0003   |
|    n_updates       | 326      |
---------------------------------


----------------------------------
| rollout/           |           |
|    ep_len_mean     | 3.01      |
|    ep_rew_mean     | 511       |
|    success_rate    | 0         |
| time/              |           |
|    episodes        | 632       |
|    fps             | 3         |
|    time_elapsed    | 780       |
|    total_timesteps | 2728      |
| train/             |           |
|    actor_loss      | -173      |
|    critic_loss     | 9.62e+03  |
|    ent_coef        | 1         |
|    ent_coef_loss   | -0.000966 |
|    learning_rate   | 0.0003    |
|    n_updates       | 328       |
----------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 636      |
|    fps             | 3        |
|    time_elapsed    | 784      |
|    total_timesteps | 2736     |
| train/             |          |
|    actor_loss      | -183     |
|    critic_loss     | 9.42e+03 |
|    ent_coef        | 1        |
|    ent_coef_loss   | -0.00162 |
|    learning_rate   | 0.0003   |
|    n_updates       | 329      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 640      |
|    fps             | 3        |
|    time_elapsed    | 790      |
|    total_timesteps | 2752     |
| train/             |          |
|    actor_loss      | -179     |
|    critic_loss     | 1.4e+04  |
|    ent_coef        | 1        |
|    ent_coef_loss   | -0.00247 |
|    learning_rate   | 0.0003   |
|    n_updates       | 331      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 644      |
|    fps             | 3        |
|    time_elapsed    | 793      |
|    total_timesteps | 2760     |
| train/             |          |
|    actor_loss      | -174     |
|    critic_loss     | 8.15e+03 |
|    ent_coef        | 1        |
|    ent_coef_loss   | -0.00283 |
|    learning_rate   | 0.0003   |
|    n_updates       | 332      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 648      |
|    fps             | 3        |
|    time_elapsed    | 799      |
|    total_timesteps | 2776     |
| train/             |          |
|    actor_loss      | -164     |
|    critic_loss     | 1.49e+04 |
|    ent_coef        | 1        |
|    ent_coef_loss   | -0.0044  |
|    learning_rate   | 0.0003   |
|    n_updates       | 334      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 652      |
|    fps             | 3        |
|    time_elapsed    | 803      |
|    total_timesteps | 2784     |
| train/             |          |
|    actor_loss      | -176     |
|    critic_loss     | 1.36e+04 |
|    ent_coef        | 1        |
|    ent_coef_loss   | -0.00468 |
|    learning_rate   | 0.0003   |
|    n_updates       | 335      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 656      |
|    fps             | 3        |
|    time_elapsed    | 809      |
|    total_timesteps | 2800     |
| train/             |          |
|    actor_loss      | -183     |
|    critic_loss     | 1.01e+04 |
|    ent_coef        | 1        |
|    ent_coef_loss   | -0.00582 |
|    learning_rate   | 0.0003   |
|    n_updates       | 337      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 660      |
|    fps             | 3        |
|    time_elapsed    | 813      |
|    total_timesteps | 2808     |
| train/             |          |
|    actor_loss      | -164     |
|    critic_loss     | 7.74e+03 |
|    ent_coef        | 1        |
|    ent_coef_loss   | -0.0066  |
|    learning_rate   | 0.0003   |
|    n_updates       | 338      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 664      |
|    fps             | 3        |
|    time_elapsed    | 819      |
|    total_timesteps | 2824     |
| train/             |          |
|    actor_loss      | -177     |
|    critic_loss     | 1.04e+04 |
|    ent_coef        | 1        |
|    ent_coef_loss   | -0.00843 |
|    learning_rate   | 0.0003   |
|    n_updates       | 340      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 668      |
|    fps             | 3        |
|    time_elapsed    | 823      |
|    total_timesteps | 2832     |
| train/             |          |
|    actor_loss      | -178     |
|    critic_loss     | 1.01e+04 |
|    ent_coef        | 1        |
|    ent_coef_loss   | -0.00856 |
|    learning_rate   | 0.0003   |
|    n_updates       | 341      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 672      |
|    fps             | 3        |
|    time_elapsed    | 829      |
|    total_timesteps | 2848     |
| train/             |          |
|    actor_loss      | -159     |
|    critic_loss     | 7.7e+03  |
|    ent_coef        | 1        |
|    ent_coef_loss   | -0.00913 |
|    learning_rate   | 0.0003   |
|    n_updates       | 343      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 676      |
|    fps             | 3        |
|    time_elapsed    | 833      |
|    total_timesteps | 2856     |
| train/             |          |
|    actor_loss      | -179     |
|    critic_loss     | 8.8e+03  |
|    ent_coef        | 1        |
|    ent_coef_loss   | -0.0093  |
|    learning_rate   | 0.0003   |
|    n_updates       | 344      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 680      |
|    fps             | 3        |
|    time_elapsed    | 839      |
|    total_timesteps | 2872     |
| train/             |          |
|    actor_loss      | -169     |
|    critic_loss     | 8.18e+03 |
|    ent_coef        | 1.01     |
|    ent_coef_loss   | -0.00972 |
|    learning_rate   | 0.0003   |
|    n_updates       | 346      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 684      |
|    fps             | 3        |
|    time_elapsed    | 842      |
|    total_timesteps | 2880     |
| train/             |          |
|    actor_loss      | -189     |
|    critic_loss     | 9.51e+03 |
|    ent_coef        | 1.01     |
|    ent_coef_loss   | -0.0102  |
|    learning_rate   | 0.0003   |
|    n_updates       | 347      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 688      |
|    fps             | 3        |
|    time_elapsed    | 849      |
|    total_timesteps | 2896     |
| train/             |          |
|    actor_loss      | -163     |
|    critic_loss     | 8.39e+03 |
|    ent_coef        | 1.01     |
|    ent_coef_loss   | -0.0116  |
|    learning_rate   | 0.0003   |
|    n_updates       | 349      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 692      |
|    fps             | 3        |
|    time_elapsed    | 852      |
|    total_timesteps | 2904     |
| train/             |          |
|    actor_loss      | -188     |
|    critic_loss     | 7.11e+03 |
|    ent_coef        | 1.01     |
|    ent_coef_loss   | -0.0122  |
|    learning_rate   | 0.0003   |
|    n_updates       | 350      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 696      |
|    fps             | 3        |
|    time_elapsed    | 858      |
|    total_timesteps | 2920     |
| train/             |          |
|    actor_loss      | -179     |
|    critic_loss     | 9.41e+03 |
|    ent_coef        | 1.01     |
|    ent_coef_loss   | -0.0127  |
|    learning_rate   | 0.0003   |
|    n_updates       | 352      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 700      |
|    fps             | 3        |
|    time_elapsed    | 862      |
|    total_timesteps | 2928     |
| train/             |          |
|    actor_loss      | -166     |
|    critic_loss     | 7.99e+03 |
|    ent_coef        | 1.01     |
|    ent_coef_loss   | -0.0149  |
|    learning_rate   | 0.0003   |
|    n_updates       | 353      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 704      |
|    fps             | 3        |
|    time_elapsed    | 868      |
|    total_timesteps | 2944     |
| train/             |          |
|    actor_loss      | -190     |
|    critic_loss     | 1.06e+04 |
|    ent_coef        | 1.01     |
|    ent_coef_loss   | -0.016   |
|    learning_rate   | 0.0003   |
|    n_updates       | 355      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 708      |
|    fps             | 3        |
|    time_elapsed    | 872      |
|    total_timesteps | 2952     |
| train/             |          |
|    actor_loss      | -186     |
|    critic_loss     | 7.93e+03 |
|    ent_coef        | 1.01     |
|    ent_coef_loss   | -0.0167  |
|    learning_rate   | 0.0003   |
|    n_updates       | 356      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 712      |
|    fps             | 3        |
|    time_elapsed    | 878      |
|    total_timesteps | 2968     |
| train/             |          |
|    actor_loss      | -176     |
|    critic_loss     | 1.1e+04  |
|    ent_coef        | 1.01     |
|    ent_coef_loss   | -0.0157  |
|    learning_rate   | 0.0003   |
|    n_updates       | 358      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 716      |
|    fps             | 3        |
|    time_elapsed    | 882      |
|    total_timesteps | 2976     |
| train/             |          |
|    actor_loss      | -175     |
|    critic_loss     | 1.07e+04 |
|    ent_coef        | 1.01     |
|    ent_coef_loss   | -0.0163  |
|    learning_rate   | 0.0003   |
|    n_updates       | 359      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 720      |
|    fps             | 3        |
|    time_elapsed    | 888      |
|    total_timesteps | 2992     |
| train/             |          |
|    actor_loss      | -180     |
|    critic_loss     | 1.05e+04 |
|    ent_coef        | 1.01     |
|    ent_coef_loss   | -0.0166  |
|    learning_rate   | 0.0003   |
|    n_updates       | 361      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3.01     |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 724      |
|    fps             | 3        |
|    time_elapsed    | 891      |
|    total_timesteps | 3000     |
| train/             |          |
|    actor_loss      | -185     |
|    critic_loss     | 5.91e+03 |
|    ent_coef        | 1.01     |
|    ent_coef_loss   | -0.0189  |
|    learning_rate   | 0.0003   |
|    n_updates       | 362      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 728      |
|    fps             | 3        |
|    time_elapsed    | 897      |
|    total_timesteps | 3016     |
| train/             |          |
|    actor_loss      | -179     |
|    critic_loss     | 7.11e+03 |
|    ent_coef        | 1.01     |
|    ent_coef_loss   | -0.0168  |
|    learning_rate   | 0.0003   |
|    n_updates       | 364      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 732      |
|    fps             | 3        |
|    time_elapsed    | 901      |
|    total_timesteps | 3024     |
| train/             |          |
|    actor_loss      | -186     |
|    critic_loss     | 9.98e+03 |
|    ent_coef        | 1.01     |
|    ent_coef_loss   | -0.0173  |
|    learning_rate   | 0.0003   |
|    n_updates       | 365      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 736      |
|    fps             | 3        |
|    time_elapsed    | 907      |
|    total_timesteps | 3040     |
| train/             |          |
|    actor_loss      | -191     |
|    critic_loss     | 6.71e+03 |
|    ent_coef        | 1.01     |
|    ent_coef_loss   | -0.0217  |
|    learning_rate   | 0.0003   |
|    n_updates       | 367      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 740      |
|    fps             | 3        |
|    time_elapsed    | 911      |
|    total_timesteps | 3048     |
| train/             |          |
|    actor_loss      | -184     |
|    critic_loss     | 7.72e+03 |
|    ent_coef        | 1.01     |
|    ent_coef_loss   | -0.0212  |
|    learning_rate   | 0.0003   |
|    n_updates       | 368      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 744      |
|    fps             | 3        |
|    time_elapsed    | 918      |
|    total_timesteps | 3064     |
| train/             |          |
|    actor_loss      | -190     |
|    critic_loss     | 5.42e+03 |
|    ent_coef        | 1.01     |
|    ent_coef_loss   | -0.0252  |
|    learning_rate   | 0.0003   |
|    n_updates       | 370      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 748      |
|    fps             | 3        |
|    time_elapsed    | 921      |
|    total_timesteps | 3072     |
| train/             |          |
|    actor_loss      | -181     |
|    critic_loss     | 5.16e+03 |
|    ent_coef        | 1.01     |
|    ent_coef_loss   | -0.0237  |
|    learning_rate   | 0.0003   |
|    n_updates       | 371      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 752      |
|    fps             | 3        |
|    time_elapsed    | 928      |
|    total_timesteps | 3088     |
| train/             |          |
|    actor_loss      | -201     |
|    critic_loss     | 9.48e+03 |
|    ent_coef        | 1.01     |
|    ent_coef_loss   | -0.0243  |
|    learning_rate   | 0.0003   |
|    n_updates       | 373      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 756      |
|    fps             | 3        |
|    time_elapsed    | 931      |
|    total_timesteps | 3096     |
| train/             |          |
|    actor_loss      | -194     |
|    critic_loss     | 8.62e+03 |
|    ent_coef        | 1.01     |
|    ent_coef_loss   | -0.029   |
|    learning_rate   | 0.0003   |
|    n_updates       | 374      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 760      |
|    fps             | 3        |
|    time_elapsed    | 938      |
|    total_timesteps | 3112     |
| train/             |          |
|    actor_loss      | -201     |
|    critic_loss     | 6.83e+03 |
|    ent_coef        | 1.01     |
|    ent_coef_loss   | -0.0265  |
|    learning_rate   | 0.0003   |
|    n_updates       | 376      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 764      |
|    fps             | 3        |
|    time_elapsed    | 942      |
|    total_timesteps | 3120     |
| train/             |          |
|    actor_loss      | -187     |
|    critic_loss     | 7.73e+03 |
|    ent_coef        | 1.01     |
|    ent_coef_loss   | -0.0249  |
|    learning_rate   | 0.0003   |
|    n_updates       | 377      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 768      |
|    fps             | 3        |
|    time_elapsed    | 948      |
|    total_timesteps | 3136     |
| train/             |          |
|    actor_loss      | -187     |
|    critic_loss     | 8.16e+03 |
|    ent_coef        | 1.01     |
|    ent_coef_loss   | -0.0271  |
|    learning_rate   | 0.0003   |
|    n_updates       | 379      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 772      |
|    fps             | 3        |
|    time_elapsed    | 952      |
|    total_timesteps | 3144     |
| train/             |          |
|    actor_loss      | -208     |
|    critic_loss     | 8.6e+03  |
|    ent_coef        | 1.01     |
|    ent_coef_loss   | -0.0253  |
|    learning_rate   | 0.0003   |
|    n_updates       | 380      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 776      |
|    fps             | 3        |
|    time_elapsed    | 958      |
|    total_timesteps | 3160     |
| train/             |          |
|    actor_loss      | -198     |
|    critic_loss     | 7.29e+03 |
|    ent_coef        | 1.01     |
|    ent_coef_loss   | -0.0309  |
|    learning_rate   | 0.0003   |
|    n_updates       | 382      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 780      |
|    fps             | 3        |
|    time_elapsed    | 961      |
|    total_timesteps | 3168     |
| train/             |          |
|    actor_loss      | -202     |
|    critic_loss     | 7.43e+03 |
|    ent_coef        | 1.01     |
|    ent_coef_loss   | -0.0334  |
|    learning_rate   | 0.0003   |
|    n_updates       | 383      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 784      |
|    fps             | 3        |
|    time_elapsed    | 968      |
|    total_timesteps | 3184     |
| train/             |          |
|    actor_loss      | -186     |
|    critic_loss     | 7.27e+03 |
|    ent_coef        | 1.01     |
|    ent_coef_loss   | -0.0369  |
|    learning_rate   | 0.0003   |
|    n_updates       | 385      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 788      |
|    fps             | 3        |
|    time_elapsed    | 971      |
|    total_timesteps | 3192     |
| train/             |          |
|    actor_loss      | -201     |
|    critic_loss     | 7.35e+03 |
|    ent_coef        | 1.02     |
|    ent_coef_loss   | -0.0348  |
|    learning_rate   | 0.0003   |
|    n_updates       | 386      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 792      |
|    fps             | 3        |
|    time_elapsed    | 977      |
|    total_timesteps | 3208     |
| train/             |          |
|    actor_loss      | -200     |
|    critic_loss     | 8.01e+03 |
|    ent_coef        | 1.02     |
|    ent_coef_loss   | -0.0401  |
|    learning_rate   | 0.0003   |
|    n_updates       | 388      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 796      |
|    fps             | 3        |
|    time_elapsed    | 981      |
|    total_timesteps | 3216     |
| train/             |          |
|    actor_loss      | -198     |
|    critic_loss     | 4.08e+03 |
|    ent_coef        | 1.02     |
|    ent_coef_loss   | -0.0303  |
|    learning_rate   | 0.0003   |
|    n_updates       | 389      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 800      |
|    fps             | 3        |
|    time_elapsed    | 987      |
|    total_timesteps | 3232     |
| train/             |          |
|    actor_loss      | -205     |
|    critic_loss     | 6.92e+03 |
|    ent_coef        | 1.02     |
|    ent_coef_loss   | -0.0419  |
|    learning_rate   | 0.0003   |
|    n_updates       | 391      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 804      |
|    fps             | 3        |
|    time_elapsed    | 990      |
|    total_timesteps | 3240     |
| train/             |          |
|    actor_loss      | -207     |
|    critic_loss     | 5.86e+03 |
|    ent_coef        | 1.02     |
|    ent_coef_loss   | -0.034   |
|    learning_rate   | 0.0003   |
|    n_updates       | 392      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 808      |
|    fps             | 3        |
|    time_elapsed    | 996      |
|    total_timesteps | 3256     |
| train/             |          |
|    actor_loss      | -204     |
|    critic_loss     | 5.74e+03 |
|    ent_coef        | 1.02     |
|    ent_coef_loss   | -0.0368  |
|    learning_rate   | 0.0003   |
|    n_updates       | 394      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 812      |
|    fps             | 3        |
|    time_elapsed    | 1000     |
|    total_timesteps | 3264     |
| train/             |          |
|    actor_loss      | -188     |
|    critic_loss     | 5.25e+03 |
|    ent_coef        | 1.02     |
|    ent_coef_loss   | -0.0414  |
|    learning_rate   | 0.0003   |
|    n_updates       | 395      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 816      |
|    fps             | 3        |
|    time_elapsed    | 1006     |
|    total_timesteps | 3280     |
| train/             |          |
|    actor_loss      | -198     |
|    critic_loss     | 5.58e+03 |
|    ent_coef        | 1.02     |
|    ent_coef_loss   | -0.0422  |
|    learning_rate   | 0.0003   |
|    n_updates       | 397      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 820      |
|    fps             | 3        |
|    time_elapsed    | 1009     |
|    total_timesteps | 3288     |
| train/             |          |
|    actor_loss      | -197     |
|    critic_loss     | 6.27e+03 |
|    ent_coef        | 1.02     |
|    ent_coef_loss   | -0.0419  |
|    learning_rate   | 0.0003   |
|    n_updates       | 398      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 824      |
|    fps             | 3        |
|    time_elapsed    | 1015     |
|    total_timesteps | 3304     |
| train/             |          |
|    actor_loss      | -185     |
|    critic_loss     | 4.74e+03 |
|    ent_coef        | 1.02     |
|    ent_coef_loss   | -0.0406  |
|    learning_rate   | 0.0003   |
|    n_updates       | 400      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 828      |
|    fps             | 3        |
|    time_elapsed    | 1019     |
|    total_timesteps | 3312     |
| train/             |          |
|    actor_loss      | -210     |
|    critic_loss     | 6.26e+03 |
|    ent_coef        | 1.02     |
|    ent_coef_loss   | -0.0489  |
|    learning_rate   | 0.0003   |
|    n_updates       | 401      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 832      |
|    fps             | 3        |
|    time_elapsed    | 1025     |
|    total_timesteps | 3328     |
| train/             |          |
|    actor_loss      | -184     |
|    critic_loss     | 6.67e+03 |
|    ent_coef        | 1.02     |
|    ent_coef_loss   | -0.0528  |
|    learning_rate   | 0.0003   |
|    n_updates       | 403      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 836      |
|    fps             | 3        |
|    time_elapsed    | 1028     |
|    total_timesteps | 3336     |
| train/             |          |
|    actor_loss      | -202     |
|    critic_loss     | 4.77e+03 |
|    ent_coef        | 1.02     |
|    ent_coef_loss   | -0.0559  |
|    learning_rate   | 0.0003   |
|    n_updates       | 404      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 840      |
|    fps             | 3        |
|    time_elapsed    | 1034     |
|    total_timesteps | 3352     |
| train/             |          |
|    actor_loss      | -204     |
|    critic_loss     | 6.07e+03 |
|    ent_coef        | 1.02     |
|    ent_coef_loss   | -0.0572  |
|    learning_rate   | 0.0003   |
|    n_updates       | 406      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 844      |
|    fps             | 3        |
|    time_elapsed    | 1038     |
|    total_timesteps | 3360     |
| train/             |          |
|    actor_loss      | -208     |
|    critic_loss     | 5.44e+03 |
|    ent_coef        | 1.02     |
|    ent_coef_loss   | -0.0484  |
|    learning_rate   | 0.0003   |
|    n_updates       | 407      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 848      |
|    fps             | 3        |
|    time_elapsed    | 1044     |
|    total_timesteps | 3376     |
| train/             |          |
|    actor_loss      | -211     |
|    critic_loss     | 7.7e+03  |
|    ent_coef        | 1.02     |
|    ent_coef_loss   | -0.0432  |
|    learning_rate   | 0.0003   |
|    n_updates       | 409      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 852      |
|    fps             | 3        |
|    time_elapsed    | 1047     |
|    total_timesteps | 3384     |
| train/             |          |
|    actor_loss      | -208     |
|    critic_loss     | 6.12e+03 |
|    ent_coef        | 1.02     |
|    ent_coef_loss   | -0.0442  |
|    learning_rate   | 0.0003   |
|    n_updates       | 410      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 856      |
|    fps             | 3        |
|    time_elapsed    | 1054     |
|    total_timesteps | 3400     |
| train/             |          |
|    actor_loss      | -212     |
|    critic_loss     | 7.86e+03 |
|    ent_coef        | 1.02     |
|    ent_coef_loss   | -0.0508  |
|    learning_rate   | 0.0003   |
|    n_updates       | 412      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 860      |
|    fps             | 3        |
|    time_elapsed    | 1057     |
|    total_timesteps | 3408     |
| train/             |          |
|    actor_loss      | -203     |
|    critic_loss     | 3.44e+03 |
|    ent_coef        | 1.02     |
|    ent_coef_loss   | -0.0579  |
|    learning_rate   | 0.0003   |
|    n_updates       | 413      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 864      |
|    fps             | 3        |
|    time_elapsed    | 1063     |
|    total_timesteps | 3424     |
| train/             |          |
|    actor_loss      | -213     |
|    critic_loss     | 6.04e+03 |
|    ent_coef        | 1.02     |
|    ent_coef_loss   | -0.0611  |
|    learning_rate   | 0.0003   |
|    n_updates       | 415      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 868      |
|    fps             | 3        |
|    time_elapsed    | 1067     |
|    total_timesteps | 3432     |
| train/             |          |
|    actor_loss      | -205     |
|    critic_loss     | 5.59e+03 |
|    ent_coef        | 1.02     |
|    ent_coef_loss   | -0.0624  |
|    learning_rate   | 0.0003   |
|    n_updates       | 416      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 872      |
|    fps             | 3        |
|    time_elapsed    | 1073     |
|    total_timesteps | 3448     |
| train/             |          |
|    actor_loss      | -219     |
|    critic_loss     | 5.8e+03  |
|    ent_coef        | 1.02     |
|    ent_coef_loss   | -0.0643  |
|    learning_rate   | 0.0003   |
|    n_updates       | 418      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 876      |
|    fps             | 3        |
|    time_elapsed    | 1076     |
|    total_timesteps | 3456     |
| train/             |          |
|    actor_loss      | -204     |
|    critic_loss     | 3.7e+03  |
|    ent_coef        | 1.02     |
|    ent_coef_loss   | -0.0676  |
|    learning_rate   | 0.0003   |
|    n_updates       | 419      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 880      |
|    fps             | 3        |
|    time_elapsed    | 1082     |
|    total_timesteps | 3472     |
| train/             |          |
|    actor_loss      | -220     |
|    critic_loss     | 4.38e+03 |
|    ent_coef        | 1.03     |
|    ent_coef_loss   | -0.0587  |
|    learning_rate   | 0.0003   |
|    n_updates       | 421      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 884      |
|    fps             | 3        |
|    time_elapsed    | 1086     |
|    total_timesteps | 3480     |
| train/             |          |
|    actor_loss      | -218     |
|    critic_loss     | 4.57e+03 |
|    ent_coef        | 1.03     |
|    ent_coef_loss   | -0.0603  |
|    learning_rate   | 0.0003   |
|    n_updates       | 422      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 888      |
|    fps             | 3        |
|    time_elapsed    | 1092     |
|    total_timesteps | 3496     |
| train/             |          |
|    actor_loss      | -220     |
|    critic_loss     | 5.17e+03 |
|    ent_coef        | 1.03     |
|    ent_coef_loss   | -0.0638  |
|    learning_rate   | 0.0003   |
|    n_updates       | 424      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 892      |
|    fps             | 3        |
|    time_elapsed    | 1095     |
|    total_timesteps | 3504     |
| train/             |          |
|    actor_loss      | -206     |
|    critic_loss     | 4.68e+03 |
|    ent_coef        | 1.03     |
|    ent_coef_loss   | -0.0643  |
|    learning_rate   | 0.0003   |
|    n_updates       | 425      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 896      |
|    fps             | 3        |
|    time_elapsed    | 1101     |
|    total_timesteps | 3520     |
| train/             |          |
|    actor_loss      | -235     |
|    critic_loss     | 6.38e+03 |
|    ent_coef        | 1.03     |
|    ent_coef_loss   | -0.0696  |
|    learning_rate   | 0.0003   |
|    n_updates       | 427      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 900      |
|    fps             | 3        |
|    time_elapsed    | 1105     |
|    total_timesteps | 3528     |
| train/             |          |
|    actor_loss      | -218     |
|    critic_loss     | 6.44e+03 |
|    ent_coef        | 1.03     |
|    ent_coef_loss   | -0.0761  |
|    learning_rate   | 0.0003   |
|    n_updates       | 428      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 904      |
|    fps             | 3        |
|    time_elapsed    | 1110     |
|    total_timesteps | 3544     |
| train/             |          |
|    actor_loss      | -217     |
|    critic_loss     | 5.78e+03 |
|    ent_coef        | 1.03     |
|    ent_coef_loss   | -0.0719  |
|    learning_rate   | 0.0003   |
|    n_updates       | 430      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 908      |
|    fps             | 3        |
|    time_elapsed    | 1114     |
|    total_timesteps | 3552     |
| train/             |          |
|    actor_loss      | -220     |
|    critic_loss     | 3.96e+03 |
|    ent_coef        | 1.03     |
|    ent_coef_loss   | -0.0825  |
|    learning_rate   | 0.0003   |
|    n_updates       | 431      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 912      |
|    fps             | 3        |
|    time_elapsed    | 1120     |
|    total_timesteps | 3568     |
| train/             |          |
|    actor_loss      | -211     |
|    critic_loss     | 5.12e+03 |
|    ent_coef        | 1.03     |
|    ent_coef_loss   | -0.0779  |
|    learning_rate   | 0.0003   |
|    n_updates       | 433      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 916      |
|    fps             | 3        |
|    time_elapsed    | 1123     |
|    total_timesteps | 3576     |
| train/             |          |
|    actor_loss      | -219     |
|    critic_loss     | 5.97e+03 |
|    ent_coef        | 1.03     |
|    ent_coef_loss   | -0.0738  |
|    learning_rate   | 0.0003   |
|    n_updates       | 434      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 920      |
|    fps             | 3        |
|    time_elapsed    | 1129     |
|    total_timesteps | 3592     |
| train/             |          |
|    actor_loss      | -215     |
|    critic_loss     | 6.66e+03 |
|    ent_coef        | 1.03     |
|    ent_coef_loss   | -0.0823  |
|    learning_rate   | 0.0003   |
|    n_updates       | 436      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 924      |
|    fps             | 3        |
|    time_elapsed    | 1133     |
|    total_timesteps | 3600     |
| train/             |          |
|    actor_loss      | -229     |
|    critic_loss     | 7.71e+03 |
|    ent_coef        | 1.03     |
|    ent_coef_loss   | -0.083   |
|    learning_rate   | 0.0003   |
|    n_updates       | 437      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 928      |
|    fps             | 3        |
|    time_elapsed    | 1139     |
|    total_timesteps | 3616     |
| train/             |          |
|    actor_loss      | -230     |
|    critic_loss     | 6.29e+03 |
|    ent_coef        | 1.03     |
|    ent_coef_loss   | -0.0899  |
|    learning_rate   | 0.0003   |
|    n_updates       | 439      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 932      |
|    fps             | 3        |
|    time_elapsed    | 1142     |
|    total_timesteps | 3624     |
| train/             |          |
|    actor_loss      | -227     |
|    critic_loss     | 5.54e+03 |
|    ent_coef        | 1.03     |
|    ent_coef_loss   | -0.0818  |
|    learning_rate   | 0.0003   |
|    n_updates       | 440      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 936      |
|    fps             | 3        |
|    time_elapsed    | 1148     |
|    total_timesteps | 3640     |
| train/             |          |
|    actor_loss      | -223     |
|    critic_loss     | 4.79e+03 |
|    ent_coef        | 1.03     |
|    ent_coef_loss   | -0.0811  |
|    learning_rate   | 0.0003   |
|    n_updates       | 442      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 940      |
|    fps             | 3        |
|    time_elapsed    | 1151     |
|    total_timesteps | 3648     |
| train/             |          |
|    actor_loss      | -223     |
|    critic_loss     | 9.57e+03 |
|    ent_coef        | 1.03     |
|    ent_coef_loss   | -0.0851  |
|    learning_rate   | 0.0003   |
|    n_updates       | 443      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 944      |
|    fps             | 3        |
|    time_elapsed    | 1157     |
|    total_timesteps | 3664     |
| train/             |          |
|    actor_loss      | -242     |
|    critic_loss     | 7.52e+03 |
|    ent_coef        | 1.03     |
|    ent_coef_loss   | -0.088   |
|    learning_rate   | 0.0003   |
|    n_updates       | 445      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 948      |
|    fps             | 3        |
|    time_elapsed    | 1161     |
|    total_timesteps | 3672     |
| train/             |          |
|    actor_loss      | -230     |
|    critic_loss     | 5.17e+03 |
|    ent_coef        | 1.03     |
|    ent_coef_loss   | -0.0929  |
|    learning_rate   | 0.0003   |
|    n_updates       | 446      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 952      |
|    fps             | 3        |
|    time_elapsed    | 1167     |
|    total_timesteps | 3688     |
| train/             |          |
|    actor_loss      | -217     |
|    critic_loss     | 4.75e+03 |
|    ent_coef        | 1.03     |
|    ent_coef_loss   | -0.0984  |
|    learning_rate   | 0.0003   |
|    n_updates       | 448      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 956      |
|    fps             | 3        |
|    time_elapsed    | 1170     |
|    total_timesteps | 3696     |
| train/             |          |
|    actor_loss      | -222     |
|    critic_loss     | 6.16e+03 |
|    ent_coef        | 1.03     |
|    ent_coef_loss   | -0.105   |
|    learning_rate   | 0.0003   |
|    n_updates       | 449      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 960      |
|    fps             | 3        |
|    time_elapsed    | 1176     |
|    total_timesteps | 3712     |
| train/             |          |
|    actor_loss      | -232     |
|    critic_loss     | 3.41e+03 |
|    ent_coef        | 1.03     |
|    ent_coef_loss   | -0.0978  |
|    learning_rate   | 0.0003   |
|    n_updates       | 451      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 964      |
|    fps             | 3        |
|    time_elapsed    | 1180     |
|    total_timesteps | 3720     |
| train/             |          |
|    actor_loss      | -224     |
|    critic_loss     | 7.23e+03 |
|    ent_coef        | 1.04     |
|    ent_coef_loss   | -0.112   |
|    learning_rate   | 0.0003   |
|    n_updates       | 452      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 968      |
|    fps             | 3        |
|    time_elapsed    | 1186     |
|    total_timesteps | 3736     |
| train/             |          |
|    actor_loss      | -213     |
|    critic_loss     | 4.98e+03 |
|    ent_coef        | 1.04     |
|    ent_coef_loss   | -0.108   |
|    learning_rate   | 0.0003   |
|    n_updates       | 454      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 972      |
|    fps             | 3        |
|    time_elapsed    | 1189     |
|    total_timesteps | 3744     |
| train/             |          |
|    actor_loss      | -231     |
|    critic_loss     | 4.57e+03 |
|    ent_coef        | 1.04     |
|    ent_coef_loss   | -0.113   |
|    learning_rate   | 0.0003   |
|    n_updates       | 455      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 976      |
|    fps             | 3        |
|    time_elapsed    | 1195     |
|    total_timesteps | 3760     |
| train/             |          |
|    actor_loss      | -242     |
|    critic_loss     | 3.88e+03 |
|    ent_coef        | 1.04     |
|    ent_coef_loss   | -0.105   |
|    learning_rate   | 0.0003   |
|    n_updates       | 457      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 980      |
|    fps             | 3        |
|    time_elapsed    | 1199     |
|    total_timesteps | 3768     |
| train/             |          |
|    actor_loss      | -235     |
|    critic_loss     | 5.38e+03 |
|    ent_coef        | 1.04     |
|    ent_coef_loss   | -0.0998  |
|    learning_rate   | 0.0003   |
|    n_updates       | 458      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 984      |
|    fps             | 3        |
|    time_elapsed    | 1205     |
|    total_timesteps | 3784     |
| train/             |          |
|    actor_loss      | -220     |
|    critic_loss     | 6.79e+03 |
|    ent_coef        | 1.04     |
|    ent_coef_loss   | -0.105   |
|    learning_rate   | 0.0003   |
|    n_updates       | 460      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 988      |
|    fps             | 3        |
|    time_elapsed    | 1208     |
|    total_timesteps | 3792     |
| train/             |          |
|    actor_loss      | -234     |
|    critic_loss     | 8.59e+03 |
|    ent_coef        | 1.04     |
|    ent_coef_loss   | -0.112   |
|    learning_rate   | 0.0003   |
|    n_updates       | 461      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 992      |
|    fps             | 3        |
|    time_elapsed    | 1214     |
|    total_timesteps | 3808     |
| train/             |          |
|    actor_loss      | -246     |
|    critic_loss     | 2.37e+03 |
|    ent_coef        | 1.04     |
|    ent_coef_loss   | -0.115   |
|    learning_rate   | 0.0003   |
|    n_updates       | 463      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 996      |
|    fps             | 3        |
|    time_elapsed    | 1217     |
|    total_timesteps | 3816     |
| train/             |          |
|    actor_loss      | -246     |
|    critic_loss     | 4.45e+03 |
|    ent_coef        | 1.04     |
|    ent_coef_loss   | -0.114   |
|    learning_rate   | 0.0003   |
|    n_updates       | 464      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1000     |
|    fps             | 3        |
|    time_elapsed    | 1223     |
|    total_timesteps | 3832     |
| train/             |          |
|    actor_loss      | -247     |
|    critic_loss     | 4.29e+03 |
|    ent_coef        | 1.04     |
|    ent_coef_loss   | -0.122   |
|    learning_rate   | 0.0003   |
|    n_updates       | 466      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1004     |
|    fps             | 3        |
|    time_elapsed    | 1227     |
|    total_timesteps | 3840     |
| train/             |          |
|    actor_loss      | -249     |
|    critic_loss     | 2.86e+03 |
|    ent_coef        | 1.04     |
|    ent_coef_loss   | -0.118   |
|    learning_rate   | 0.0003   |
|    n_updates       | 467      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1008     |
|    fps             | 3        |
|    time_elapsed    | 1233     |
|    total_timesteps | 3856     |
| train/             |          |
|    actor_loss      | -247     |
|    critic_loss     | 3.88e+03 |
|    ent_coef        | 1.04     |
|    ent_coef_loss   | -0.123   |
|    learning_rate   | 0.0003   |
|    n_updates       | 469      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1012     |
|    fps             | 3        |
|    time_elapsed    | 1236     |
|    total_timesteps | 3864     |
| train/             |          |
|    actor_loss      | -240     |
|    critic_loss     | 5.87e+03 |
|    ent_coef        | 1.04     |
|    ent_coef_loss   | -0.136   |
|    learning_rate   | 0.0003   |
|    n_updates       | 470      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1016     |
|    fps             | 3        |
|    time_elapsed    | 1242     |
|    total_timesteps | 3880     |
| train/             |          |
|    actor_loss      | -248     |
|    critic_loss     | 4.96e+03 |
|    ent_coef        | 1.04     |
|    ent_coef_loss   | -0.132   |
|    learning_rate   | 0.0003   |
|    n_updates       | 472      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1020     |
|    fps             | 3        |
|    time_elapsed    | 1246     |
|    total_timesteps | 3888     |
| train/             |          |
|    actor_loss      | -245     |
|    critic_loss     | 4.08e+03 |
|    ent_coef        | 1.04     |
|    ent_coef_loss   | -0.136   |
|    learning_rate   | 0.0003   |
|    n_updates       | 473      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1024     |
|    fps             | 3        |
|    time_elapsed    | 1251     |
|    total_timesteps | 3904     |
| train/             |          |
|    actor_loss      | -238     |
|    critic_loss     | 4.28e+03 |
|    ent_coef        | 1.04     |
|    ent_coef_loss   | -0.137   |
|    learning_rate   | 0.0003   |
|    n_updates       | 475      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1028     |
|    fps             | 3        |
|    time_elapsed    | 1255     |
|    total_timesteps | 3912     |
| train/             |          |
|    actor_loss      | -250     |
|    critic_loss     | 2.21e+03 |
|    ent_coef        | 1.04     |
|    ent_coef_loss   | -0.141   |
|    learning_rate   | 0.0003   |
|    n_updates       | 476      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1032     |
|    fps             | 3        |
|    time_elapsed    | 1261     |
|    total_timesteps | 3928     |
| train/             |          |
|    actor_loss      | -271     |
|    critic_loss     | 6.3e+03  |
|    ent_coef        | 1.04     |
|    ent_coef_loss   | -0.14    |
|    learning_rate   | 0.0003   |
|    n_updates       | 478      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1036     |
|    fps             | 3        |
|    time_elapsed    | 1265     |
|    total_timesteps | 3936     |
| train/             |          |
|    actor_loss      | -241     |
|    critic_loss     | 5.22e+03 |
|    ent_coef        | 1.05     |
|    ent_coef_loss   | -0.153   |
|    learning_rate   | 0.0003   |
|    n_updates       | 479      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1040     |
|    fps             | 3        |
|    time_elapsed    | 1271     |
|    total_timesteps | 3952     |
| train/             |          |
|    actor_loss      | -259     |
|    critic_loss     | 5.21e+03 |
|    ent_coef        | 1.05     |
|    ent_coef_loss   | -0.136   |
|    learning_rate   | 0.0003   |
|    n_updates       | 481      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1044     |
|    fps             | 3        |
|    time_elapsed    | 1275     |
|    total_timesteps | 3960     |
| train/             |          |
|    actor_loss      | -233     |
|    critic_loss     | 4.91e+03 |
|    ent_coef        | 1.05     |
|    ent_coef_loss   | -0.147   |
|    learning_rate   | 0.0003   |
|    n_updates       | 482      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1048     |
|    fps             | 3        |
|    time_elapsed    | 1281     |
|    total_timesteps | 3976     |
| train/             |          |
|    actor_loss      | -239     |
|    critic_loss     | 4.48e+03 |
|    ent_coef        | 1.05     |
|    ent_coef_loss   | -0.153   |
|    learning_rate   | 0.0003   |
|    n_updates       | 484      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1052     |
|    fps             | 3        |
|    time_elapsed    | 1285     |
|    total_timesteps | 3984     |
| train/             |          |
|    actor_loss      | -241     |
|    critic_loss     | 3.91e+03 |
|    ent_coef        | 1.05     |
|    ent_coef_loss   | -0.145   |
|    learning_rate   | 0.0003   |
|    n_updates       | 485      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1056     |
|    fps             | 3        |
|    time_elapsed    | 1291     |
|    total_timesteps | 4000     |
| train/             |          |
|    actor_loss      | -238     |
|    critic_loss     | 4.85e+03 |
|    ent_coef        | 1.05     |
|    ent_coef_loss   | -0.175   |
|    learning_rate   | 0.0003   |
|    n_updates       | 487      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1060     |
|    fps             | 3        |
|    time_elapsed    | 1295     |
|    total_timesteps | 4008     |
| train/             |          |
|    actor_loss      | -240     |
|    critic_loss     | 4.45e+03 |
|    ent_coef        | 1.05     |
|    ent_coef_loss   | -0.174   |
|    learning_rate   | 0.0003   |
|    n_updates       | 488      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1064     |
|    fps             | 3        |
|    time_elapsed    | 1301     |
|    total_timesteps | 4024     |
| train/             |          |
|    actor_loss      | -246     |
|    critic_loss     | 3.73e+03 |
|    ent_coef        | 1.05     |
|    ent_coef_loss   | -0.173   |
|    learning_rate   | 0.0003   |
|    n_updates       | 490      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1068     |
|    fps             | 3        |
|    time_elapsed    | 1304     |
|    total_timesteps | 4032     |
| train/             |          |
|    actor_loss      | -240     |
|    critic_loss     | 2.88e+03 |
|    ent_coef        | 1.05     |
|    ent_coef_loss   | -0.154   |
|    learning_rate   | 0.0003   |
|    n_updates       | 491      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1072     |
|    fps             | 3        |
|    time_elapsed    | 1310     |
|    total_timesteps | 4048     |
| train/             |          |
|    actor_loss      | -250     |
|    critic_loss     | 3.5e+03  |
|    ent_coef        | 1.05     |
|    ent_coef_loss   | -0.155   |
|    learning_rate   | 0.0003   |
|    n_updates       | 493      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1076     |
|    fps             | 3        |
|    time_elapsed    | 1314     |
|    total_timesteps | 4056     |
| train/             |          |
|    actor_loss      | -243     |
|    critic_loss     | 4.11e+03 |
|    ent_coef        | 1.05     |
|    ent_coef_loss   | -0.15    |
|    learning_rate   | 0.0003   |
|    n_updates       | 494      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1080     |
|    fps             | 3        |
|    time_elapsed    | 1320     |
|    total_timesteps | 4072     |
| train/             |          |
|    actor_loss      | -230     |
|    critic_loss     | 2.71e+03 |
|    ent_coef        | 1.05     |
|    ent_coef_loss   | -0.16    |
|    learning_rate   | 0.0003   |
|    n_updates       | 496      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1084     |
|    fps             | 3        |
|    time_elapsed    | 1324     |
|    total_timesteps | 4080     |
| train/             |          |
|    actor_loss      | -263     |
|    critic_loss     | 5.67e+03 |
|    ent_coef        | 1.05     |
|    ent_coef_loss   | -0.172   |
|    learning_rate   | 0.0003   |
|    n_updates       | 497      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1088     |
|    fps             | 3        |
|    time_elapsed    | 1330     |
|    total_timesteps | 4096     |
| train/             |          |
|    actor_loss      | -234     |
|    critic_loss     | 5.12e+03 |
|    ent_coef        | 1.05     |
|    ent_coef_loss   | -0.189   |
|    learning_rate   | 0.0003   |
|    n_updates       | 499      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1092     |
|    fps             | 3        |
|    time_elapsed    | 1333     |
|    total_timesteps | 4104     |
| train/             |          |
|    actor_loss      | -254     |
|    critic_loss     | 7.68e+03 |
|    ent_coef        | 1.05     |
|    ent_coef_loss   | -0.185   |
|    learning_rate   | 0.0003   |
|    n_updates       | 500      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1096     |
|    fps             | 3        |
|    time_elapsed    | 1339     |
|    total_timesteps | 4120     |
| train/             |          |
|    actor_loss      | -244     |
|    critic_loss     | 2.18e+03 |
|    ent_coef        | 1.05     |
|    ent_coef_loss   | -0.194   |
|    learning_rate   | 0.0003   |
|    n_updates       | 502      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1100     |
|    fps             | 3        |
|    time_elapsed    | 1343     |
|    total_timesteps | 4128     |
| train/             |          |
|    actor_loss      | -256     |
|    critic_loss     | 5.33e+03 |
|    ent_coef        | 1.05     |
|    ent_coef_loss   | -0.19    |
|    learning_rate   | 0.0003   |
|    n_updates       | 503      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1104     |
|    fps             | 3        |
|    time_elapsed    | 1349     |
|    total_timesteps | 4144     |
| train/             |          |
|    actor_loss      | -263     |
|    critic_loss     | 2.97e+03 |
|    ent_coef        | 1.06     |
|    ent_coef_loss   | -0.185   |
|    learning_rate   | 0.0003   |
|    n_updates       | 505      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 511      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1108     |
|    fps             | 3        |
|    time_elapsed    | 1353     |
|    total_timesteps | 4152     |
| train/             |          |
|    actor_loss      | -259     |
|    critic_loss     | 3.6e+03  |
|    ent_coef        | 1.06     |
|    ent_coef_loss   | -0.169   |
|    learning_rate   | 0.0003   |
|    n_updates       | 506      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1112     |
|    fps             | 3        |
|    time_elapsed    | 1359     |
|    total_timesteps | 4168     |
| train/             |          |
|    actor_loss      | -258     |
|    critic_loss     | 3.68e+03 |
|    ent_coef        | 1.06     |
|    ent_coef_loss   | -0.169   |
|    learning_rate   | 0.0003   |
|    n_updates       | 508      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1116     |
|    fps             | 3        |
|    time_elapsed    | 1362     |
|    total_timesteps | 4176     |
| train/             |          |
|    actor_loss      | -257     |
|    critic_loss     | 5.19e+03 |
|    ent_coef        | 1.06     |
|    ent_coef_loss   | -0.187   |
|    learning_rate   | 0.0003   |
|    n_updates       | 509      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1120     |
|    fps             | 3        |
|    time_elapsed    | 1368     |
|    total_timesteps | 4192     |
| train/             |          |
|    actor_loss      | -261     |
|    critic_loss     | 3.18e+03 |
|    ent_coef        | 1.06     |
|    ent_coef_loss   | -0.213   |
|    learning_rate   | 0.0003   |
|    n_updates       | 511      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1124     |
|    fps             | 3        |
|    time_elapsed    | 1372     |
|    total_timesteps | 4200     |
| train/             |          |
|    actor_loss      | -260     |
|    critic_loss     | 5.04e+03 |
|    ent_coef        | 1.06     |
|    ent_coef_loss   | -0.216   |
|    learning_rate   | 0.0003   |
|    n_updates       | 512      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1128     |
|    fps             | 3        |
|    time_elapsed    | 1378     |
|    total_timesteps | 4216     |
| train/             |          |
|    actor_loss      | -261     |
|    critic_loss     | 3.03e+03 |
|    ent_coef        | 1.06     |
|    ent_coef_loss   | -0.232   |
|    learning_rate   | 0.0003   |
|    n_updates       | 514      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1132     |
|    fps             | 3        |
|    time_elapsed    | 1381     |
|    total_timesteps | 4224     |
| train/             |          |
|    actor_loss      | -269     |
|    critic_loss     | 3.06e+03 |
|    ent_coef        | 1.06     |
|    ent_coef_loss   | -0.215   |
|    learning_rate   | 0.0003   |
|    n_updates       | 515      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1136     |
|    fps             | 3        |
|    time_elapsed    | 1387     |
|    total_timesteps | 4240     |
| train/             |          |
|    actor_loss      | -264     |
|    critic_loss     | 3.97e+03 |
|    ent_coef        | 1.06     |
|    ent_coef_loss   | -0.209   |
|    learning_rate   | 0.0003   |
|    n_updates       | 517      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1140     |
|    fps             | 3        |
|    time_elapsed    | 1391     |
|    total_timesteps | 4248     |
| train/             |          |
|    actor_loss      | -267     |
|    critic_loss     | 3.39e+03 |
|    ent_coef        | 1.06     |
|    ent_coef_loss   | -0.211   |
|    learning_rate   | 0.0003   |
|    n_updates       | 518      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1144     |
|    fps             | 3        |
|    time_elapsed    | 1397     |
|    total_timesteps | 4264     |
| train/             |          |
|    actor_loss      | -269     |
|    critic_loss     | 4.51e+03 |
|    ent_coef        | 1.06     |
|    ent_coef_loss   | -0.195   |
|    learning_rate   | 0.0003   |
|    n_updates       | 520      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1148     |
|    fps             | 3        |
|    time_elapsed    | 1400     |
|    total_timesteps | 4272     |
| train/             |          |
|    actor_loss      | -268     |
|    critic_loss     | 2.84e+03 |
|    ent_coef        | 1.06     |
|    ent_coef_loss   | -0.209   |
|    learning_rate   | 0.0003   |
|    n_updates       | 521      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1152     |
|    fps             | 3        |
|    time_elapsed    | 1406     |
|    total_timesteps | 4288     |
| train/             |          |
|    actor_loss      | -258     |
|    critic_loss     | 2.61e+03 |
|    ent_coef        | 1.06     |
|    ent_coef_loss   | -0.209   |
|    learning_rate   | 0.0003   |
|    n_updates       | 523      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1156     |
|    fps             | 3        |
|    time_elapsed    | 1409     |
|    total_timesteps | 4296     |
| train/             |          |
|    actor_loss      | -269     |
|    critic_loss     | 2.22e+03 |
|    ent_coef        | 1.06     |
|    ent_coef_loss   | -0.209   |
|    learning_rate   | 0.0003   |
|    n_updates       | 524      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1160     |
|    fps             | 3        |
|    time_elapsed    | 1415     |
|    total_timesteps | 4312     |
| train/             |          |
|    actor_loss      | -273     |
|    critic_loss     | 2.79e+03 |
|    ent_coef        | 1.06     |
|    ent_coef_loss   | -0.227   |
|    learning_rate   | 0.0003   |
|    n_updates       | 526      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1164     |
|    fps             | 3        |
|    time_elapsed    | 1419     |
|    total_timesteps | 4320     |
| train/             |          |
|    actor_loss      | -269     |
|    critic_loss     | 2.41e+03 |
|    ent_coef        | 1.06     |
|    ent_coef_loss   | -0.226   |
|    learning_rate   | 0.0003   |
|    n_updates       | 527      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1168     |
|    fps             | 3        |
|    time_elapsed    | 1425     |
|    total_timesteps | 4336     |
| train/             |          |
|    actor_loss      | -270     |
|    critic_loss     | 2.65e+03 |
|    ent_coef        | 1.07     |
|    ent_coef_loss   | -0.232   |
|    learning_rate   | 0.0003   |
|    n_updates       | 529      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1172     |
|    fps             | 3        |
|    time_elapsed    | 1428     |
|    total_timesteps | 4344     |
| train/             |          |
|    actor_loss      | -261     |
|    critic_loss     | 5.49e+03 |
|    ent_coef        | 1.07     |
|    ent_coef_loss   | -0.232   |
|    learning_rate   | 0.0003   |
|    n_updates       | 530      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1176     |
|    fps             | 3        |
|    time_elapsed    | 1434     |
|    total_timesteps | 4360     |
| train/             |          |
|    actor_loss      | -260     |
|    critic_loss     | 5.19e+03 |
|    ent_coef        | 1.07     |
|    ent_coef_loss   | -0.236   |
|    learning_rate   | 0.0003   |
|    n_updates       | 532      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1180     |
|    fps             | 3        |
|    time_elapsed    | 1438     |
|    total_timesteps | 4368     |
| train/             |          |
|    actor_loss      | -263     |
|    critic_loss     | 2.5e+03  |
|    ent_coef        | 1.07     |
|    ent_coef_loss   | -0.225   |
|    learning_rate   | 0.0003   |
|    n_updates       | 533      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1184     |
|    fps             | 3        |
|    time_elapsed    | 1444     |
|    total_timesteps | 4384     |
| train/             |          |
|    actor_loss      | -267     |
|    critic_loss     | 2.25e+03 |
|    ent_coef        | 1.07     |
|    ent_coef_loss   | -0.226   |
|    learning_rate   | 0.0003   |
|    n_updates       | 535      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1188     |
|    fps             | 3        |
|    time_elapsed    | 1447     |
|    total_timesteps | 4392     |
| train/             |          |
|    actor_loss      | -283     |
|    critic_loss     | 2.62e+03 |
|    ent_coef        | 1.07     |
|    ent_coef_loss   | -0.245   |
|    learning_rate   | 0.0003   |
|    n_updates       | 536      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1192     |
|    fps             | 3        |
|    time_elapsed    | 1453     |
|    total_timesteps | 4408     |
| train/             |          |
|    actor_loss      | -269     |
|    critic_loss     | 4.62e+03 |
|    ent_coef        | 1.07     |
|    ent_coef_loss   | -0.25    |
|    learning_rate   | 0.0003   |
|    n_updates       | 538      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1196     |
|    fps             | 3        |
|    time_elapsed    | 1456     |
|    total_timesteps | 4416     |
| train/             |          |
|    actor_loss      | -267     |
|    critic_loss     | 4.53e+03 |
|    ent_coef        | 1.07     |
|    ent_coef_loss   | -0.258   |
|    learning_rate   | 0.0003   |
|    n_updates       | 539      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1200     |
|    fps             | 3        |
|    time_elapsed    | 1462     |
|    total_timesteps | 4432     |
| train/             |          |
|    actor_loss      | -274     |
|    critic_loss     | 5.24e+03 |
|    ent_coef        | 1.07     |
|    ent_coef_loss   | -0.245   |
|    learning_rate   | 0.0003   |
|    n_updates       | 541      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1204     |
|    fps             | 3        |
|    time_elapsed    | 1466     |
|    total_timesteps | 4440     |
| train/             |          |
|    actor_loss      | -286     |
|    critic_loss     | 2.44e+03 |
|    ent_coef        | 1.07     |
|    ent_coef_loss   | -0.259   |
|    learning_rate   | 0.0003   |
|    n_updates       | 542      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1208     |
|    fps             | 3        |
|    time_elapsed    | 1472     |
|    total_timesteps | 4456     |
| train/             |          |
|    actor_loss      | -289     |
|    critic_loss     | 4.27e+03 |
|    ent_coef        | 1.07     |
|    ent_coef_loss   | -0.267   |
|    learning_rate   | 0.0003   |
|    n_updates       | 544      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1212     |
|    fps             | 3        |
|    time_elapsed    | 1475     |
|    total_timesteps | 4464     |
| train/             |          |
|    actor_loss      | -270     |
|    critic_loss     | 3.68e+03 |
|    ent_coef        | 1.07     |
|    ent_coef_loss   | -0.257   |
|    learning_rate   | 0.0003   |
|    n_updates       | 545      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1216     |
|    fps             | 3        |
|    time_elapsed    | 1481     |
|    total_timesteps | 4480     |
| train/             |          |
|    actor_loss      | -280     |
|    critic_loss     | 3.81e+03 |
|    ent_coef        | 1.07     |
|    ent_coef_loss   | -0.261   |
|    learning_rate   | 0.0003   |
|    n_updates       | 547      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1220     |
|    fps             | 3        |
|    time_elapsed    | 1485     |
|    total_timesteps | 4488     |
| train/             |          |
|    actor_loss      | -275     |
|    critic_loss     | 2.9e+03  |
|    ent_coef        | 1.07     |
|    ent_coef_loss   | -0.255   |
|    learning_rate   | 0.0003   |
|    n_updates       | 548      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1224     |
|    fps             | 3        |
|    time_elapsed    | 1491     |
|    total_timesteps | 4504     |
| train/             |          |
|    actor_loss      | -277     |
|    critic_loss     | 3.15e+03 |
|    ent_coef        | 1.07     |
|    ent_coef_loss   | -0.269   |
|    learning_rate   | 0.0003   |
|    n_updates       | 550      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1228     |
|    fps             | 3        |
|    time_elapsed    | 1494     |
|    total_timesteps | 4512     |
| train/             |          |
|    actor_loss      | -291     |
|    critic_loss     | 2.7e+03  |
|    ent_coef        | 1.07     |
|    ent_coef_loss   | -0.257   |
|    learning_rate   | 0.0003   |
|    n_updates       | 551      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1232     |
|    fps             | 3        |
|    time_elapsed    | 1500     |
|    total_timesteps | 4528     |
| train/             |          |
|    actor_loss      | -289     |
|    critic_loss     | 3.97e+03 |
|    ent_coef        | 1.08     |
|    ent_coef_loss   | -0.284   |
|    learning_rate   | 0.0003   |
|    n_updates       | 553      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1236     |
|    fps             | 3        |
|    time_elapsed    | 1504     |
|    total_timesteps | 4536     |
| train/             |          |
|    actor_loss      | -285     |
|    critic_loss     | 3.75e+03 |
|    ent_coef        | 1.08     |
|    ent_coef_loss   | -0.299   |
|    learning_rate   | 0.0003   |
|    n_updates       | 554      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1240     |
|    fps             | 3        |
|    time_elapsed    | 1510     |
|    total_timesteps | 4552     |
| train/             |          |
|    actor_loss      | -284     |
|    critic_loss     | 2.01e+03 |
|    ent_coef        | 1.08     |
|    ent_coef_loss   | -0.297   |
|    learning_rate   | 0.0003   |
|    n_updates       | 556      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1244     |
|    fps             | 3        |
|    time_elapsed    | 1513     |
|    total_timesteps | 4560     |
| train/             |          |
|    actor_loss      | -298     |
|    critic_loss     | 3.04e+03 |
|    ent_coef        | 1.08     |
|    ent_coef_loss   | -0.289   |
|    learning_rate   | 0.0003   |
|    n_updates       | 557      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1248     |
|    fps             | 3        |
|    time_elapsed    | 1519     |
|    total_timesteps | 4576     |
| train/             |          |
|    actor_loss      | -279     |
|    critic_loss     | 3.16e+03 |
|    ent_coef        | 1.08     |
|    ent_coef_loss   | -0.265   |
|    learning_rate   | 0.0003   |
|    n_updates       | 559      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1252     |
|    fps             | 3        |
|    time_elapsed    | 1522     |
|    total_timesteps | 4584     |
| train/             |          |
|    actor_loss      | -274     |
|    critic_loss     | 2.04e+03 |
|    ent_coef        | 1.08     |
|    ent_coef_loss   | -0.268   |
|    learning_rate   | 0.0003   |
|    n_updates       | 560      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1256     |
|    fps             | 3        |
|    time_elapsed    | 1528     |
|    total_timesteps | 4600     |
| train/             |          |
|    actor_loss      | -283     |
|    critic_loss     | 2.61e+03 |
|    ent_coef        | 1.08     |
|    ent_coef_loss   | -0.294   |
|    learning_rate   | 0.0003   |
|    n_updates       | 562      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1260     |
|    fps             | 3        |
|    time_elapsed    | 1532     |
|    total_timesteps | 4608     |
| train/             |          |
|    actor_loss      | -304     |
|    critic_loss     | 2.19e+03 |
|    ent_coef        | 1.08     |
|    ent_coef_loss   | -0.3     |
|    learning_rate   | 0.0003   |
|    n_updates       | 563      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1264     |
|    fps             | 3        |
|    time_elapsed    | 1538     |
|    total_timesteps | 4624     |
| train/             |          |
|    actor_loss      | -292     |
|    critic_loss     | 1.96e+03 |
|    ent_coef        | 1.08     |
|    ent_coef_loss   | -0.319   |
|    learning_rate   | 0.0003   |
|    n_updates       | 565      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1268     |
|    fps             | 3        |
|    time_elapsed    | 1541     |
|    total_timesteps | 4632     |
| train/             |          |
|    actor_loss      | -300     |
|    critic_loss     | 2.52e+03 |
|    ent_coef        | 1.08     |
|    ent_coef_loss   | -0.319   |
|    learning_rate   | 0.0003   |
|    n_updates       | 566      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1272     |
|    fps             | 3        |
|    time_elapsed    | 1547     |
|    total_timesteps | 4648     |
| train/             |          |
|    actor_loss      | -291     |
|    critic_loss     | 4.07e+03 |
|    ent_coef        | 1.08     |
|    ent_coef_loss   | -0.313   |
|    learning_rate   | 0.0003   |
|    n_updates       | 568      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1276     |
|    fps             | 3        |
|    time_elapsed    | 1551     |
|    total_timesteps | 4656     |
| train/             |          |
|    actor_loss      | -293     |
|    critic_loss     | 1.45e+03 |
|    ent_coef        | 1.08     |
|    ent_coef_loss   | -0.311   |
|    learning_rate   | 0.0003   |
|    n_updates       | 569      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1280     |
|    fps             | 3        |
|    time_elapsed    | 1556     |
|    total_timesteps | 4672     |
| train/             |          |
|    actor_loss      | -299     |
|    critic_loss     | 3.08e+03 |
|    ent_coef        | 1.08     |
|    ent_coef_loss   | -0.325   |
|    learning_rate   | 0.0003   |
|    n_updates       | 571      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1284     |
|    fps             | 2        |
|    time_elapsed    | 1560     |
|    total_timesteps | 4680     |
| train/             |          |
|    actor_loss      | -284     |
|    critic_loss     | 3.5e+03  |
|    ent_coef        | 1.08     |
|    ent_coef_loss   | -0.308   |
|    learning_rate   | 0.0003   |
|    n_updates       | 572      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1288     |
|    fps             | 2        |
|    time_elapsed    | 1566     |
|    total_timesteps | 4696     |
| train/             |          |
|    actor_loss      | -277     |
|    critic_loss     | 2.47e+03 |
|    ent_coef        | 1.09     |
|    ent_coef_loss   | -0.317   |
|    learning_rate   | 0.0003   |
|    n_updates       | 574      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1292     |
|    fps             | 2        |
|    time_elapsed    | 1569     |
|    total_timesteps | 4704     |
| train/             |          |
|    actor_loss      | -290     |
|    critic_loss     | 3.46e+03 |
|    ent_coef        | 1.09     |
|    ent_coef_loss   | -0.316   |
|    learning_rate   | 0.0003   |
|    n_updates       | 575      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1296     |
|    fps             | 2        |
|    time_elapsed    | 1575     |
|    total_timesteps | 4720     |
| train/             |          |
|    actor_loss      | -289     |
|    critic_loss     | 1.65e+03 |
|    ent_coef        | 1.09     |
|    ent_coef_loss   | -0.318   |
|    learning_rate   | 0.0003   |
|    n_updates       | 577      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1300     |
|    fps             | 2        |
|    time_elapsed    | 1579     |
|    total_timesteps | 4728     |
| train/             |          |
|    actor_loss      | -299     |
|    critic_loss     | 1.68e+03 |
|    ent_coef        | 1.09     |
|    ent_coef_loss   | -0.326   |
|    learning_rate   | 0.0003   |
|    n_updates       | 578      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1304     |
|    fps             | 2        |
|    time_elapsed    | 1585     |
|    total_timesteps | 4744     |
| train/             |          |
|    actor_loss      | -284     |
|    critic_loss     | 2.3e+03  |
|    ent_coef        | 1.09     |
|    ent_coef_loss   | -0.331   |
|    learning_rate   | 0.0003   |
|    n_updates       | 580      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1308     |
|    fps             | 2        |
|    time_elapsed    | 1588     |
|    total_timesteps | 4752     |
| train/             |          |
|    actor_loss      | -302     |
|    critic_loss     | 2.6e+03  |
|    ent_coef        | 1.09     |
|    ent_coef_loss   | -0.344   |
|    learning_rate   | 0.0003   |
|    n_updates       | 581      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1312     |
|    fps             | 2        |
|    time_elapsed    | 1594     |
|    total_timesteps | 4768     |
| train/             |          |
|    actor_loss      | -302     |
|    critic_loss     | 2.44e+03 |
|    ent_coef        | 1.09     |
|    ent_coef_loss   | -0.33    |
|    learning_rate   | 0.0003   |
|    n_updates       | 583      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1316     |
|    fps             | 2        |
|    time_elapsed    | 1598     |
|    total_timesteps | 4776     |
| train/             |          |
|    actor_loss      | -298     |
|    critic_loss     | 2.65e+03 |
|    ent_coef        | 1.09     |
|    ent_coef_loss   | -0.344   |
|    learning_rate   | 0.0003   |
|    n_updates       | 584      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 509      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1320     |
|    fps             | 2        |
|    time_elapsed    | 1604     |
|    total_timesteps | 4792     |
| train/             |          |
|    actor_loss      | -307     |
|    critic_loss     | 2.48e+03 |
|    ent_coef        | 1.09     |
|    ent_coef_loss   | -0.337   |
|    learning_rate   | 0.0003   |
|    n_updates       | 586      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 509      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1324     |
|    fps             | 2        |
|    time_elapsed    | 1607     |
|    total_timesteps | 4800     |
| train/             |          |
|    actor_loss      | -301     |
|    critic_loss     | 2.56e+03 |
|    ent_coef        | 1.09     |
|    ent_coef_loss   | -0.346   |
|    learning_rate   | 0.0003   |
|    n_updates       | 587      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1328     |
|    fps             | 2        |
|    time_elapsed    | 1613     |
|    total_timesteps | 4816     |
| train/             |          |
|    actor_loss      | -293     |
|    critic_loss     | 1.05e+03 |
|    ent_coef        | 1.09     |
|    ent_coef_loss   | -0.348   |
|    learning_rate   | 0.0003   |
|    n_updates       | 589      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1332     |
|    fps             | 2        |
|    time_elapsed    | 1617     |
|    total_timesteps | 4824     |
| train/             |          |
|    actor_loss      | -292     |
|    critic_loss     | 3.2e+03  |
|    ent_coef        | 1.09     |
|    ent_coef_loss   | -0.333   |
|    learning_rate   | 0.0003   |
|    n_updates       | 590      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1336     |
|    fps             | 2        |
|    time_elapsed    | 1623     |
|    total_timesteps | 4840     |
| train/             |          |
|    actor_loss      | -305     |
|    critic_loss     | 3.84e+03 |
|    ent_coef        | 1.09     |
|    ent_coef_loss   | -0.357   |
|    learning_rate   | 0.0003   |
|    n_updates       | 592      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1340     |
|    fps             | 2        |
|    time_elapsed    | 1626     |
|    total_timesteps | 4848     |
| train/             |          |
|    actor_loss      | -290     |
|    critic_loss     | 4.38e+03 |
|    ent_coef        | 1.09     |
|    ent_coef_loss   | -0.335   |
|    learning_rate   | 0.0003   |
|    n_updates       | 593      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1344     |
|    fps             | 2        |
|    time_elapsed    | 1632     |
|    total_timesteps | 4864     |
| train/             |          |
|    actor_loss      | -304     |
|    critic_loss     | 2.72e+03 |
|    ent_coef        | 1.09     |
|    ent_coef_loss   | -0.374   |
|    learning_rate   | 0.0003   |
|    n_updates       | 595      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1348     |
|    fps             | 2        |
|    time_elapsed    | 1636     |
|    total_timesteps | 4872     |
| train/             |          |
|    actor_loss      | -280     |
|    critic_loss     | 1.19e+03 |
|    ent_coef        | 1.1      |
|    ent_coef_loss   | -0.372   |
|    learning_rate   | 0.0003   |
|    n_updates       | 596      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1352     |
|    fps             | 2        |
|    time_elapsed    | 1642     |
|    total_timesteps | 4888     |
| train/             |          |
|    actor_loss      | -305     |
|    critic_loss     | 3.53e+03 |
|    ent_coef        | 1.1      |
|    ent_coef_loss   | -0.392   |
|    learning_rate   | 0.0003   |
|    n_updates       | 598      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1356     |
|    fps             | 2        |
|    time_elapsed    | 1645     |
|    total_timesteps | 4896     |
| train/             |          |
|    actor_loss      | -302     |
|    critic_loss     | 2.49e+03 |
|    ent_coef        | 1.1      |
|    ent_coef_loss   | -0.381   |
|    learning_rate   | 0.0003   |
|    n_updates       | 599      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1360     |
|    fps             | 2        |
|    time_elapsed    | 1651     |
|    total_timesteps | 4912     |
| train/             |          |
|    actor_loss      | -318     |
|    critic_loss     | 2.98e+03 |
|    ent_coef        | 1.1      |
|    ent_coef_loss   | -0.373   |
|    learning_rate   | 0.0003   |
|    n_updates       | 601      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1364     |
|    fps             | 2        |
|    time_elapsed    | 1655     |
|    total_timesteps | 4920     |
| train/             |          |
|    actor_loss      | -306     |
|    critic_loss     | 1.68e+03 |
|    ent_coef        | 1.1      |
|    ent_coef_loss   | -0.385   |
|    learning_rate   | 0.0003   |
|    n_updates       | 602      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1368     |
|    fps             | 2        |
|    time_elapsed    | 1661     |
|    total_timesteps | 4936     |
| train/             |          |
|    actor_loss      | -316     |
|    critic_loss     | 5.61e+03 |
|    ent_coef        | 1.1      |
|    ent_coef_loss   | -0.368   |
|    learning_rate   | 0.0003   |
|    n_updates       | 604      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1372     |
|    fps             | 2        |
|    time_elapsed    | 1664     |
|    total_timesteps | 4944     |
| train/             |          |
|    actor_loss      | -311     |
|    critic_loss     | 1.02e+03 |
|    ent_coef        | 1.1      |
|    ent_coef_loss   | -0.383   |
|    learning_rate   | 0.0003   |
|    n_updates       | 605      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1376     |
|    fps             | 2        |
|    time_elapsed    | 1670     |
|    total_timesteps | 4960     |
| train/             |          |
|    actor_loss      | -299     |
|    critic_loss     | 3.64e+03 |
|    ent_coef        | 1.1      |
|    ent_coef_loss   | -0.405   |
|    learning_rate   | 0.0003   |
|    n_updates       | 607      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1380     |
|    fps             | 2        |
|    time_elapsed    | 1674     |
|    total_timesteps | 4968     |
| train/             |          |
|    actor_loss      | -300     |
|    critic_loss     | 2.69e+03 |
|    ent_coef        | 1.1      |
|    ent_coef_loss   | -0.409   |
|    learning_rate   | 0.0003   |
|    n_updates       | 608      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1384     |
|    fps             | 2        |
|    time_elapsed    | 1680     |
|    total_timesteps | 4984     |
| train/             |          |
|    actor_loss      | -326     |
|    critic_loss     | 1.65e+03 |
|    ent_coef        | 1.1      |
|    ent_coef_loss   | -0.404   |
|    learning_rate   | 0.0003   |
|    n_updates       | 610      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1388     |
|    fps             | 2        |
|    time_elapsed    | 1683     |
|    total_timesteps | 4992     |
| train/             |          |
|    actor_loss      | -298     |
|    critic_loss     | 1e+03    |
|    ent_coef        | 1.1      |
|    ent_coef_loss   | -0.422   |
|    learning_rate   | 0.0003   |
|    n_updates       | 611      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1392     |
|    fps             | 2        |
|    time_elapsed    | 1689     |
|    total_timesteps | 5008     |
| train/             |          |
|    actor_loss      | -314     |
|    critic_loss     | 1.84e+03 |
|    ent_coef        | 1.1      |
|    ent_coef_loss   | -0.41    |
|    learning_rate   | 0.0003   |
|    n_updates       | 613      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1396     |
|    fps             | 2        |
|    time_elapsed    | 1693     |
|    total_timesteps | 5016     |
| train/             |          |
|    actor_loss      | -305     |
|    critic_loss     | 3.37e+03 |
|    ent_coef        | 1.1      |
|    ent_coef_loss   | -0.386   |
|    learning_rate   | 0.0003   |
|    n_updates       | 614      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1400     |
|    fps             | 2        |
|    time_elapsed    | 1699     |
|    total_timesteps | 5032     |
| train/             |          |
|    actor_loss      | -316     |
|    critic_loss     | 3.82e+03 |
|    ent_coef        | 1.1      |
|    ent_coef_loss   | -0.399   |
|    learning_rate   | 0.0003   |
|    n_updates       | 616      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1404     |
|    fps             | 2        |
|    time_elapsed    | 1702     |
|    total_timesteps | 5040     |
| train/             |          |
|    actor_loss      | -298     |
|    critic_loss     | 3.03e+03 |
|    ent_coef        | 1.1      |
|    ent_coef_loss   | -0.386   |
|    learning_rate   | 0.0003   |
|    n_updates       | 617      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1408     |
|    fps             | 2        |
|    time_elapsed    | 1708     |
|    total_timesteps | 5056     |
| train/             |          |
|    actor_loss      | -309     |
|    critic_loss     | 1.72e+03 |
|    ent_coef        | 1.11     |
|    ent_coef_loss   | -0.393   |
|    learning_rate   | 0.0003   |
|    n_updates       | 619      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1412     |
|    fps             | 2        |
|    time_elapsed    | 1712     |
|    total_timesteps | 5064     |
| train/             |          |
|    actor_loss      | -306     |
|    critic_loss     | 4.96e+03 |
|    ent_coef        | 1.11     |
|    ent_coef_loss   | -0.416   |
|    learning_rate   | 0.0003   |
|    n_updates       | 620      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1416     |
|    fps             | 2        |
|    time_elapsed    | 1718     |
|    total_timesteps | 5080     |
| train/             |          |
|    actor_loss      | -323     |
|    critic_loss     | 1.89e+03 |
|    ent_coef        | 1.11     |
|    ent_coef_loss   | -0.452   |
|    learning_rate   | 0.0003   |
|    n_updates       | 622      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1420     |
|    fps             | 2        |
|    time_elapsed    | 1721     |
|    total_timesteps | 5088     |
| train/             |          |
|    actor_loss      | -306     |
|    critic_loss     | 830      |
|    ent_coef        | 1.11     |
|    ent_coef_loss   | -0.459   |
|    learning_rate   | 0.0003   |
|    n_updates       | 623      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1424     |
|    fps             | 2        |
|    time_elapsed    | 1727     |
|    total_timesteps | 5104     |
| train/             |          |
|    actor_loss      | -315     |
|    critic_loss     | 983      |
|    ent_coef        | 1.11     |
|    ent_coef_loss   | -0.436   |
|    learning_rate   | 0.0003   |
|    n_updates       | 625      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1428     |
|    fps             | 2        |
|    time_elapsed    | 1731     |
|    total_timesteps | 5112     |
| train/             |          |
|    actor_loss      | -314     |
|    critic_loss     | 1.26e+03 |
|    ent_coef        | 1.11     |
|    ent_coef_loss   | -0.417   |
|    learning_rate   | 0.0003   |
|    n_updates       | 626      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1432     |
|    fps             | 2        |
|    time_elapsed    | 1736     |
|    total_timesteps | 5128     |
| train/             |          |
|    actor_loss      | -319     |
|    critic_loss     | 1.36e+03 |
|    ent_coef        | 1.11     |
|    ent_coef_loss   | -0.436   |
|    learning_rate   | 0.0003   |
|    n_updates       | 628      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1436     |
|    fps             | 2        |
|    time_elapsed    | 1740     |
|    total_timesteps | 5136     |
| train/             |          |
|    actor_loss      | -323     |
|    critic_loss     | 2.8e+03  |
|    ent_coef        | 1.11     |
|    ent_coef_loss   | -0.431   |
|    learning_rate   | 0.0003   |
|    n_updates       | 629      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 509      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1440     |
|    fps             | 2        |
|    time_elapsed    | 1746     |
|    total_timesteps | 5152     |
| train/             |          |
|    actor_loss      | -315     |
|    critic_loss     | 2.26e+03 |
|    ent_coef        | 1.11     |
|    ent_coef_loss   | -0.451   |
|    learning_rate   | 0.0003   |
|    n_updates       | 631      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1444     |
|    fps             | 2        |
|    time_elapsed    | 1752     |
|    total_timesteps | 5160     |
| train/             |          |
|    actor_loss      | -323     |
|    critic_loss     | 2.09e+03 |
|    ent_coef        | 1.11     |
|    ent_coef_loss   | -0.428   |
|    learning_rate   | 0.0003   |
|    n_updates       | 632      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1448     |
|    fps             | 2        |
|    time_elapsed    | 1761     |
|    total_timesteps | 5176     |
| train/             |          |
|    actor_loss      | -320     |
|    critic_loss     | 1.8e+03  |
|    ent_coef        | 1.11     |
|    ent_coef_loss   | -0.456   |
|    learning_rate   | 0.0003   |
|    n_updates       | 634      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1452     |
|    fps             | 2        |
|    time_elapsed    | 1767     |
|    total_timesteps | 5184     |
| train/             |          |
|    actor_loss      | -320     |
|    critic_loss     | 2.14e+03 |
|    ent_coef        | 1.11     |
|    ent_coef_loss   | -0.455   |
|    learning_rate   | 0.0003   |
|    n_updates       | 635      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1456     |
|    fps             | 2        |
|    time_elapsed    | 1777     |
|    total_timesteps | 5200     |
| train/             |          |
|    actor_loss      | -328     |
|    critic_loss     | 5.26e+03 |
|    ent_coef        | 1.11     |
|    ent_coef_loss   | -0.453   |
|    learning_rate   | 0.0003   |
|    n_updates       | 637      |
---------------------------------


---------------------------------
| rollout/           |          |
|    ep_len_mean     | 3        |
|    ep_rew_mean     | 510      |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 1460     |
|    fps             | 2        |
|    time_elapsed    | 1780     |
|    total_timesteps | 5208     |
| train/             |          |
|    actor_loss      | -321     |
|    critic_loss     | 1.94e+03 |
|    ent_coef        | 1.11     |
|    ent_coef_loss   | -0.467   |
|    learning_rate   | 0.0003   |
|    n_updates       | 638      |
---------------------------------


In [None]:
import gymnasium as gym
import torch as th
from twsbr_env.envs import TwsbrEnv  # Import environment
from stable_baselines3 import SAC
from stable_baselines3.common.evaluation import evaluate_policy
import os

# Build the environment with the specific settings used for this run
env = gym.make("TwsbrEnv-v0", render_mode=None, action_type="continuous")

# Location of the best checkpoint saved by an earlier run
best_model_path = "./logs/best_model.zip"

# Start from a fresh model when no checkpoint exists; otherwise resume from it
if not os.path.exists(best_model_path):
    print("No existing best model found, initializing a new model.")
    model = SAC(
        "MlpPolicy",
        env,
        policy_kwargs={"net_arch": {"pi": [256, 256], "qf": [256, 256]}},
        use_sde=True,
        ent_coef="auto_0.1",
        verbose=1,
    )
else:
    print(f"Loading best model from {best_model_path}")
    model = SAC.load(best_model_path, env=env)

# Continue training for an additional budget of timesteps (adjust as needed)
total_timesteps_learning = 500_000
model.learn(total_timesteps=total_timesteps_learning)

# Persist the model once the additional training has finished
model.save("twsbr_sac_continued")
print("Training continuation finished")

# Evaluate the model that was just trained, on the environment it holds
n_eval_episodes = 10
render = False  # set to True to watch the evaluation episodes
mean_reward, std_reward = evaluate_policy(
    model,
    model.get_env(),
    n_eval_episodes=n_eval_episodes,
    render=render,
)

# Report the evaluation result
print(f"Mean Reward over {n_eval_episodes} episodes: {mean_reward:.2f} +/- {std_reward:.2f}")

env.close()  # release the environment
del model  # drop the model reference as cleanup


Loading best model from ./logs/best_model.zip
Wrapping the env with a `Monitor` wrapper
Wrapping the env in a DummyVecEnv.
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 8.5      |
|    ep_rew_mean     | -102     |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 4        |
|    fps             | 7        |
|    time_elapsed    | 4        |
|    total_timesteps | 34       |
| train/             |          |
|    std             | 0.0622   |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 7.25     |
|    ep_rew_mean     | -103     |
|    success_rate    | 0        |
| time/              |          |
|    episodes        | 8        |
|    fps             | 7        |
|    time_elapsed    | 8        |
|    total_timesteps | 58       |
| train/             |          |
|    std             | 0.0622   |
---------------------------

In [None]:
import numpy as np
import matplotlib.pyplot as plt
import gymnasium as gym
from twsbr_env.envs import TwsbrEnv  # Import environment
from stable_baselines3 import SAC

# Re-create the environment (rendered on screen) and load the saved model
env = gym.make("TwsbrEnv-v0", render_mode="human", action_type="continuous")
model = SAC.load("twsbr_sac")

# Per-step history recorded during the rollout
obs_values, action_values = [], []

# Episode-end flags; each env.step() call in the rollout overwrites them
terminated = truncated = False

# Initial observation of the first episode
obs, info = env.reset()

def plot_results(obs_values, action_values):
    """Plot every recorded observation and action component over time.

    Args:
        obs_values: Sequence of per-step observations. Each entry may be a
            scalar or an array-like; all entries must share the same shape.
        action_values: Sequence of per-step actions, same convention.

    The number of plotted lines is derived from the data instead of being
    hard-coded, so the function works for any observation/action size and
    draws empty (but labelled) panels when nothing was recorded.
    """

    def _plot_panel(position, values, label, ylabel):
        """Draw one panel containing a line per component of ``values``."""
        # Select the panel once instead of once per plotted component.
        # The 3-row grid of the original layout is kept on purpose.
        plt.subplot(3, 1, position)

        series = np.asarray(values)
        has_data = series.size > 0
        if has_data:
            # One row per time step, one column per component
            series = series.reshape(len(series), -1)
            for i in range(series.shape[1]):
                plt.plot(series[:, i], label=f'{label}[{i}]')

        plt.xlabel("Time Step")
        plt.ylabel(ylabel)
        if has_data:
            # legend() without any labelled line only emits a warning
            plt.legend()
        plt.grid()

    plt.figure(figsize=(12, 8))

    # Observations in the first panel, actions in the second
    _plot_panel(1, obs_values, "Observation", "Observation Value")
    _plot_panel(2, action_values, "Action", "Action Value")

    plt.tight_layout()
    plt.show()

try:
    for _ in range(10000):  # number of evaluation steps
        action, _states = model.predict(obs, deterministic=True)
        # Record the observation the action was computed from, and the action
        obs_values.append(obs)
        action_values.append(action)
        obs, reward, terminated, truncated, info = env.step(action)

        # An episode ends on termination OR truncation (e.g. a time limit);
        # in either case the environment must be reset before stepping again.
        if terminated or truncated:
            obs, info = env.reset()

    # Show the plots
    plot_results(obs_values, action_values)
finally:
    # Close the environment even if the rollout or the plotting raised
    env.close()
