# Environment Setup

In [1]:
#!pip install gym gym-retro opencv-python
#!pip install mss
#!pip install pydirectinput

In [2]:
# For file path management
import os

# For monitoring agent
from stable_baselines3.common.monitor import Monitor
# To vectorize and frame stack
from stable_baselines3.common.vec_env import DummyVecEnv, VecFrameStack

In [3]:
# Execute tools\Environment.py inside this notebook's namespace (%run).
# The custom Flappy_Bird environment class instantiated further down is
# expected to be defined by that script -- verify if the file is renamed.
%run tools\Environment.py

In [4]:
# Directory handed to both the Monitor wrapper (episode statistics) and the
# DQN constructor's `tensorboard_log` argument.
LOG_DIR = './logs/'

In [5]:
# Build the training environment: raw game -> Monitor -> vectorized -> frame-stacked.

# Create the log directory up front. stable-baselines3's Monitor only treats
# its `filename` argument as a directory when that directory already exists;
# otherwise the path is used as a file-name prefix, so the monitor file would
# end up in a different place on a fresh checkout than on later runs.
os.makedirs(LOG_DIR, exist_ok=True)

# Keep the monitored env under its own name so the factory lambda below closes
# over a variable that is never rebound (the original `lambda: env` referred to
# the very name being reassigned by the same statement).
monitored_env = Monitor(Flappy_Bird(), LOG_DIR)

# DummyVecEnv expects a list of zero-argument factories, one per sub-environment.
env = DummyVecEnv([lambda: monitored_env])
# Stack the 4 most recent observations along the last (channel) axis.
env = VecFrameStack(env, 4, channels_order='last')

# Setup Callback To Monitor Training Process

In [6]:
#!pip install stable-baselines3[extra]

In [7]:
# Import os for file path management
import os 
# Import Base Callback for saving models
from stable_baselines3.common.callbacks import BaseCallback

In [8]:
class TrainAndLoggingCallback(BaseCallback):
    """Callback that periodically saves the model being trained.

    Every time the callback's call counter (``self.n_calls``) is a multiple of
    ``check_freq``, the current model is written to
    ``<save_path>/best_model_<n_calls>``. Despite the file name, no evaluation
    is performed: each file is simply a snapshot at that step.

    Args:
        check_freq: Number of callback calls between two consecutive saves.
        save_path: Directory that receives the snapshots. ``None`` disables
            saving entirely.
        verbose: Verbosity level forwarded to ``BaseCallback``.
    """

    def __init__(self, check_freq, save_path, verbose=1):
        super().__init__(verbose)
        self.check_freq = check_freq
        self.save_path = save_path

    def _init_callback(self):
        """Create the snapshot directory (if one was configured)."""
        if self.save_path is not None:
            os.makedirs(self.save_path, exist_ok=True)

    def _on_step(self):
        """Save a snapshot when due.

        Returns:
            Always ``True``, so this callback never requests that training stop.
        """
        # Mirror the None-check of _init_callback: without it a callback built
        # with save_path=None would crash inside os.path.join at the first save.
        if self.save_path is not None and self.n_calls % self.check_freq == 0:
            model_path = os.path.join(self.save_path, f'best_model_{self.n_calls}')
            self.model.save(model_path)

        return True

In [9]:
# Directory passed to the training callback as `save_path`, i.e. where the
# periodic model snapshots are written.
CHECKPOINT_DIR = './train/'

In [10]:
# Snapshot the model into CHECKPOINT_DIR each time the callback's call counter
# reaches a multiple of 40,000.
callback = TrainAndLoggingCallback(check_freq=40_000, save_path=CHECKPOINT_DIR)

# Training Model

In [11]:
# Model
from stable_baselines3 import DQN

In [12]:
# DQN hyperparameters, forwarded as keyword arguments to the DQN constructor.
# NOTE(review): the training log saved in this notebook reports
# learning_rate 0.0006 and an exploration_rate starting near 0.1, which do not
# match the values below -- the log looks like it came from an earlier
# configuration; confirm before comparing runs.
parameters = dict(
    buffer_size=10_000,              # capacity of the replay buffer
    learning_starts=1000,            # steps collected before gradient updates begin
    learning_rate=0.00006,
    batch_size=16,                   # minibatch size per gradient update
    target_update_interval=500,      # steps between target-network updates
    exploration_fraction=0.99,       # share of training over which epsilon is annealed
    exploration_initial_eps=0.04,    # starting epsilon
    exploration_final_eps=0.0001,    # epsilon once annealing has finished
)

In [13]:
# Build a DQN agent using the 'CnnPolicy' network on the frame-stacked env.
# TensorBoard event files go under LOG_DIR; the remaining hyperparameters are
# unpacked from the `parameters` dict.
model = DQN('CnnPolicy', env, tensorboard_log=LOG_DIR, verbose=1, **parameters)

Using cpu device


In [14]:
# Warm start: load the weights of the previously trained "Easy" model into the
# freshly built agent. The path is derived from CHECKPOINT_DIR instead of a
# second hard-coded "train/" prefix so the two cannot drift apart.
model.set_parameters(os.path.join(CHECKPOINT_DIR, "FlappyBird_DQN_Easy"))
# Restore that model's saved replay buffer as well, so training resumes with
# its previously collected transitions.
model.load_replay_buffer(os.path.join(CHECKPOINT_DIR, "buffer_FlappyBird_DQN_Easy"))

In [15]:
# Train for 80,000 timesteps. `callback` is invoked during training and takes
# care of writing the periodic model snapshots.
model.learn(total_timesteps=80_000, callback=callback)

Logging to ./logs/DQN_12
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.75     |
|    ep_rew_mean      | 9.75     |
|    exploration_rate | 0.1      |
| time/               |          |
|    episodes         | 4        |
|    fps              | 1        |
|    time_elapsed     | 29       |
|    total_timesteps  | 39       |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 13.5     |
|    ep_rew_mean      | 13.5     |
|    exploration_rate | 0.0999   |
| time/               |          |
|    episodes         | 8        |
|    fps              | 1        |
|    time_elapsed     | 61       |
|    total_timesteps  | 108      |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 11.7     |
|    ep_rew_mean      | 11.7     |
|    exploration_rate | 0.0999   |
| time/               |       

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 11.6     |
|    ep_rew_mean      | 11.6     |
|    exploration_rate | 0.0994   |
| time/               |          |
|    episodes         | 92       |
|    fps              | 1        |
|    time_elapsed     | 558      |
|    total_timesteps  | 1063     |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 4.23     |
|    n_updates        | 15       |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 11.7     |
|    ep_rew_mean      | 11.7     |
|    exploration_rate | 0.0993   |
| time/               |          |
|    episodes         | 96       |
|    fps              | 1        |
|    time_elapsed     | 587      |
|    total_timesteps  | 1123     |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.319    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 14.2     |
|    ep_rew_mean      | 14.2     |
|    exploration_rate | 0.0988   |
| time/               |          |
|    episodes         | 156      |
|    fps              | 2        |
|    time_elapsed     | 996      |
|    total_timesteps  | 2000     |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 17.2     |
|    n_updates        | 249      |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 14.2     |
|    ep_rew_mean      | 14.2     |
|    exploration_rate | 0.0988   |
| time/               |          |
|    episodes         | 160      |
|    fps              | 2        |
|    time_elapsed     | 1023     |
|    total_timesteps  | 2058     |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 7.22     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 13.2     |
|    ep_rew_mean      | 13.2     |
|    exploration_rate | 0.0984   |
| time/               |          |
|    episodes         | 220      |
|    fps              | 1        |
|    time_elapsed     | 1392     |
|    total_timesteps  | 2767     |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.772    |
|    n_updates        | 441      |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 13.3     |
|    ep_rew_mean      | 13.3     |
|    exploration_rate | 0.0983   |
| time/               |          |
|    episodes         | 224      |
|    fps              | 1        |
|    time_elapsed     | 1420     |
|    total_timesteps  | 2828     |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 4.98     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 13       |
|    ep_rew_mean      | 13       |
|    exploration_rate | 0.0978   |
| time/               |          |
|    episodes         | 284      |
|    fps              | 2        |
|    time_elapsed     | 1820     |
|    total_timesteps  | 3648     |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 2.13     |
|    n_updates        | 661      |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 13.1     |
|    ep_rew_mean      | 13.1     |
|    exploration_rate | 0.0978   |
| time/               |          |
|    episodes         | 288      |
|    fps              | 2        |
|    time_elapsed     | 1848     |
|    total_timesteps  | 3705     |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 4.15     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 14.8     |
|    ep_rew_mean      | 14.8     |
|    exploration_rate | 0.0972   |
| time/               |          |
|    episodes         | 348      |
|    fps              | 2        |
|    time_elapsed     | 2296     |
|    total_timesteps  | 4666     |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 4.38     |
|    n_updates        | 916      |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 14.8     |
|    ep_rew_mean      | 14.8     |
|    exploration_rate | 0.0972   |
| time/               |          |
|    episodes         | 352      |
|    fps              | 2        |
|    time_elapsed     | 2325     |
|    total_timesteps  | 4729     |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 3.47     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 16.6     |
|    ep_rew_mean      | 16.6     |
|    exploration_rate | 0.0966   |
| time/               |          |
|    episodes         | 412      |
|    fps              | 2        |
|    time_elapsed     | 2772     |
|    total_timesteps  | 5707     |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 8.77     |
|    n_updates        | 1176     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 16.6     |
|    ep_rew_mean      | 16.6     |
|    exploration_rate | 0.0966   |
| time/               |          |
|    episodes         | 416      |
|    fps              | 2        |
|    time_elapsed     | 2801     |
|    total_timesteps  | 5771     |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 1.65     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 16.4     |
|    ep_rew_mean      | 16.4     |
|    exploration_rate | 0.096    |
| time/               |          |
|    episodes         | 476      |
|    fps              | 2        |
|    time_elapsed     | 3256     |
|    total_timesteps  | 6756     |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 8.12     |
|    n_updates        | 1438     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 16.6     |
|    ep_rew_mean      | 16.6     |
|    exploration_rate | 0.096    |
| time/               |          |
|    episodes         | 480      |
|    fps              | 2        |
|    time_elapsed     | 3283     |
|    total_timesteps  | 6815     |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 2.16     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 15.1     |
|    ep_rew_mean      | 15.1     |
|    exploration_rate | 0.0954   |
| time/               |          |
|    episodes         | 540      |
|    fps              | 2        |
|    time_elapsed     | 3731     |
|    total_timesteps  | 7787     |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 1.17     |
|    n_updates        | 1696     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 15.6     |
|    ep_rew_mean      | 15.6     |
|    exploration_rate | 0.0953   |
| time/               |          |
|    episodes         | 544      |
|    fps              | 2        |
|    time_elapsed     | 3757     |
|    total_timesteps  | 7842     |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 1.88     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 16.1     |
|    ep_rew_mean      | 16.1     |
|    exploration_rate | 0.0948   |
| time/               |          |
|    episodes         | 604      |
|    fps              | 2        |
|    time_elapsed     | 4205     |
|    total_timesteps  | 8808     |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 1.71     |
|    n_updates        | 1951     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 15.8     |
|    ep_rew_mean      | 15.8     |
|    exploration_rate | 0.0947   |
| time/               |          |
|    episodes         | 608      |
|    fps              | 2        |
|    time_elapsed     | 4232     |
|    total_timesteps  | 8864     |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 1.48     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 17       |
|    ep_rew_mean      | 17       |
|    exploration_rate | 0.0941   |
| time/               |          |
|    episodes         | 668      |
|    fps              | 2        |
|    time_elapsed     | 4718     |
|    total_timesteps  | 9947     |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 5.72     |
|    n_updates        | 2236     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 16.9     |
|    ep_rew_mean      | 16.9     |
|    exploration_rate | 0.0941   |
| time/               |          |
|    episodes         | 672      |
|    fps              | 2        |
|    time_elapsed     | 4748     |
|    total_timesteps  | 10006    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 3.95     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 18.7     |
|    ep_rew_mean      | 18.7     |
|    exploration_rate | 0.0934   |
| time/               |          |
|    episodes         | 732      |
|    fps              | 2        |
|    time_elapsed     | 5259     |
|    total_timesteps  | 11175    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.538    |
|    n_updates        | 2543     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 18.8     |
|    ep_rew_mean      | 18.8     |
|    exploration_rate | 0.0933   |
| time/               |          |
|    episodes         | 736      |
|    fps              | 2        |
|    time_elapsed     | 5293     |
|    total_timesteps  | 11253    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.926    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 19.3     |
|    ep_rew_mean      | 19.3     |
|    exploration_rate | 0.0926   |
| time/               |          |
|    episodes         | 796      |
|    fps              | 2        |
|    time_elapsed     | 5797     |
|    total_timesteps  | 12418    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 3.5      |
|    n_updates        | 2854     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 19.8     |
|    ep_rew_mean      | 19.8     |
|    exploration_rate | 0.0926   |
| time/               |          |
|    episodes         | 800      |
|    fps              | 2        |
|    time_elapsed     | 5832     |
|    total_timesteps  | 12502    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.953    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 20.3     |
|    ep_rew_mean      | 20.3     |
|    exploration_rate | 0.0919   |
| time/               |          |
|    episodes         | 860      |
|    fps              | 2        |
|    time_elapsed     | 6338     |
|    total_timesteps  | 13681    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 4.32     |
|    n_updates        | 3170     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 20.6     |
|    ep_rew_mean      | 20.6     |
|    exploration_rate | 0.0918   |
| time/               |          |
|    episodes         | 864      |
|    fps              | 2        |
|    time_elapsed     | 6367     |
|    total_timesteps  | 13743    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 4.39     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 19.5     |
|    ep_rew_mean      | 19.5     |
|    exploration_rate | 0.0911   |
| time/               |          |
|    episodes         | 924      |
|    fps              | 2        |
|    time_elapsed     | 6889     |
|    total_timesteps  | 14955    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 1.08     |
|    n_updates        | 3488     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 19.5     |
|    ep_rew_mean      | 19.5     |
|    exploration_rate | 0.0911   |
| time/               |          |
|    episodes         | 928      |
|    fps              | 2        |
|    time_elapsed     | 6914     |
|    total_timesteps  | 15005    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 5.31     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 19.8     |
|    ep_rew_mean      | 19.8     |
|    exploration_rate | 0.0904   |
| time/               |          |
|    episodes         | 988      |
|    fps              | 2        |
|    time_elapsed     | 7452     |
|    total_timesteps  | 16254    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 2.74     |
|    n_updates        | 3813     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 19.3     |
|    ep_rew_mean      | 19.3     |
|    exploration_rate | 0.0903   |
| time/               |          |
|    episodes         | 992      |
|    fps              | 2        |
|    time_elapsed     | 7473     |
|    total_timesteps  | 16289    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 3.35     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 20.9     |
|    ep_rew_mean      | 20.9     |
|    exploration_rate | 0.0896   |
| time/               |          |
|    episodes         | 1052     |
|    fps              | 2        |
|    time_elapsed     | 8022     |
|    total_timesteps  | 17570    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 1.82     |
|    n_updates        | 4142     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 20.9     |
|    ep_rew_mean      | 20.9     |
|    exploration_rate | 0.0895   |
| time/               |          |
|    episodes         | 1056     |
|    fps              | 2        |
|    time_elapsed     | 8055     |
|    total_timesteps  | 17645    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 4.1      |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 21.9     |
|    ep_rew_mean      | 21.9     |
|    exploration_rate | 0.0887   |
| time/               |          |
|    episodes         | 1116     |
|    fps              | 2        |
|    time_elapsed     | 8628     |
|    total_timesteps  | 19004    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 2.78     |
|    n_updates        | 4500     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 21.4     |
|    ep_rew_mean      | 21.4     |
|    exploration_rate | 0.0887   |
| time/               |          |
|    episodes         | 1120     |
|    fps              | 2        |
|    time_elapsed     | 8661     |
|    total_timesteps  | 19070    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 2.08     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 19.4     |
|    ep_rew_mean      | 19.4     |
|    exploration_rate | 0.0881   |
| time/               |          |
|    episodes         | 1180     |
|    fps              | 2        |
|    time_elapsed     | 9133     |
|    total_timesteps  | 20101    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 3.57     |
|    n_updates        | 4775     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 19.3     |
|    ep_rew_mean      | 19.3     |
|    exploration_rate | 0.088    |
| time/               |          |
|    episodes         | 1184     |
|    fps              | 2        |
|    time_elapsed     | 9166     |
|    total_timesteps  | 20173    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 1.37     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 19.4     |
|    ep_rew_mean      | 19.4     |
|    exploration_rate | 0.0873   |
| time/               |          |
|    episodes         | 1244     |
|    fps              | 2        |
|    time_elapsed     | 9698     |
|    total_timesteps  | 21429    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.712    |
|    n_updates        | 5107     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 19.7     |
|    ep_rew_mean      | 19.7     |
|    exploration_rate | 0.0872   |
| time/               |          |
|    episodes         | 1248     |
|    fps              | 2        |
|    time_elapsed     | 9730     |
|    total_timesteps  | 21505    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 1.94     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 19.6     |
|    ep_rew_mean      | 19.6     |
|    exploration_rate | 0.0866   |
| time/               |          |
|    episodes         | 1308     |
|    fps              | 2        |
|    time_elapsed     | 10236    |
|    total_timesteps  | 22657    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.683    |
|    n_updates        | 5414     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 20       |
|    ep_rew_mean      | 20       |
|    exploration_rate | 0.0865   |
| time/               |          |
|    episodes         | 1312     |
|    fps              | 2        |
|    time_elapsed     | 10275    |
|    total_timesteps  | 22750    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.455    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 21.8     |
|    ep_rew_mean      | 21.8     |
|    exploration_rate | 0.0856   |
| time/               |          |
|    episodes         | 1372     |
|    fps              | 2        |
|    time_elapsed     | 10872    |
|    total_timesteps  | 24206    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.263    |
|    n_updates        | 5801     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 22.1     |
|    ep_rew_mean      | 22.1     |
|    exploration_rate | 0.0856   |
| time/               |          |
|    episodes         | 1376     |
|    fps              | 2        |
|    time_elapsed     | 10915    |
|    total_timesteps  | 24314    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 2.13     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 21.6     |
|    ep_rew_mean      | 21.6     |
|    exploration_rate | 0.0849   |
| time/               |          |
|    episodes         | 1436     |
|    fps              | 2        |
|    time_elapsed     | 11435    |
|    total_timesteps  | 25518    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 3.63     |
|    n_updates        | 6129     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 21.2     |
|    ep_rew_mean      | 21.2     |
|    exploration_rate | 0.0848   |
| time/               |          |
|    episodes         | 1440     |
|    fps              | 2        |
|    time_elapsed     | 11465    |
|    total_timesteps  | 25585    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 2.58     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 21.2     |
|    ep_rew_mean      | 21.2     |
|    exploration_rate | 0.084    |
| time/               |          |
|    episodes         | 1500     |
|    fps              | 2        |
|    time_elapsed     | 12041    |
|    total_timesteps  | 26972    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 2.36     |
|    n_updates        | 6492     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 21.2     |
|    ep_rew_mean      | 21.2     |
|    exploration_rate | 0.084    |
| time/               |          |
|    episodes         | 1504     |
|    fps              | 2        |
|    time_elapsed     | 12067    |
|    total_timesteps  | 27021    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 2.45     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 22.2     |
|    ep_rew_mean      | 22.2     |
|    exploration_rate | 0.0832   |
| time/               |          |
|    episodes         | 1564     |
|    fps              | 2        |
|    time_elapsed     | 12638    |
|    total_timesteps  | 28384    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 5.86     |
|    n_updates        | 6845     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 21.8     |
|    ep_rew_mean      | 21.8     |
|    exploration_rate | 0.0831   |
| time/               |          |
|    episodes         | 1568     |
|    fps              | 2        |
|    time_elapsed     | 12668    |
|    total_timesteps  | 28450    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 2.27     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 20.8     |
|    ep_rew_mean      | 20.8     |
|    exploration_rate | 0.0824   |
| time/               |          |
|    episodes         | 1628     |
|    fps              | 2        |
|    time_elapsed     | 13185    |
|    total_timesteps  | 29635    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 1.83     |
|    n_updates        | 7158     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 20.8     |
|    ep_rew_mean      | 20.8     |
|    exploration_rate | 0.0824   |
| time/               |          |
|    episodes         | 1632     |
|    fps              | 2        |
|    time_elapsed     | 13218    |
|    total_timesteps  | 29713    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.706    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 19       |
|    ep_rew_mean      | 19       |
|    exploration_rate | 0.0817   |
| time/               |          |
|    episodes         | 1692     |
|    fps              | 2        |
|    time_elapsed     | 13737    |
|    total_timesteps  | 30892    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 5.95     |
|    n_updates        | 7472     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 19       |
|    ep_rew_mean      | 19       |
|    exploration_rate | 0.0816   |
| time/               |          |
|    episodes         | 1696     |
|    fps              | 2        |
|    time_elapsed     | 13768    |
|    total_timesteps  | 30964    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.796    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 19.9     |
|    ep_rew_mean      | 19.9     |
|    exploration_rate | 0.0809   |
| time/               |          |
|    episodes         | 1756     |
|    fps              | 2        |
|    time_elapsed     | 14288    |
|    total_timesteps  | 32170    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.422    |
|    n_updates        | 7792     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 20.3     |
|    ep_rew_mean      | 20.3     |
|    exploration_rate | 0.0809   |
| time/               |          |
|    episodes         | 1760     |
|    fps              | 2        |
|    time_elapsed     | 14325    |
|    total_timesteps  | 32258    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 2.71     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 20.4     |
|    ep_rew_mean      | 20.4     |
|    exploration_rate | 0.0801   |
| time/               |          |
|    episodes         | 1820     |
|    fps              | 2        |
|    time_elapsed     | 14867    |
|    total_timesteps  | 33525    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 1.7      |
|    n_updates        | 8131     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 20.8     |
|    ep_rew_mean      | 20.8     |
|    exploration_rate | 0.08     |
| time/               |          |
|    episodes         | 1824     |
|    fps              | 2        |
|    time_elapsed     | 14912    |
|    total_timesteps  | 33639    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 1.03     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 23.1     |
|    ep_rew_mean      | 23.1     |
|    exploration_rate | 0.0792   |
| time/               |          |
|    episodes         | 1884     |
|    fps              | 2        |
|    time_elapsed     | 15504    |
|    total_timesteps  | 35071    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 4.08     |
|    n_updates        | 8517     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 23       |
|    ep_rew_mean      | 23       |
|    exploration_rate | 0.0791   |
| time/               |          |
|    episodes         | 1888     |
|    fps              | 2        |
|    time_elapsed     | 15539    |
|    total_timesteps  | 35155    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 1.9      |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 22.7     |
|    ep_rew_mean      | 22.7     |
|    exploration_rate | 0.0783   |
| time/               |          |
|    episodes         | 1948     |
|    fps              | 2        |
|    time_elapsed     | 16104    |
|    total_timesteps  | 36499    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 2.94     |
|    n_updates        | 8874     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 22.5     |
|    ep_rew_mean      | 22.5     |
|    exploration_rate | 0.0783   |
| time/               |          |
|    episodes         | 1952     |
|    fps              | 2        |
|    time_elapsed     | 16138    |
|    total_timesteps  | 36581    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.83     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 22.5     |
|    ep_rew_mean      | 22.5     |
|    exploration_rate | 0.0775   |
| time/               |          |
|    episodes         | 2012     |
|    fps              | 2        |
|    time_elapsed     | 16702    |
|    total_timesteps  | 37940    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 2.48     |
|    n_updates        | 9234     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 22.4     |
|    ep_rew_mean      | 22.4     |
|    exploration_rate | 0.0774   |
| time/               |          |
|    episodes         | 2016     |
|    fps              | 2        |
|    time_elapsed     | 16742    |
|    total_timesteps  | 38036    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 3.3      |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 22.4     |
|    ep_rew_mean      | 22.4     |
|    exploration_rate | 0.0766   |
| time/               |          |
|    episodes         | 2076     |
|    fps              | 2        |
|    time_elapsed     | 17294    |
|    total_timesteps  | 39355    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 3.97     |
|    n_updates        | 9588     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 22.6     |
|    ep_rew_mean      | 22.6     |
|    exploration_rate | 0.0766   |
| time/               |          |
|    episodes         | 2080     |
|    fps              | 2        |
|    time_elapsed     | 17335    |
|    total_timesteps  | 39456    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 3.04     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 24.8     |
|    ep_rew_mean      | 24.8     |
|    exploration_rate | 0.0757   |
| time/               |          |
|    episodes         | 2140     |
|    fps              | 2        |
|    time_elapsed     | 17966    |
|    total_timesteps  | 41009    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 2.39     |
|    n_updates        | 10002    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 25.5     |
|    ep_rew_mean      | 25.5     |
|    exploration_rate | 0.0756   |
| time/               |          |
|    episodes         | 2144     |
|    fps              | 2        |
|    time_elapsed     | 18011    |
|    total_timesteps  | 41125    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 5.88     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 22.6     |
|    ep_rew_mean      | 22.6     |
|    exploration_rate | 0.0749   |
| time/               |          |
|    episodes         | 2204     |
|    fps              | 2        |
|    time_elapsed     | 18508    |
|    total_timesteps  | 42263    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.752    |
|    n_updates        | 10315    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 21.3     |
|    ep_rew_mean      | 21.3     |
|    exploration_rate | 0.0749   |
| time/               |          |
|    episodes         | 2208     |
|    fps              | 2        |
|    time_elapsed     | 18525    |
|    total_timesteps  | 42288    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 5.15     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 19.9     |
|    ep_rew_mean      | 19.9     |
|    exploration_rate | 0.0742   |
| time/               |          |
|    episodes         | 2268     |
|    fps              | 2        |
|    time_elapsed     | 19058    |
|    total_timesteps  | 43541    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 5.4      |
|    n_updates        | 10635    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 19.7     |
|    ep_rew_mean      | 19.7     |
|    exploration_rate | 0.0741   |
| time/               |          |
|    episodes         | 2272     |
|    fps              | 2        |
|    time_elapsed     | 19088    |
|    total_timesteps  | 43606    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 2.89     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 22       |
|    ep_rew_mean      | 22       |
|    exploration_rate | 0.0733   |
| time/               |          |
|    episodes         | 2332     |
|    fps              | 2        |
|    time_elapsed     | 19666    |
|    total_timesteps  | 44997    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 3.87     |
|    n_updates        | 10999    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 21.5     |
|    ep_rew_mean      | 21.5     |
|    exploration_rate | 0.0733   |
| time/               |          |
|    episodes         | 2336     |
|    fps              | 2        |
|    time_elapsed     | 19692    |
|    total_timesteps  | 45050    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 3.92     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 21.3     |
|    ep_rew_mean      | 21.3     |
|    exploration_rate | 0.0725   |
| time/               |          |
|    episodes         | 2396     |
|    fps              | 2        |
|    time_elapsed     | 20240    |
|    total_timesteps  | 46360    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 1.96     |
|    n_updates        | 11339    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 21.1     |
|    ep_rew_mean      | 21.1     |
|    exploration_rate | 0.0724   |
| time/               |          |
|    episodes         | 2400     |
|    fps              | 2        |
|    time_elapsed     | 20272    |
|    total_timesteps  | 46434    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 3.92     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 23.1     |
|    ep_rew_mean      | 23.1     |
|    exploration_rate | 0.0716   |
| time/               |          |
|    episodes         | 2460     |
|    fps              | 2        |
|    time_elapsed     | 20853    |
|    total_timesteps  | 47841    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.351    |
|    n_updates        | 11710    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 22.9     |
|    ep_rew_mean      | 22.9     |
|    exploration_rate | 0.0716   |
| time/               |          |
|    episodes         | 2464     |
|    fps              | 2        |
|    time_elapsed     | 20885    |
|    total_timesteps  | 47913    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 1.08     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 26.1     |
|    ep_rew_mean      | 26.1     |
|    exploration_rate | 0.0706   |
| time/               |          |
|    episodes         | 2524     |
|    fps              | 2        |
|    time_elapsed     | 21553    |
|    total_timesteps  | 49584    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 2.18     |
|    n_updates        | 12145    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 25       |
|    ep_rew_mean      | 25       |
|    exploration_rate | 0.0706   |
| time/               |          |
|    episodes         | 2528     |
|    fps              | 2        |
|    time_elapsed     | 21570    |
|    total_timesteps  | 49604    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 5.02     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 24.1     |
|    ep_rew_mean      | 24.1     |
|    exploration_rate | 0.0698   |
| time/               |          |
|    episodes         | 2588     |
|    fps              | 2        |
|    time_elapsed     | 22120    |
|    total_timesteps  | 50898    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 3.93     |
|    n_updates        | 12474    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 23.4     |
|    ep_rew_mean      | 23.4     |
|    exploration_rate | 0.0697   |
| time/               |          |
|    episodes         | 2592     |
|    fps              | 2        |
|    time_elapsed     | 22150    |
|    total_timesteps  | 50964    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 1.82     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 18.8     |
|    ep_rew_mean      | 18.8     |
|    exploration_rate | 0.0691   |
| time/               |          |
|    episodes         | 2652     |
|    fps              | 2        |
|    time_elapsed     | 22647    |
|    total_timesteps  | 52089    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 3.26     |
|    n_updates        | 12772    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 18.8     |
|    ep_rew_mean      | 18.8     |
|    exploration_rate | 0.069    |
| time/               |          |
|    episodes         | 2656     |
|    fps              | 2        |
|    time_elapsed     | 22686    |
|    total_timesteps  | 52180    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 1.4      |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 17.8     |
|    ep_rew_mean      | 17.8     |
|    exploration_rate | 0.0684   |
| time/               |          |
|    episodes         | 2716     |
|    fps              | 2        |
|    time_elapsed     | 23179    |
|    total_timesteps  | 53281    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 8.43     |
|    n_updates        | 13070    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 18.3     |
|    ep_rew_mean      | 18.3     |
|    exploration_rate | 0.0683   |
| time/               |          |
|    episodes         | 2720     |
|    fps              | 2        |
|    time_elapsed     | 23223    |
|    total_timesteps  | 53393    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 3.4      |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 19.7     |
|    ep_rew_mean      | 19.7     |
|    exploration_rate | 0.0676   |
| time/               |          |
|    episodes         | 2780     |
|    fps              | 2        |
|    time_elapsed     | 23766    |
|    total_timesteps  | 54655    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.36     |
|    n_updates        | 13413    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 19.9     |
|    ep_rew_mean      | 19.9     |
|    exploration_rate | 0.0675   |
| time/               |          |
|    episodes         | 2784     |
|    fps              | 2        |
|    time_elapsed     | 23796    |
|    total_timesteps  | 54724    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 3.43     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 21.1     |
|    ep_rew_mean      | 21.1     |
|    exploration_rate | 0.0667   |
| time/               |          |
|    episodes         | 2844     |
|    fps              | 2        |
|    time_elapsed     | 24361    |
|    total_timesteps  | 56076    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 3.67     |
|    n_updates        | 13768    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 21       |
|    ep_rew_mean      | 21       |
|    exploration_rate | 0.0667   |
| time/               |          |
|    episodes         | 2848     |
|    fps              | 2        |
|    time_elapsed     | 24397    |
|    total_timesteps  | 56164    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 3.74     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 22       |
|    ep_rew_mean      | 22       |
|    exploration_rate | 0.0659   |
| time/               |          |
|    episodes         | 2908     |
|    fps              | 2        |
|    time_elapsed     | 24951    |
|    total_timesteps  | 57480    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.521    |
|    n_updates        | 14119    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 23       |
|    ep_rew_mean      | 23       |
|    exploration_rate | 0.0658   |
| time/               |          |
|    episodes         | 2912     |
|    fps              | 2        |
|    time_elapsed     | 25012    |
|    total_timesteps  | 57647    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 1.89     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 24.4     |
|    ep_rew_mean      | 24.4     |
|    exploration_rate | 0.0649   |
| time/               |          |
|    episodes         | 2972     |
|    fps              | 2        |
|    time_elapsed     | 25593    |
|    total_timesteps  | 59065    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 1.09     |
|    n_updates        | 14516    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 24.4     |
|    ep_rew_mean      | 24.4     |
|    exploration_rate | 0.0649   |
| time/               |          |
|    episodes         | 2976     |
|    fps              | 2        |
|    time_elapsed     | 25624    |
|    total_timesteps  | 59133    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 1.31     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 25.7     |
|    ep_rew_mean      | 25.7     |
|    exploration_rate | 0.064    |
| time/               |          |
|    episodes         | 3036     |
|    fps              | 2        |
|    time_elapsed     | 26262    |
|    total_timesteps  | 60725    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 4.65     |
|    n_updates        | 14931    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 25.7     |
|    ep_rew_mean      | 25.7     |
|    exploration_rate | 0.0639   |
| time/               |          |
|    episodes         | 3040     |
|    fps              | 2        |
|    time_elapsed     | 26297    |
|    total_timesteps  | 60809    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 2.87     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 26.3     |
|    ep_rew_mean      | 26.3     |
|    exploration_rate | 0.0629   |
| time/               |          |
|    episodes         | 3100     |
|    fps              | 2        |
|    time_elapsed     | 26943    |
|    total_timesteps  | 62440    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 3.54     |
|    n_updates        | 15359    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 27.3     |
|    ep_rew_mean      | 27.3     |
|    exploration_rate | 0.0628   |
| time/               |          |
|    episodes         | 3104     |
|    fps              | 2        |
|    time_elapsed     | 27011    |
|    total_timesteps  | 62627    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.665    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 26.3     |
|    ep_rew_mean      | 26.3     |
|    exploration_rate | 0.062    |
| time/               |          |
|    episodes         | 3164     |
|    fps              | 2        |
|    time_elapsed     | 27616    |
|    total_timesteps  | 64102    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 1.5      |
|    n_updates        | 15775    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 25.1     |
|    ep_rew_mean      | 25.1     |
|    exploration_rate | 0.0619   |
| time/               |          |
|    episodes         | 3168     |
|    fps              | 2        |
|    time_elapsed     | 27639    |
|    total_timesteps  | 64148    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 1.1      |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 26.3     |
|    ep_rew_mean      | 26.3     |
|    exploration_rate | 0.061    |
| time/               |          |
|    episodes         | 3228     |
|    fps              | 2        |
|    time_elapsed     | 28259    |
|    total_timesteps  | 65688    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 5.55     |
|    n_updates        | 16171    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 25.4     |
|    ep_rew_mean      | 25.4     |
|    exploration_rate | 0.061    |
| time/               |          |
|    episodes         | 3232     |
|    fps              | 2        |
|    time_elapsed     | 28289    |
|    total_timesteps  | 65754    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 3.19     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 25.7     |
|    ep_rew_mean      | 25.7     |
|    exploration_rate | 0.0601   |
| time/               |          |
|    episodes         | 3292     |
|    fps              | 2        |
|    time_elapsed     | 28887    |
|    total_timesteps  | 67230    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 2.78     |
|    n_updates        | 16557    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 25.4     |
|    ep_rew_mean      | 25.4     |
|    exploration_rate | 0.06     |
| time/               |          |
|    episodes         | 3296     |
|    fps              | 2        |
|    time_elapsed     | 28925    |
|    total_timesteps  | 67324    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 4.14     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 24.7     |
|    ep_rew_mean      | 24.7     |
|    exploration_rate | 0.0592   |
| time/               |          |
|    episodes         | 3356     |
|    fps              | 2        |
|    time_elapsed     | 29530    |
|    total_timesteps  | 68807    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 6.37     |
|    n_updates        | 16951    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 25       |
|    ep_rew_mean      | 25       |
|    exploration_rate | 0.0591   |
| time/               |          |
|    episodes         | 3360     |
|    fps              | 2        |
|    time_elapsed     | 29588    |
|    total_timesteps  | 68964    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 3.35     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 29.9     |
|    ep_rew_mean      | 29.9     |
|    exploration_rate | 0.0579   |
| time/               |          |
|    episodes         | 3420     |
|    fps              | 2        |
|    time_elapsed     | 30323    |
|    total_timesteps  | 70847    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 3.05     |
|    n_updates        | 17461    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 29.6     |
|    ep_rew_mean      | 29.6     |
|    exploration_rate | 0.0579   |
| time/               |          |
|    episodes         | 3424     |
|    fps              | 2        |
|    time_elapsed     | 30360    |
|    total_timesteps  | 70933    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 2.37     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 29.1     |
|    ep_rew_mean      | 29.1     |
|    exploration_rate | 0.0569   |
| time/               |          |
|    episodes         | 3484     |
|    fps              | 2        |
|    time_elapsed     | 31045    |
|    total_timesteps  | 72653    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 4.14     |
|    n_updates        | 17913    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 28.9     |
|    ep_rew_mean      | 28.9     |
|    exploration_rate | 0.0568   |
| time/               |          |
|    episodes         | 3488     |
|    fps              | 2        |
|    time_elapsed     | 31071    |
|    total_timesteps  | 72705    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.619    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 26.6     |
|    ep_rew_mean      | 26.6     |
|    exploration_rate | 0.056    |
| time/               |          |
|    episodes         | 3548     |
|    fps              | 2        |
|    time_elapsed     | 31686    |
|    total_timesteps  | 74203    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.403    |
|    n_updates        | 18300    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 26.8     |
|    ep_rew_mean      | 26.8     |
|    exploration_rate | 0.0559   |
| time/               |          |
|    episodes         | 3552     |
|    fps              | 2        |
|    time_elapsed     | 31725    |
|    total_timesteps  | 74297    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 4.51     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 25.8     |
|    ep_rew_mean      | 25.8     |
|    exploration_rate | 0.055    |
| time/               |          |
|    episodes         | 3612     |
|    fps              | 2        |
|    time_elapsed     | 32348    |
|    total_timesteps  | 75832    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 3.81     |
|    n_updates        | 18707    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 25.6     |
|    ep_rew_mean      | 25.6     |
|    exploration_rate | 0.0549   |
| time/               |          |
|    episodes         | 3616     |
|    fps              | 2        |
|    time_elapsed     | 32382    |
|    total_timesteps  | 75909    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 3.74     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 25.3     |
|    ep_rew_mean      | 25.3     |
|    exploration_rate | 0.054    |
| time/               |          |
|    episodes         | 3676     |
|    fps              | 2        |
|    time_elapsed     | 33016    |
|    total_timesteps  | 77479    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.878    |
|    n_updates        | 19119    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 25.3     |
|    ep_rew_mean      | 25.3     |
|    exploration_rate | 0.054    |
| time/               |          |
|    episodes         | 3680     |
|    fps              | 2        |
|    time_elapsed     | 33055    |
|    total_timesteps  | 77573    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.334    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 25.6     |
|    ep_rew_mean      | 25.6     |
|    exploration_rate | 0.0531   |
| time/               |          |
|    episodes         | 3740     |
|    fps              | 2        |
|    time_elapsed     | 33667    |
|    total_timesteps  | 79089    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.242    |
|    n_updates        | 19522    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 25.6     |
|    ep_rew_mean      | 25.6     |
|    exploration_rate | 0.053    |
| time/               |          |
|    episodes         | 3744     |
|    fps              | 2        |
|    time_elapsed     | 33706    |
|    total_timesteps  | 79183    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 3.47     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 25.9     |
|    ep_rew_mean      | 25.9     |
|    exploration_rate | 0.052    |
| time/               |          |
|    episodes         | 3804     |
|    fps              | 2        |
|    time_elapsed     | 34369    |
|    total_timesteps  | 80852    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.576    |
|    n_updates        | 19962    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 26       |
|    ep_rew_mean      | 26       |
|    exploration_rate | 0.052    |
| time/               |          |
|    episodes         | 3808     |
|    fps              | 2        |
|    time_elapsed     | 34396    |
|    total_timesteps  | 80906    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 3.23     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 25.1     |
|    ep_rew_mean      | 25.1     |
|    exploration_rate | 0.0511   |
| time/               |          |
|    episodes         | 3868     |
|    fps              | 2        |
|    time_elapsed     | 35000    |
|    total_timesteps  | 82375    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 1.18     |
|    n_updates        | 20343    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 24.8     |
|    ep_rew_mean      | 24.8     |
|    exploration_rate | 0.0511   |
| time/               |          |
|    episodes         | 3872     |
|    fps              | 2        |
|    time_elapsed     | 35031    |
|    total_timesteps  | 82444    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 4.39     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 27.6     |
|    ep_rew_mean      | 27.6     |
|    exploration_rate | 0.05     |
| time/               |          |
|    episodes         | 3932     |
|    fps              | 2        |
|    time_elapsed     | 35741    |
|    total_timesteps  | 84256    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 1.09     |
|    n_updates        | 20813    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 28.3     |
|    ep_rew_mean      | 28.3     |
|    exploration_rate | 0.0499   |
| time/               |          |
|    episodes         | 3936     |
|    fps              | 2        |
|    time_elapsed     | 35792    |
|    total_timesteps  | 84389    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.812    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 26.4     |
|    ep_rew_mean      | 26.4     |
|    exploration_rate | 0.0491   |
| time/               |          |
|    episodes         | 3996     |
|    fps              | 2        |
|    time_elapsed     | 36378    |
|    total_timesteps  | 85804    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.366    |
|    n_updates        | 21200    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 26.2     |
|    ep_rew_mean      | 26.2     |
|    exploration_rate | 0.049    |
| time/               |          |
|    episodes         | 4000     |
|    fps              | 2        |
|    time_elapsed     | 36411    |
|    total_timesteps  | 85878    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.21     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 25.4     |
|    ep_rew_mean      | 25.4     |
|    exploration_rate | 0.048    |
| time/               |          |
|    episodes         | 4060     |
|    fps              | 2        |
|    time_elapsed     | 37101    |
|    total_timesteps  | 87633    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 3.84     |
|    n_updates        | 21658    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 25.5     |
|    ep_rew_mean      | 25.5     |
|    exploration_rate | 0.0479   |
| time/               |          |
|    episodes         | 4064     |
|    fps              | 2        |
|    time_elapsed     | 37128    |
|    total_timesteps  | 87693    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 7.92     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 32.5     |
|    ep_rew_mean      | 32.5     |
|    exploration_rate | 0.0467   |
| time/               |          |
|    episodes         | 4124     |
|    fps              | 2        |
|    time_elapsed     | 37941    |
|    total_timesteps  | 89841    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 4.12     |
|    n_updates        | 22210    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 33.1     |
|    ep_rew_mean      | 33.1     |
|    exploration_rate | 0.0466   |
| time/               |          |
|    episodes         | 4128     |
|    fps              | 2        |
|    time_elapsed     | 37993    |
|    total_timesteps  | 89975    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 2.57     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 30       |
|    ep_rew_mean      | 30       |
|    exploration_rate | 0.0456   |
| time/               |          |
|    episodes         | 4188     |
|    fps              | 2        |
|    time_elapsed     | 38634    |
|    total_timesteps  | 91581    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.852    |
|    n_updates        | 22645    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 29.7     |
|    ep_rew_mean      | 29.7     |
|    exploration_rate | 0.0456   |
| time/               |          |
|    episodes         | 4192     |
|    fps              | 2        |
|    time_elapsed     | 38677    |
|    total_timesteps  | 91687    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 1.68     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 28.5     |
|    ep_rew_mean      | 28.5     |
|    exploration_rate | 0.0445   |
| time/               |          |
|    episodes         | 4252     |
|    fps              | 2        |
|    time_elapsed     | 39384    |
|    total_timesteps  | 93492    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 7.48     |
|    n_updates        | 23122    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 28.5     |
|    ep_rew_mean      | 28.5     |
|    exploration_rate | 0.0445   |
| time/               |          |
|    episodes         | 4256     |
|    fps              | 2        |
|    time_elapsed     | 39416    |
|    total_timesteps  | 93565    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.958    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 26.6     |
|    ep_rew_mean      | 26.6     |
|    exploration_rate | 0.0435   |
| time/               |          |
|    episodes         | 4316     |
|    fps              | 2        |
|    time_elapsed     | 40083    |
|    total_timesteps  | 95255    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 4.11     |
|    n_updates        | 23563    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 27.3     |
|    ep_rew_mean      | 27.3     |
|    exploration_rate | 0.0434   |
| time/               |          |
|    episodes         | 4320     |
|    fps              | 2        |
|    time_elapsed     | 40128    |
|    total_timesteps  | 95364    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 1.12     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 24.8     |
|    ep_rew_mean      | 24.8     |
|    exploration_rate | 0.0425   |
| time/               |          |
|    episodes         | 4380     |
|    fps              | 2        |
|    time_elapsed     | 40726    |
|    total_timesteps  | 96817    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 5.05     |
|    n_updates        | 23954    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 24.4     |
|    ep_rew_mean      | 24.4     |
|    exploration_rate | 0.0425   |
| time/               |          |
|    episodes         | 4384     |
|    fps              | 2        |
|    time_elapsed     | 40756    |
|    total_timesteps  | 96876    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.431    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 24.3     |
|    ep_rew_mean      | 24.3     |
|    exploration_rate | 0.0416   |
| time/               |          |
|    episodes         | 4444     |
|    fps              | 2        |
|    time_elapsed     | 41346    |
|    total_timesteps  | 98304    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 4.68     |
|    n_updates        | 24325    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 23.7     |
|    ep_rew_mean      | 23.7     |
|    exploration_rate | 0.0416   |
| time/               |          |
|    episodes         | 4448     |
|    fps              | 2        |
|    time_elapsed     | 41382    |
|    total_timesteps  | 98390    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.997    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 25.6     |
|    ep_rew_mean      | 25.6     |
|    exploration_rate | 0.0406   |
| time/               |          |
|    episodes         | 4508     |
|    fps              | 2        |
|    time_elapsed     | 42032    |
|    total_timesteps  | 99997    |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.371    |
|    n_updates        | 24749    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 25.7     |
|    ep_rew_mean      | 25.7     |
|    exploration_rate | 0.0406   |
| time/               |          |
|    episodes         | 4512     |
|    fps              | 2        |
|    time_elapsed     | 42066    |
|    total_timesteps  | 100074   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.792    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 29.8     |
|    ep_rew_mean      | 29.8     |
|    exploration_rate | 0.0395   |
| time/               |          |
|    episodes         | 4572     |
|    fps              | 2        |
|    time_elapsed     | 42812    |
|    total_timesteps  | 101974   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 4.72     |
|    n_updates        | 25243    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 28.9     |
|    ep_rew_mean      | 28.9     |
|    exploration_rate | 0.0394   |
| time/               |          |
|    episodes         | 4576     |
|    fps              | 2        |
|    time_elapsed     | 42837    |
|    total_timesteps  | 102019   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.451    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 25.4     |
|    ep_rew_mean      | 25.4     |
|    exploration_rate | 0.0386   |
| time/               |          |
|    episodes         | 4636     |
|    fps              | 2        |
|    time_elapsed     | 43424    |
|    total_timesteps  | 103397   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 1.07     |
|    n_updates        | 25599    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 25.4     |
|    ep_rew_mean      | 25.4     |
|    exploration_rate | 0.0386   |
| time/               |          |
|    episodes         | 4640     |
|    fps              | 2        |
|    time_elapsed     | 43458    |
|    total_timesteps  | 103475   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 4.2      |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 22.7     |
|    ep_rew_mean      | 22.7     |
|    exploration_rate | 0.0377   |
| time/               |          |
|    episodes         | 4700     |
|    fps              | 2        |
|    time_elapsed     | 44069    |
|    total_timesteps  | 104952   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.292    |
|    n_updates        | 25987    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 23.4     |
|    ep_rew_mean      | 23.4     |
|    exploration_rate | 0.0376   |
| time/               |          |
|    episodes         | 4704     |
|    fps              | 2        |
|    time_elapsed     | 44127    |
|    total_timesteps  | 105104   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.284    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 33       |
|    ep_rew_mean      | 33       |
|    exploration_rate | 0.0362   |
| time/               |          |
|    episodes         | 4764     |
|    fps              | 2        |
|    time_elapsed     | 44999    |
|    total_timesteps  | 107442   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.484    |
|    n_updates        | 26610    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 33.4     |
|    ep_rew_mean      | 33.4     |
|    exploration_rate | 0.0361   |
| time/               |          |
|    episodes         | 4768     |
|    fps              | 2        |
|    time_elapsed     | 45054    |
|    total_timesteps  | 107586   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 2.6      |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 30.5     |
|    ep_rew_mean      | 30.5     |
|    exploration_rate | 0.0352   |
| time/               |          |
|    episodes         | 4828     |
|    fps              | 2        |
|    time_elapsed     | 45714    |
|    total_timesteps  | 109249   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 4.88     |
|    n_updates        | 27062    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 30.8     |
|    ep_rew_mean      | 30.8     |
|    exploration_rate | 0.0351   |
| time/               |          |
|    episodes         | 4832     |
|    fps              | 2        |
|    time_elapsed     | 45760    |
|    total_timesteps  | 109362   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 2.37     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 35.2     |
|    ep_rew_mean      | 35.2     |
|    exploration_rate | 0.0337   |
| time/               |          |
|    episodes         | 4892     |
|    fps              | 2        |
|    time_elapsed     | 46639    |
|    total_timesteps  | 111718   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.31     |
|    n_updates        | 27679    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 37.1     |
|    ep_rew_mean      | 37.1     |
|    exploration_rate | 0.0335   |
| time/               |          |
|    episodes         | 4896     |
|    fps              | 2        |
|    time_elapsed     | 46731    |
|    total_timesteps  | 111980   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.549    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 37       |
|    ep_rew_mean      | 37       |
|    exploration_rate | 0.0324   |
| time/               |          |
|    episodes         | 4956     |
|    fps              | 2        |
|    time_elapsed     | 47454    |
|    total_timesteps  | 113825   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 8.28     |
|    n_updates        | 28206    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 36.7     |
|    ep_rew_mean      | 36.7     |
|    exploration_rate | 0.0324   |
| time/               |          |
|    episodes         | 4960     |
|    fps              | 2        |
|    time_elapsed     | 47496    |
|    total_timesteps  | 113926   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.698    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 30.4     |
|    ep_rew_mean      | 30.4     |
|    exploration_rate | 0.0312   |
| time/               |          |
|    episodes         | 5020     |
|    fps              | 2        |
|    time_elapsed     | 48247    |
|    total_timesteps  | 115871   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.188    |
|    n_updates        | 28717    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 30.4     |
|    ep_rew_mean      | 30.4     |
|    exploration_rate | 0.0312   |
| time/               |          |
|    episodes         | 5024     |
|    fps              | 2        |
|    time_elapsed     | 48278    |
|    total_timesteps  | 115940   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.2      |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 34       |
|    ep_rew_mean      | 34       |
|    exploration_rate | 0.03     |
| time/               |          |
|    episodes         | 5084     |
|    fps              | 2        |
|    time_elapsed     | 49068    |
|    total_timesteps  | 118007   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.153    |
|    n_updates        | 29251    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 35       |
|    ep_rew_mean      | 35       |
|    exploration_rate | 0.0299   |
| time/               |          |
|    episodes         | 5088     |
|    fps              | 2        |
|    time_elapsed     | 49132    |
|    total_timesteps  | 118179   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.489    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 34.3     |
|    ep_rew_mean      | 34.3     |
|    exploration_rate | 0.0287   |
| time/               |          |
|    episodes         | 5148     |
|    fps              | 2        |
|    time_elapsed     | 49908    |
|    total_timesteps  | 120181   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.236    |
|    n_updates        | 29795    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 33.7     |
|    ep_rew_mean      | 33.7     |
|    exploration_rate | 0.0286   |
| time/               |          |
|    episodes         | 5152     |
|    fps              | 2        |
|    time_elapsed     | 49967    |
|    total_timesteps  | 120340   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.394    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 28.3     |
|    ep_rew_mean      | 28.3     |
|    exploration_rate | 0.0276   |
| time/               |          |
|    episodes         | 5212     |
|    fps              | 2        |
|    time_elapsed     | 50601    |
|    total_timesteps  | 121892   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 4.33     |
|    n_updates        | 30222    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 29.1     |
|    ep_rew_mean      | 29.1     |
|    exploration_rate | 0.0276   |
| time/               |          |
|    episodes         | 5216     |
|    fps              | 2        |
|    time_elapsed     | 50657    |
|    total_timesteps  | 122038   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 5.42     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 28.5     |
|    ep_rew_mean      | 28.5     |
|    exploration_rate | 0.0265   |
| time/               |          |
|    episodes         | 5276     |
|    fps              | 2        |
|    time_elapsed     | 51344    |
|    total_timesteps  | 123770   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 4.84     |
|    n_updates        | 30692    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 27.8     |
|    ep_rew_mean      | 27.8     |
|    exploration_rate | 0.0265   |
| time/               |          |
|    episodes         | 5280     |
|    fps              | 2        |
|    time_elapsed     | 51370    |
|    total_timesteps  | 123818   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 4.73     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 26       |
|    ep_rew_mean      | 26       |
|    exploration_rate | 0.0256   |
| time/               |          |
|    episodes         | 5340     |
|    fps              | 2        |
|    time_elapsed     | 51985    |
|    total_timesteps  | 125343   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.672    |
|    n_updates        | 31085    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 25.8     |
|    ep_rew_mean      | 25.8     |
|    exploration_rate | 0.0255   |
| time/               |          |
|    episodes         | 5344     |
|    fps              | 2        |
|    time_elapsed     | 52027    |
|    total_timesteps  | 125446   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 5.6      |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 25.6     |
|    ep_rew_mean      | 25.6     |
|    exploration_rate | 0.0246   |
| time/               |          |
|    episodes         | 5404     |
|    fps              | 2        |
|    time_elapsed     | 52666    |
|    total_timesteps  | 127025   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.217    |
|    n_updates        | 31506    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 25.2     |
|    ep_rew_mean      | 25.2     |
|    exploration_rate | 0.0246   |
| time/               |          |
|    episodes         | 5408     |
|    fps              | 2        |
|    time_elapsed     | 52701    |
|    total_timesteps  | 127104   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.317    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 25.8     |
|    ep_rew_mean      | 25.8     |
|    exploration_rate | 0.0236   |
| time/               |          |
|    episodes         | 5468     |
|    fps              | 2        |
|    time_elapsed     | 53330    |
|    total_timesteps  | 128650   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.477    |
|    n_updates        | 31912    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 24.8     |
|    ep_rew_mean      | 24.8     |
|    exploration_rate | 0.0236   |
| time/               |          |
|    episodes         | 5472     |
|    fps              | 2        |
|    time_elapsed     | 53369    |
|    total_timesteps  | 128743   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 3.61     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 21.2     |
|    ep_rew_mean      | 21.2     |
|    exploration_rate | 0.0228   |
| time/               |          |
|    episodes         | 5532     |
|    fps              | 2        |
|    time_elapsed     | 53915    |
|    total_timesteps  | 130004   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 5.07     |
|    n_updates        | 32250    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 21.6     |
|    ep_rew_mean      | 21.6     |
|    exploration_rate | 0.0227   |
| time/               |          |
|    episodes         | 5536     |
|    fps              | 2        |
|    time_elapsed     | 53971    |
|    total_timesteps  | 130156   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 5.24     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 28.2     |
|    ep_rew_mean      | 28.2     |
|    exploration_rate | 0.0216   |
| time/               |          |
|    episodes         | 5596     |
|    fps              | 2        |
|    time_elapsed     | 54722    |
|    total_timesteps  | 132070   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.161    |
|    n_updates        | 32767    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 28.9     |
|    ep_rew_mean      | 28.9     |
|    exploration_rate | 0.0215   |
| time/               |          |
|    episodes         | 5600     |
|    fps              | 2        |
|    time_elapsed     | 54779    |
|    total_timesteps  | 132224   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.303    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 31.4     |
|    ep_rew_mean      | 31.4     |
|    exploration_rate | 0.0203   |
| time/               |          |
|    episodes         | 5660     |
|    fps              | 2        |
|    time_elapsed     | 55587    |
|    total_timesteps  | 134319   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.171    |
|    n_updates        | 33329    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 30.8     |
|    ep_rew_mean      | 30.8     |
|    exploration_rate | 0.0202   |
| time/               |          |
|    episodes         | 5664     |
|    fps              | 2        |
|    time_elapsed     | 55637    |
|    total_timesteps  | 134449   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.298    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 36.5     |
|    ep_rew_mean      | 36.5     |
|    exploration_rate | 0.0191   |
| time/               |          |
|    episodes         | 5724     |
|    fps              | 2        |
|    time_elapsed     | 56355    |
|    total_timesteps  | 136288   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.78     |
|    n_updates        | 33821    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 36.2     |
|    ep_rew_mean      | 36.2     |
|    exploration_rate | 0.0191   |
| time/               |          |
|    episodes         | 5728     |
|    fps              | 2        |
|    time_elapsed     | 56386    |
|    total_timesteps  | 136360   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.347    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 32.7     |
|    ep_rew_mean      | 32.7     |
|    exploration_rate | 0.0179   |
| time/               |          |
|    episodes         | 5788     |
|    fps              | 2        |
|    time_elapsed     | 57139    |
|    total_timesteps  | 138280   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 11.3     |
|    n_updates        | 34319    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 33       |
|    ep_rew_mean      | 33       |
|    exploration_rate | 0.0179   |
| time/               |          |
|    episodes         | 5792     |
|    fps              | 2        |
|    time_elapsed     | 57178    |
|    total_timesteps  | 138369   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 3.83     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 34.3     |
|    ep_rew_mean      | 34.3     |
|    exploration_rate | 0.0167   |
| time/               |          |
|    episodes         | 5852     |
|    fps              | 2        |
|    time_elapsed     | 57963    |
|    total_timesteps  | 140400   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.275    |
|    n_updates        | 34849    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 35.2     |
|    ep_rew_mean      | 35.2     |
|    exploration_rate | 0.0165   |
| time/               |          |
|    episodes         | 5856     |
|    fps              | 2        |
|    time_elapsed     | 58045    |
|    total_timesteps  | 140632   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.487    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 31       |
|    ep_rew_mean      | 31       |
|    exploration_rate | 0.0155   |
| time/               |          |
|    episodes         | 5916     |
|    fps              | 2        |
|    time_elapsed     | 58728    |
|    total_timesteps  | 142330   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 10.8     |
|    n_updates        | 35332    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 31.5     |
|    ep_rew_mean      | 31.5     |
|    exploration_rate | 0.0154   |
| time/               |          |
|    episodes         | 5920     |
|    fps              | 2        |
|    time_elapsed     | 58781    |
|    total_timesteps  | 142464   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 8.2      |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 27.6     |
|    ep_rew_mean      | 27.6     |
|    exploration_rate | 0.0145   |
| time/               |          |
|    episodes         | 5980     |
|    fps              | 2        |
|    time_elapsed     | 59421    |
|    total_timesteps  | 144031   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.226    |
|    n_updates        | 35757    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 27.5     |
|    ep_rew_mean      | 27.5     |
|    exploration_rate | 0.0145   |
| time/               |          |
|    episodes         | 5984     |
|    fps              | 2        |
|    time_elapsed     | 59439    |
|    total_timesteps  | 144064   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 15.3     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 26.2     |
|    ep_rew_mean      | 26.2     |
|    exploration_rate | 0.0135   |
| time/               |          |
|    episodes         | 6044     |
|    fps              | 2        |
|    time_elapsed     | 60100    |
|    total_timesteps  | 145697   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.784    |
|    n_updates        | 36174    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 26.7     |
|    ep_rew_mean      | 26.7     |
|    exploration_rate | 0.0134   |
| time/               |          |
|    episodes         | 6048     |
|    fps              | 2        |
|    time_elapsed     | 60161    |
|    total_timesteps  | 145860   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 5.72     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 29.9     |
|    ep_rew_mean      | 29.9     |
|    exploration_rate | 0.0124   |
| time/               |          |
|    episodes         | 6108     |
|    fps              | 2        |
|    time_elapsed     | 60864    |
|    total_timesteps  | 147636   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.533    |
|    n_updates        | 36658    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 29.3     |
|    ep_rew_mean      | 29.3     |
|    exploration_rate | 0.0123   |
| time/               |          |
|    episodes         | 6112     |
|    fps              | 2        |
|    time_elapsed     | 60896    |
|    total_timesteps  | 147707   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.136    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 32.4     |
|    ep_rew_mean      | 32.4     |
|    exploration_rate | 0.0111   |
| time/               |          |
|    episodes         | 6172     |
|    fps              | 2        |
|    time_elapsed     | 61664    |
|    total_timesteps  | 149698   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 5.66     |
|    n_updates        | 37174    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 30.6     |
|    ep_rew_mean      | 30.6     |
|    exploration_rate | 0.0111   |
| time/               |          |
|    episodes         | 6176     |
|    fps              | 2        |
|    time_elapsed     | 61721    |
|    total_timesteps  | 149848   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 3        |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 28.4     |
|    ep_rew_mean      | 28.4     |
|    exploration_rate | 0.0101   |
| time/               |          |
|    episodes         | 6236     |
|    fps              | 2        |
|    time_elapsed     | 62344    |
|    total_timesteps  | 151369   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 5.47     |
|    n_updates        | 37592    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 28.7     |
|    ep_rew_mean      | 28.7     |
|    exploration_rate | 0.0101   |
| time/               |          |
|    episodes         | 6240     |
|    fps              | 2        |
|    time_elapsed     | 62383    |
|    total_timesteps  | 151460   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 6.47     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 28.6     |
|    ep_rew_mean      | 28.6     |
|    exploration_rate | 0.00905  |
| time/               |          |
|    episodes         | 6300     |
|    fps              | 2        |
|    time_elapsed     | 63078    |
|    total_timesteps  | 153224   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.0958   |
|    n_updates        | 38055    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 28.5     |
|    ep_rew_mean      | 28.5     |
|    exploration_rate | 0.00899  |
| time/               |          |
|    episodes         | 6304     |
|    fps              | 2        |
|    time_elapsed     | 63119    |
|    total_timesteps  | 153321   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 5.53     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 23.2     |
|    ep_rew_mean      | 23.2     |
|    exploration_rate | 0.0083   |
| time/               |          |
|    episodes         | 6364     |
|    fps              | 2        |
|    time_elapsed     | 63626    |
|    total_timesteps  | 154479   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 5.3      |
|    n_updates        | 38369    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 22.9     |
|    ep_rew_mean      | 22.9     |
|    exploration_rate | 0.00824  |
| time/               |          |
|    episodes         | 6368     |
|    fps              | 2        |
|    time_elapsed     | 63670    |
|    total_timesteps  | 154593   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.413    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 23.4     |
|    ep_rew_mean      | 23.4     |
|    exploration_rate | 0.00739  |
| time/               |          |
|    episodes         | 6428     |
|    fps              | 2        |
|    time_elapsed     | 64252    |
|    total_timesteps  | 156011   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 5.06     |
|    n_updates        | 38752    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 23.4     |
|    ep_rew_mean      | 23.4     |
|    exploration_rate | 0.00735  |
| time/               |          |
|    episodes         | 6432     |
|    fps              | 2        |
|    time_elapsed     | 64287    |
|    total_timesteps  | 156090   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 10.8     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 24.1     |
|    ep_rew_mean      | 24.1     |
|    exploration_rate | 0.00647  |
| time/               |          |
|    episodes         | 6492     |
|    fps              | 2        |
|    time_elapsed     | 64893    |
|    total_timesteps  | 157564   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 1.3      |
|    n_updates        | 39140    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 24.2     |
|    ep_rew_mean      | 24.2     |
|    exploration_rate | 0.00643  |
| time/               |          |
|    episodes         | 6496     |
|    fps              | 2        |
|    time_elapsed     | 64923    |
|    total_timesteps  | 157628   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.495    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 24       |
|    ep_rew_mean      | 24       |
|    exploration_rate | 0.0056   |
| time/               |          |
|    episodes         | 6556     |
|    fps              | 2        |
|    time_elapsed     | 65516    |
|    total_timesteps  | 159033   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.256    |
|    n_updates        | 39508    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 24.2     |
|    ep_rew_mean      | 24.2     |
|    exploration_rate | 0.00556  |
| time/               |          |
|    episodes         | 6560     |
|    fps              | 2        |
|    time_elapsed     | 65546    |
|    total_timesteps  | 159096   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 7.72     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 24.5     |
|    ep_rew_mean      | 24.5     |
|    exploration_rate | 0.00471  |
| time/               |          |
|    episodes         | 6620     |
|    fps              | 2        |
|    time_elapsed     | 66139    |
|    total_timesteps  | 160534   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 1.79     |
|    n_updates        | 39883    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 25       |
|    ep_rew_mean      | 25       |
|    exploration_rate | 0.00463  |
| time/               |          |
|    episodes         | 6624     |
|    fps              | 2        |
|    time_elapsed     | 66190    |
|    total_timesteps  | 160667   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.364    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 27       |
|    ep_rew_mean      | 27       |
|    exploration_rate | 0.00362  |
| time/               |          |
|    episodes         | 6684     |
|    fps              | 2        |
|    time_elapsed     | 66870    |
|    total_timesteps  | 162371   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 5.43     |
|    n_updates        | 40342    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 27.1     |
|    ep_rew_mean      | 27.1     |
|    exploration_rate | 0.00356  |
| time/               |          |
|    episodes         | 6688     |
|    fps              | 2        |
|    time_elapsed     | 66912    |
|    total_timesteps  | 162472   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 5.12     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 22.8     |
|    ep_rew_mean      | 22.8     |
|    exploration_rate | 0.00278  |
| time/               |          |
|    episodes         | 6748     |
|    fps              | 2        |
|    time_elapsed     | 67469    |
|    total_timesteps  | 163791   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 5.36     |
|    n_updates        | 40697    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 23.9     |
|    ep_rew_mean      | 23.9     |
|    exploration_rate | 0.00268  |
| time/               |          |
|    episodes         | 6752     |
|    fps              | 2        |
|    time_elapsed     | 67528    |
|    total_timesteps  | 163951   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.138    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 27.6     |
|    ep_rew_mean      | 27.6     |
|    exploration_rate | 0.00161  |
| time/               |          |
|    episodes         | 6812     |
|    fps              | 2        |
|    time_elapsed     | 68243    |
|    total_timesteps  | 165752   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 4.85     |
|    n_updates        | 41187    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 28.9     |
|    ep_rew_mean      | 28.9     |
|    exploration_rate | 0.00151  |
| time/               |          |
|    episodes         | 6816     |
|    fps              | 2        |
|    time_elapsed     | 68310    |
|    total_timesteps  | 165931   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 1.34     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 28.1     |
|    ep_rew_mean      | 28.1     |
|    exploration_rate | 0.000623 |
| time/               |          |
|    episodes         | 6876     |
|    fps              | 2        |
|    time_elapsed     | 68922    |
|    total_timesteps  | 167419   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.447    |
|    n_updates        | 41604    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 28.5     |
|    ep_rew_mean      | 28.5     |
|    exploration_rate | 0.00057  |
| time/               |          |
|    episodes         | 6880     |
|    fps              | 2        |
|    time_elapsed     | 68959    |
|    total_timesteps  | 167508   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 6.69     |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 29       |
|    ep_rew_mean      | 29       |
|    exploration_rate | 0.0001   |
| time/               |          |
|    episodes         | 6940     |
|    fps              | 2        |
|    time_elapsed     | 69747    |
|    total_timesteps  | 169551   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 0.21     |
|    n_updates        | 42137    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 29.2     |
|    ep_rew_mean      | 29.2     |
|    exploration_rate | 0.0001   |
| time/               |          |
|    episodes         | 6944     |
|    fps              | 2        |
|    time_elapsed     | 69797    |
|    total_timesteps  | 169681   |
| train/              |          |
|    learning_rate    | 0.0006   |
|    loss             | 6.17     |
|    n_updates      

<stable_baselines3.dqn.dqn.DQN at 0x28f686b6be0>

In [16]:
# Persist the final trained agent and its replay buffer alongside the periodic
# checkpoints. Both paths are derived from CHECKPOINT_DIR (defined earlier in
# this notebook and also passed to the training callback) so the output
# directory is configured in exactly one place instead of being repeated here.
MODEL_NAME = "FlappyBird_DQN_Medium"

# Saving the model
model.save(os.path.join(CHECKPOINT_DIR, MODEL_NAME))
# Saving replay buffer (can be restored later with model.load_replay_buffer)
model.save_replay_buffer(os.path.join(CHECKPOINT_DIR, "buffer_" + MODEL_NAME))