# Environment Setup

In [2]:
#!pip install gym gym-retro opencv-python

In [1]:
# For monitoring agent
from stable_baselines3.common.monitor import Monitor
# To vectorize and frame stack
from stable_baselines3.common.vec_env import DummyVecEnv, VecFrameStack

In [2]:
# Running Environment_Setup.ipynb to setup custom Flappy_Bird environment.
%run tools\Environment.py

In [3]:
# Directory handed to both Monitor and the model's tensorboard_log argument.
LOG_DIR = './logs/'

In [4]:
# Creating environment
def make_env():
    """Return a fresh Flappy_Bird environment wrapped in Monitor (logging to LOG_DIR)."""
    return Monitor(Flappy_Bird(), LOG_DIR)


# Pass DummyVecEnv an explicit factory instead of a lambda that closes over a
# name which is rebound on the same line; then stack 4 frames, channels last.
env = VecFrameStack(DummyVecEnv([make_env]), 4, channels_order='last')

# Setup Callback To Monitor Training Process

In [5]:
#!pip install stable-baselines3[extra]

In [6]:
# Import os for file path management
import os 
# Import Base Callback for saving models
from stable_baselines3.common.callbacks import BaseCallback

In [7]:
class TrainAndLoggingCallback(BaseCallback):
    """Periodically checkpoint the model while it trains.

    Every ``check_freq`` callback calls, the current model is written to
    ``save_path`` as ``best_model_<n_calls>``. Despite the file name, no
    evaluation takes place: each file is simply a snapshot of the model at
    that point in training.

    Args:
        check_freq: Number of callback calls between two checkpoints.
        save_path: Directory that receives the checkpoints. It is created
            when the callback is initialised. ``None`` disables saving.
        verbose: Verbosity level forwarded to ``BaseCallback``.
    """

    def __init__(self, check_freq, save_path, verbose=1):
        super().__init__(verbose)
        self.check_freq = check_freq
        self.save_path = save_path

    def _init_callback(self):
        """Create the checkpoint directory if one was configured."""
        if self.save_path is not None:
            os.makedirs(self.save_path, exist_ok=True)

    def _on_step(self):
        """Save a checkpoint on every ``check_freq``-th call.

        Returns:
            Always ``True``; this callback never asks for training to stop.
        """
        # Mirror the None check in _init_callback: without it, a callback
        # built with save_path=None would crash inside os.path.join.
        if self.save_path is not None and self.n_calls % self.check_freq == 0:
            model_path = os.path.join(self.save_path, f'best_model_{self.n_calls}')
            self.model.save(model_path)

        return True

In [8]:
# Directory passed to TrainAndLoggingCallback as save_path for model checkpoints.
CHECKPOINT_DIR = './train/'

In [9]:
# Checkpointing callback: one snapshot into CHECKPOINT_DIR every 50,000 calls.
callback = TrainAndLoggingCallback(
    save_path=CHECKPOINT_DIR,
    check_freq=50_000,
)

# Training Exploration Model

In [10]:
# Model
from stable_baselines3 import DQN

In [11]:
# DQN settings that are unpacked as keyword arguments when the model is built.
parameters = dict(
    buffer_size=300_000,
    learning_starts=2000,
    exploration_fraction=0.01,
    exploration_final_eps=0.04,
)

In [12]:
# Build the DQN agent (CNN policy) on the wrapped environment, sending
# TensorBoard logs to LOG_DIR and applying the overrides in `parameters`.
model = DQN(
    'CnnPolicy',
    env,
    verbose=1,
    tensorboard_log=LOG_DIR,
    **parameters,
)

Using cuda device


In [13]:
# Training the model
# The callback passed here checkpoints every 50,000 calls, so a 60,000-step run
# presumably yields a single checkpoint (assuming one callback call per
# timestep with the single environment — TODO confirm).
# NOTE(review): nothing visible in this section saves the model after learn()
# returns; confirm the final weights are persisted elsewhere.
# NOTE(review): the saved output below still reports exploration_rate 0.127 near
# step 19,995, which does not look like exploration_fraction=0.01 over 60,000
# steps; the output may come from a run with different settings. Re-run to refresh.
model.learn(total_timesteps=60_000, callback=callback)

Logging to ./logs/DQN_1
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.5      |
|    ep_rew_mean      | 8.5      |
|    exploration_rate | 0.999    |
| time/               |          |
|    episodes         | 4        |
|    fps              | 1        |
|    time_elapsed     | 24       |
|    total_timesteps  | 34       |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.5      |
|    ep_rew_mean      | 9.5      |
|    exploration_rate | 0.997    |
| time/               |          |
|    episodes         | 8        |
|    fps              | 1        |
|    time_elapsed     | 46       |
|    total_timesteps  | 76       |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 10.3     |
|    ep_rew_mean      | 10.3     |
|    exploration_rate | 0.995    |
| time/               |        

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 10.4     |
|    ep_rew_mean      | 10.4     |
|    exploration_rate | 0.958    |
| time/               |          |
|    episodes         | 92       |
|    fps              | 1        |
|    time_elapsed     | 500      |
|    total_timesteps  | 953      |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 10.4     |
|    ep_rew_mean      | 10.4     |
|    exploration_rate | 0.957    |
| time/               |          |
|    episodes         | 96       |
|    fps              | 1        |
|    time_elapsed     | 521      |
|    total_timesteps  | 994      |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 10.4     |
|    ep_rew_mean      | 10.4     |
|    exploration_rate | 0.955    |
| time/               |          |
|    episodes       

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 10.4     |
|    ep_rew_mean      | 10.4     |
|    exploration_rate | 0.918    |
| time/               |          |
|    episodes         | 180      |
|    fps              | 1        |
|    time_elapsed     | 975      |
|    total_timesteps  | 1869     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 10.4     |
|    ep_rew_mean      | 10.4     |
|    exploration_rate | 0.917    |
| time/               |          |
|    episodes         | 184      |
|    fps              | 1        |
|    time_elapsed     | 996      |
|    total_timesteps  | 1908     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 10.4     |
|    ep_rew_mean      | 10.4     |
|    exploration_rate | 0.915    |
| time/               |          |
|    episodes       

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 10.3     |
|    ep_rew_mean      | 10.3     |
|    exploration_rate | 0.888    |
| time/               |          |
|    episodes         | 248      |
|    fps              | 1        |
|    time_elapsed     | 1351     |
|    total_timesteps  | 2567     |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.000124 |
|    n_updates        | 141      |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 10.3     |
|    ep_rew_mean      | 10.3     |
|    exploration_rate | 0.886    |
| time/               |          |
|    episodes         | 252      |
|    fps              | 1        |
|    time_elapsed     | 1372     |
|    total_timesteps  | 2608     |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00014  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 10.3     |
|    ep_rew_mean      | 10.3     |
|    exploration_rate | 0.859    |
| time/               |          |
|    episodes         | 312      |
|    fps              | 1        |
|    time_elapsed     | 1699     |
|    total_timesteps  | 3230     |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.000155 |
|    n_updates        | 307      |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 10.3     |
|    ep_rew_mean      | 10.3     |
|    exploration_rate | 0.857    |
| time/               |          |
|    episodes         | 316      |
|    fps              | 1        |
|    time_elapsed     | 1721     |
|    total_timesteps  | 3271     |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.000215 |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 10.4     |
|    ep_rew_mean      | 10.4     |
|    exploration_rate | 0.83     |
| time/               |          |
|    episodes         | 376      |
|    fps              | 1        |
|    time_elapsed     | 2051     |
|    total_timesteps  | 3904     |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 4.41e-05 |
|    n_updates        | 475      |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 10.4     |
|    ep_rew_mean      | 10.4     |
|    exploration_rate | 0.828    |
| time/               |          |
|    episodes         | 380      |
|    fps              | 1        |
|    time_elapsed     | 2073     |
|    total_timesteps  | 3945     |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 3.71e-05 |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 10.3     |
|    ep_rew_mean      | 10.3     |
|    exploration_rate | 0.801    |
| time/               |          |
|    episodes         | 440      |
|    fps              | 1        |
|    time_elapsed     | 2399     |
|    total_timesteps  | 4562     |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 3.32e-05 |
|    n_updates        | 640      |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 10.3     |
|    ep_rew_mean      | 10.3     |
|    exploration_rate | 0.799    |
| time/               |          |
|    episodes         | 444      |
|    fps              | 1        |
|    time_elapsed     | 2420     |
|    total_timesteps  | 4601     |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 2.03e-05 |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.96     |
|    ep_rew_mean      | 9.96     |
|    exploration_rate | 0.773    |
| time/               |          |
|    episodes         | 504      |
|    fps              | 1        |
|    time_elapsed     | 2742     |
|    total_timesteps  | 5197     |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.9e-05  |
|    n_updates        | 799      |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.99     |
|    ep_rew_mean      | 9.99     |
|    exploration_rate | 0.771    |
| time/               |          |
|    episodes         | 508      |
|    fps              | 1        |
|    time_elapsed     | 2764     |
|    total_timesteps  | 5239     |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 2.98e-05 |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 10       |
|    ep_rew_mean      | 10       |
|    exploration_rate | 0.745    |
| time/               |          |
|    episodes         | 568      |
|    fps              | 1        |
|    time_elapsed     | 3088     |
|    total_timesteps  | 5843     |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 4.47e-05 |
|    n_updates        | 960      |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 10       |
|    ep_rew_mean      | 10       |
|    exploration_rate | 0.743    |
| time/               |          |
|    episodes         | 572      |
|    fps              | 1        |
|    time_elapsed     | 3110     |
|    total_timesteps  | 5883     |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.23e-05 |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 10.1     |
|    ep_rew_mean      | 10.1     |
|    exploration_rate | 0.717    |
| time/               |          |
|    episodes         | 632      |
|    fps              | 1        |
|    time_elapsed     | 3434     |
|    total_timesteps  | 6492     |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.15e-05 |
|    n_updates        | 1122     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 10.2     |
|    ep_rew_mean      | 10.2     |
|    exploration_rate | 0.715    |
| time/               |          |
|    episodes         | 636      |
|    fps              | 1        |
|    time_elapsed     | 3455     |
|    total_timesteps  | 6530     |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 2.96e-05 |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.97     |
|    ep_rew_mean      | 9.97     |
|    exploration_rate | 0.689    |
| time/               |          |
|    episodes         | 696      |
|    fps              | 1        |
|    time_elapsed     | 3777     |
|    total_timesteps  | 7123     |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 7.5e-06  |
|    n_updates        | 1280     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.94     |
|    ep_rew_mean      | 9.94     |
|    exploration_rate | 0.688    |
| time/               |          |
|    episodes         | 700      |
|    fps              | 1        |
|    time_elapsed     | 3798     |
|    total_timesteps  | 7159     |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.47e-05 |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 10       |
|    ep_rew_mean      | 10       |
|    exploration_rate | 0.661    |
| time/               |          |
|    episodes         | 760      |
|    fps              | 1        |
|    time_elapsed     | 4125     |
|    total_timesteps  | 7776     |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.17e-05 |
|    n_updates        | 1443     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.98     |
|    ep_rew_mean      | 9.98     |
|    exploration_rate | 0.659    |
| time/               |          |
|    episodes         | 764      |
|    fps              | 1        |
|    time_elapsed     | 4146     |
|    total_timesteps  | 7813     |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.45e-05 |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 10       |
|    ep_rew_mean      | 10       |
|    exploration_rate | 0.633    |
| time/               |          |
|    episodes         | 824      |
|    fps              | 1        |
|    time_elapsed     | 4471     |
|    total_timesteps  | 8417     |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 3.74e-05 |
|    n_updates        | 1604     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 10       |
|    ep_rew_mean      | 10       |
|    exploration_rate | 0.631    |
| time/               |          |
|    episodes         | 828      |
|    fps              | 1        |
|    time_elapsed     | 4492     |
|    total_timesteps  | 8453     |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 7.3e-06  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 10.1     |
|    ep_rew_mean      | 10.1     |
|    exploration_rate | 0.605    |
| time/               |          |
|    episodes         | 888      |
|    fps              | 1        |
|    time_elapsed     | 4820     |
|    total_timesteps  | 9059     |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 8.38e-05 |
|    n_updates        | 1764     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 10.1     |
|    ep_rew_mean      | 10.1     |
|    exploration_rate | 0.603    |
| time/               |          |
|    episodes         | 892      |
|    fps              | 1        |
|    time_elapsed     | 4842     |
|    total_timesteps  | 9102     |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 6.71e-05 |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.78     |
|    ep_rew_mean      | 9.78     |
|    exploration_rate | 0.577    |
| time/               |          |
|    episodes         | 952      |
|    fps              | 1        |
|    time_elapsed     | 5164     |
|    total_timesteps  | 9683     |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 2.72e-05 |
|    n_updates        | 1920     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.79     |
|    ep_rew_mean      | 9.79     |
|    exploration_rate | 0.576    |
| time/               |          |
|    episodes         | 956      |
|    fps              | 1        |
|    time_elapsed     | 5186     |
|    total_timesteps  | 9722     |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.17e-05 |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.51     |
|    ep_rew_mean      | 9.51     |
|    exploration_rate | 0.551    |
| time/               |          |
|    episodes         | 1016     |
|    fps              | 1        |
|    time_elapsed     | 5503     |
|    total_timesteps  | 10284    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0481   |
|    n_updates        | 2070     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.47     |
|    ep_rew_mean      | 9.47     |
|    exploration_rate | 0.55     |
| time/               |          |
|    episodes         | 1020     |
|    fps              | 1        |
|    time_elapsed     | 5524     |
|    total_timesteps  | 10320    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0358   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.71     |
|    ep_rew_mean      | 9.71     |
|    exploration_rate | 0.524    |
| time/               |          |
|    episodes         | 1080     |
|    fps              | 1        |
|    time_elapsed     | 5848     |
|    total_timesteps  | 10919    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.039    |
|    n_updates        | 2229     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.64     |
|    ep_rew_mean      | 9.64     |
|    exploration_rate | 0.522    |
| time/               |          |
|    episodes         | 1084     |
|    fps              | 1        |
|    time_elapsed     | 5868     |
|    total_timesteps  | 10953    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00847  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.99     |
|    ep_rew_mean      | 9.99     |
|    exploration_rate | 0.496    |
| time/               |          |
|    episodes         | 1144     |
|    fps              | 1        |
|    time_elapsed     | 6195     |
|    total_timesteps  | 11558    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0183   |
|    n_updates        | 2389     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.98     |
|    ep_rew_mean      | 9.98     |
|    exploration_rate | 0.494    |
| time/               |          |
|    episodes         | 1148     |
|    fps              | 1        |
|    time_elapsed     | 6216     |
|    total_timesteps  | 11598    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0447   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 10.1     |
|    ep_rew_mean      | 10.1     |
|    exploration_rate | 0.468    |
| time/               |          |
|    episodes         | 1208     |
|    fps              | 1        |
|    time_elapsed     | 6544     |
|    total_timesteps  | 12200    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0193   |
|    n_updates        | 2549     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 10.1     |
|    ep_rew_mean      | 10.1     |
|    exploration_rate | 0.466    |
| time/               |          |
|    episodes         | 1212     |
|    fps              | 1        |
|    time_elapsed     | 6565     |
|    total_timesteps  | 12238    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00969  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.73     |
|    ep_rew_mean      | 9.73     |
|    exploration_rate | 0.441    |
| time/               |          |
|    episodes         | 1272     |
|    fps              | 1        |
|    time_elapsed     | 6886     |
|    total_timesteps  | 12815    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0125   |
|    n_updates        | 2703     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.7      |
|    ep_rew_mean      | 9.7      |
|    exploration_rate | 0.439    |
| time/               |          |
|    episodes         | 1276     |
|    fps              | 1        |
|    time_elapsed     | 6906     |
|    total_timesteps  | 12849    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0181   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.43     |
|    ep_rew_mean      | 9.43     |
|    exploration_rate | 0.415    |
| time/               |          |
|    episodes         | 1336     |
|    fps              | 1        |
|    time_elapsed     | 7225     |
|    total_timesteps  | 13410    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00955  |
|    n_updates        | 2852     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.44     |
|    ep_rew_mean      | 9.44     |
|    exploration_rate | 0.413    |
| time/               |          |
|    episodes         | 1340     |
|    fps              | 1        |
|    time_elapsed     | 7247     |
|    total_timesteps  | 13452    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00805  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.53     |
|    ep_rew_mean      | 9.53     |
|    exploration_rate | 0.388    |
| time/               |          |
|    episodes         | 1400     |
|    fps              | 1        |
|    time_elapsed     | 7569     |
|    total_timesteps  | 14033    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00627  |
|    n_updates        | 3008     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.47     |
|    ep_rew_mean      | 9.47     |
|    exploration_rate | 0.386    |
| time/               |          |
|    episodes         | 1404     |
|    fps              | 1        |
|    time_elapsed     | 7591     |
|    total_timesteps  | 14070    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00577  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.59     |
|    ep_rew_mean      | 9.59     |
|    exploration_rate | 0.361    |
| time/               |          |
|    episodes         | 1464     |
|    fps              | 1        |
|    time_elapsed     | 7910     |
|    total_timesteps  | 14642    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00132  |
|    n_updates        | 3160     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.63     |
|    ep_rew_mean      | 9.63     |
|    exploration_rate | 0.359    |
| time/               |          |
|    episodes         | 1468     |
|    fps              | 1        |
|    time_elapsed     | 7932     |
|    total_timesteps  | 14686    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00367  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.7      |
|    ep_rew_mean      | 9.7      |
|    exploration_rate | 0.334    |
| time/               |          |
|    episodes         | 1528     |
|    fps              | 1        |
|    time_elapsed     | 8255     |
|    total_timesteps  | 15268    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0036   |
|    n_updates        | 3316     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.77     |
|    ep_rew_mean      | 9.77     |
|    exploration_rate | 0.332    |
| time/               |          |
|    episodes         | 1532     |
|    fps              | 1        |
|    time_elapsed     | 8276     |
|    total_timesteps  | 15308    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00596  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.42     |
|    ep_rew_mean      | 9.42     |
|    exploration_rate | 0.308    |
| time/               |          |
|    episodes         | 1592     |
|    fps              | 1        |
|    time_elapsed     | 8592     |
|    total_timesteps  | 15862    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00599  |
|    n_updates        | 3465     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.36     |
|    ep_rew_mean      | 9.36     |
|    exploration_rate | 0.306    |
| time/               |          |
|    episodes         | 1596     |
|    fps              | 1        |
|    time_elapsed     | 8613     |
|    total_timesteps  | 15896    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00871  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.29     |
|    ep_rew_mean      | 9.29     |
|    exploration_rate | 0.282    |
| time/               |          |
|    episodes         | 1656     |
|    fps              | 1        |
|    time_elapsed     | 8929     |
|    total_timesteps  | 16453    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00788  |
|    n_updates        | 3613     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.33     |
|    ep_rew_mean      | 9.33     |
|    exploration_rate | 0.28     |
| time/               |          |
|    episodes         | 1660     |
|    fps              | 1        |
|    time_elapsed     | 8951     |
|    total_timesteps  | 16492    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0319   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.22     |
|    ep_rew_mean      | 9.22     |
|    exploration_rate | 0.256    |
| time/               |          |
|    episodes         | 1720     |
|    fps              | 1        |
|    time_elapsed     | 9272     |
|    total_timesteps  | 17061    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0125   |
|    n_updates        | 3765     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.15     |
|    ep_rew_mean      | 9.15     |
|    exploration_rate | 0.254    |
| time/               |          |
|    episodes         | 1724     |
|    fps              | 1        |
|    time_elapsed     | 9293     |
|    total_timesteps  | 17096    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0132   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.14     |
|    ep_rew_mean      | 9.14     |
|    exploration_rate | 0.23     |
| time/               |          |
|    episodes         | 1784     |
|    fps              | 1        |
|    time_elapsed     | 9606     |
|    total_timesteps  | 17638    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0135   |
|    n_updates        | 3909     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.14     |
|    ep_rew_mean      | 9.14     |
|    exploration_rate | 0.229    |
| time/               |          |
|    episodes         | 1788     |
|    fps              | 1        |
|    time_elapsed     | 9628     |
|    total_timesteps  | 17677    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0126   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.14     |
|    ep_rew_mean      | 9.14     |
|    exploration_rate | 0.205    |
| time/               |          |
|    episodes         | 1848     |
|    fps              | 1        |
|    time_elapsed     | 9943     |
|    total_timesteps  | 18222    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00453  |
|    n_updates        | 4055     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.16     |
|    ep_rew_mean      | 9.16     |
|    exploration_rate | 0.203    |
| time/               |          |
|    episodes         | 1852     |
|    fps              | 1        |
|    time_elapsed     | 9963     |
|    total_timesteps  | 18256    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00786  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.08     |
|    ep_rew_mean      | 9.08     |
|    exploration_rate | 0.18     |
| time/               |          |
|    episodes         | 1912     |
|    fps              | 1        |
|    time_elapsed     | 10279    |
|    total_timesteps  | 18801    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00461  |
|    n_updates        | 4200     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.07     |
|    ep_rew_mean      | 9.07     |
|    exploration_rate | 0.178    |
| time/               |          |
|    episodes         | 1916     |
|    fps              | 1        |
|    time_elapsed     | 10302    |
|    total_timesteps  | 18842    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.012    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.21     |
|    ep_rew_mean      | 9.21     |
|    exploration_rate | 0.153    |
| time/               |          |
|    episodes         | 1976     |
|    fps              | 1        |
|    time_elapsed     | 10620    |
|    total_timesteps  | 19400    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0136   |
|    n_updates        | 4349     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.25     |
|    ep_rew_mean      | 9.25     |
|    exploration_rate | 0.152    |
| time/               |          |
|    episodes         | 1980     |
|    fps              | 1        |
|    time_elapsed     | 10642    |
|    total_timesteps  | 19439    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00124  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.76     |
|    ep_rew_mean      | 8.76     |
|    exploration_rate | 0.129    |
| time/               |          |
|    episodes         | 2040     |
|    fps              | 1        |
|    time_elapsed     | 10952    |
|    total_timesteps  | 19956    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00359  |
|    n_updates        | 4488     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.81     |
|    ep_rew_mean      | 8.81     |
|    exploration_rate | 0.127    |
| time/               |          |
|    episodes         | 2044     |
|    fps              | 1        |
|    time_elapsed     | 10974    |
|    total_timesteps  | 19995    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.000947 |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.79     |
|    ep_rew_mean      | 8.79     |
|    exploration_rate | 0.104    |
| time/               |          |
|    episodes         | 2104     |
|    fps              | 1        |
|    time_elapsed     | 11286    |
|    total_timesteps  | 20523    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0276   |
|    n_updates        | 4630     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.82     |
|    ep_rew_mean      | 8.82     |
|    exploration_rate | 0.103    |
| time/               |          |
|    episodes         | 2108     |
|    fps              | 1        |
|    time_elapsed     | 11307    |
|    total_timesteps  | 20559    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.014    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.75     |
|    ep_rew_mean      | 8.75     |
|    exploration_rate | 0.08     |
| time/               |          |
|    episodes         | 2168     |
|    fps              | 1        |
|    time_elapsed     | 11619    |
|    total_timesteps  | 21084    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00747  |
|    n_updates        | 4770     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.66     |
|    ep_rew_mean      | 8.66     |
|    exploration_rate | 0.0786   |
| time/               |          |
|    episodes         | 2172     |
|    fps              | 1        |
|    time_elapsed     | 11638    |
|    total_timesteps  | 21115    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0266   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.44     |
|    ep_rew_mean      | 8.44     |
|    exploration_rate | 0.0567   |
| time/               |          |
|    episodes         | 2232     |
|    fps              | 1        |
|    time_elapsed     | 11946    |
|    total_timesteps  | 21617    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00724  |
|    n_updates        | 4904     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.49     |
|    ep_rew_mean      | 8.49     |
|    exploration_rate | 0.0552   |
| time/               |          |
|    episodes         | 2236     |
|    fps              | 1        |
|    time_elapsed     | 11966    |
|    total_timesteps  | 21652    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00416  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.73     |
|    ep_rew_mean      | 8.73     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 2296     |
|    fps              | 1        |
|    time_elapsed     | 12282    |
|    total_timesteps  | 22185    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00293  |
|    n_updates        | 5046     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.7      |
|    ep_rew_mean      | 8.7      |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 2300     |
|    fps              | 1        |
|    time_elapsed     | 12302    |
|    total_timesteps  | 22218    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0052   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.75     |
|    ep_rew_mean      | 8.75     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 2360     |
|    fps              | 1        |
|    time_elapsed     | 12616    |
|    total_timesteps  | 22749    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00744  |
|    n_updates        | 5187     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.81     |
|    ep_rew_mean      | 8.81     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 2364     |
|    fps              | 1        |
|    time_elapsed     | 12638    |
|    total_timesteps  | 22791    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00446  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.67     |
|    ep_rew_mean      | 8.67     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 2424     |
|    fps              | 1        |
|    time_elapsed     | 12944    |
|    total_timesteps  | 23298    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00275  |
|    n_updates        | 5324     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.64     |
|    ep_rew_mean      | 8.64     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 2428     |
|    fps              | 1        |
|    time_elapsed     | 12964    |
|    total_timesteps  | 23329    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00544  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.45     |
|    ep_rew_mean      | 8.45     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 2488     |
|    fps              | 1        |
|    time_elapsed     | 13274    |
|    total_timesteps  | 23846    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.013    |
|    n_updates        | 5461     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.39     |
|    ep_rew_mean      | 8.39     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 2492     |
|    fps              | 1        |
|    time_elapsed     | 13294    |
|    total_timesteps  | 23875    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.006    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.55     |
|    ep_rew_mean      | 8.55     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 2552     |
|    fps              | 1        |
|    time_elapsed     | 13601    |
|    total_timesteps  | 24389    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0095   |
|    n_updates        | 5597     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.67     |
|    ep_rew_mean      | 8.67     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 2556     |
|    fps              | 1        |
|    time_elapsed     | 13624    |
|    total_timesteps  | 24429    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0119   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.57     |
|    ep_rew_mean      | 8.57     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 2616     |
|    fps              | 1        |
|    time_elapsed     | 13933    |
|    total_timesteps  | 24952    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00163  |
|    n_updates        | 5737     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.55     |
|    ep_rew_mean      | 8.55     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 2620     |
|    fps              | 1        |
|    time_elapsed     | 13952    |
|    total_timesteps  | 24981    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00446  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.7      |
|    ep_rew_mean      | 8.7      |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 2680     |
|    fps              | 1        |
|    time_elapsed     | 14264    |
|    total_timesteps  | 25503    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00463  |
|    n_updates        | 5875     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.61     |
|    ep_rew_mean      | 8.61     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 2684     |
|    fps              | 1        |
|    time_elapsed     | 14283    |
|    total_timesteps  | 25531    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00486  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.4      |
|    ep_rew_mean      | 8.4      |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 2744     |
|    fps              | 1        |
|    time_elapsed     | 14585    |
|    total_timesteps  | 26019    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0155   |
|    n_updates        | 6004     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.44     |
|    ep_rew_mean      | 8.44     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 2748     |
|    fps              | 1        |
|    time_elapsed     | 14606    |
|    total_timesteps  | 26053    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00491  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.42     |
|    ep_rew_mean      | 8.42     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 2808     |
|    fps              | 1        |
|    time_elapsed     | 14916    |
|    total_timesteps  | 26571    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00843  |
|    n_updates        | 6142     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.42     |
|    ep_rew_mean      | 8.42     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 2812     |
|    fps              | 1        |
|    time_elapsed     | 14936    |
|    total_timesteps  | 26602    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.013    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.6      |
|    ep_rew_mean      | 8.6      |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 2872     |
|    fps              | 1        |
|    time_elapsed     | 15245    |
|    total_timesteps  | 27113    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00917  |
|    n_updates        | 6278     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.65     |
|    ep_rew_mean      | 8.65     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 2876     |
|    fps              | 1        |
|    time_elapsed     | 15265    |
|    total_timesteps  | 27147    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0135   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.15     |
|    ep_rew_mean      | 8.15     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 2936     |
|    fps              | 1        |
|    time_elapsed     | 15565    |
|    total_timesteps  | 27628    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0135   |
|    n_updates        | 6406     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.1      |
|    ep_rew_mean      | 8.1      |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 2940     |
|    fps              | 1        |
|    time_elapsed     | 15585    |
|    total_timesteps  | 27662    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00431  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.33     |
|    ep_rew_mean      | 8.33     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 3000     |
|    fps              | 1        |
|    time_elapsed     | 15895    |
|    total_timesteps  | 28178    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0257   |
|    n_updates        | 6544     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.41     |
|    ep_rew_mean      | 8.41     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 3004     |
|    fps              | 1        |
|    time_elapsed     | 15916    |
|    total_timesteps  | 28212    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00554  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.54     |
|    ep_rew_mean      | 8.54     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 3064     |
|    fps              | 1        |
|    time_elapsed     | 16228    |
|    total_timesteps  | 28731    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00989  |
|    n_updates        | 6682     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.6      |
|    ep_rew_mean      | 8.6      |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 3068     |
|    fps              | 1        |
|    time_elapsed     | 16250    |
|    total_timesteps  | 28769    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00564  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.57     |
|    ep_rew_mean      | 8.57     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 3128     |
|    fps              | 1        |
|    time_elapsed     | 16559    |
|    total_timesteps  | 29282    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.000862 |
|    n_updates        | 6820     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.6      |
|    ep_rew_mean      | 8.6      |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 3132     |
|    fps              | 1        |
|    time_elapsed     | 16580    |
|    total_timesteps  | 29319    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00284  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.81     |
|    ep_rew_mean      | 8.81     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 3192     |
|    fps              | 1        |
|    time_elapsed     | 16892    |
|    total_timesteps  | 29845    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00209  |
|    n_updates        | 6961     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.78     |
|    ep_rew_mean      | 8.78     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 3196     |
|    fps              | 1        |
|    time_elapsed     | 16913    |
|    total_timesteps  | 29881    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00808  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.3      |
|    ep_rew_mean      | 8.3      |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 3256     |
|    fps              | 1        |
|    time_elapsed     | 17219    |
|    total_timesteps  | 30372    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0216   |
|    n_updates        | 7092     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.25     |
|    ep_rew_mean      | 8.25     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 3260     |
|    fps              | 1        |
|    time_elapsed     | 17239    |
|    total_timesteps  | 30402    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.012    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.34     |
|    ep_rew_mean      | 8.34     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 3320     |
|    fps              | 1        |
|    time_elapsed     | 17546    |
|    total_timesteps  | 30909    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0301   |
|    n_updates        | 7227     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.35     |
|    ep_rew_mean      | 8.35     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 3324     |
|    fps              | 1        |
|    time_elapsed     | 17565    |
|    total_timesteps  | 30938    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00562  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.25     |
|    ep_rew_mean      | 8.25     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 3384     |
|    fps              | 1        |
|    time_elapsed     | 17866    |
|    total_timesteps  | 31421    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0154   |
|    n_updates        | 7355     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.38     |
|    ep_rew_mean      | 8.38     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 3388     |
|    fps              | 1        |
|    time_elapsed     | 17888    |
|    total_timesteps  | 31463    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00464  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.42     |
|    ep_rew_mean      | 8.42     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 3448     |
|    fps              | 1        |
|    time_elapsed     | 18196    |
|    total_timesteps  | 31970    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0272   |
|    n_updates        | 7492     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.49     |
|    ep_rew_mean      | 8.49     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 3452     |
|    fps              | 1        |
|    time_elapsed     | 18218    |
|    total_timesteps  | 32009    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00595  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.84     |
|    ep_rew_mean      | 8.84     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 3512     |
|    fps              | 1        |
|    time_elapsed     | 18536    |
|    total_timesteps  | 32555    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00315  |
|    n_updates        | 7638     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.95     |
|    ep_rew_mean      | 8.95     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 3516     |
|    fps              | 1        |
|    time_elapsed     | 18557    |
|    total_timesteps  | 32592    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00416  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.84     |
|    ep_rew_mean      | 8.84     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 3576     |
|    fps              | 1        |
|    time_elapsed     | 18868    |
|    total_timesteps  | 33117    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0128   |
|    n_updates        | 7779     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.89     |
|    ep_rew_mean      | 8.89     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 3580     |
|    fps              | 1        |
|    time_elapsed     | 18889    |
|    total_timesteps  | 33155    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0157   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.91     |
|    ep_rew_mean      | 8.91     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 3640     |
|    fps              | 1        |
|    time_elapsed     | 19204    |
|    total_timesteps  | 33687    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0173   |
|    n_updates        | 7921     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.96     |
|    ep_rew_mean      | 8.96     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 3644     |
|    fps              | 1        |
|    time_elapsed     | 19225    |
|    total_timesteps  | 33724    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00284  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.8      |
|    ep_rew_mean      | 8.8      |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 3704     |
|    fps              | 1        |
|    time_elapsed     | 19538    |
|    total_timesteps  | 34253    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00545  |
|    n_updates        | 8063     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.71     |
|    ep_rew_mean      | 8.71     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 3708     |
|    fps              | 1        |
|    time_elapsed     | 19557    |
|    total_timesteps  | 34281    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00777  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.61     |
|    ep_rew_mean      | 8.61     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 3768     |
|    fps              | 1        |
|    time_elapsed     | 19865    |
|    total_timesteps  | 34791    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0187   |
|    n_updates        | 8197     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.61     |
|    ep_rew_mean      | 8.61     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 3772     |
|    fps              | 1        |
|    time_elapsed     | 19885    |
|    total_timesteps  | 34822    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00534  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.29     |
|    ep_rew_mean      | 8.29     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 3832     |
|    fps              | 1        |
|    time_elapsed     | 20189    |
|    total_timesteps  | 35314    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0118   |
|    n_updates        | 8328     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.25     |
|    ep_rew_mean      | 8.25     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 3836     |
|    fps              | 1        |
|    time_elapsed     | 20209    |
|    total_timesteps  | 35348    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0203   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.59     |
|    ep_rew_mean      | 8.59     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 3896     |
|    fps              | 1        |
|    time_elapsed     | 20520    |
|    total_timesteps  | 35866    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00333  |
|    n_updates        | 8466     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.68     |
|    ep_rew_mean      | 8.68     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 3900     |
|    fps              | 1        |
|    time_elapsed     | 20542    |
|    total_timesteps  | 35904    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00327  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.54     |
|    ep_rew_mean      | 8.54     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 3960     |
|    fps              | 1        |
|    time_elapsed     | 20847    |
|    total_timesteps  | 36406    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00979  |
|    n_updates        | 8601     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.49     |
|    ep_rew_mean      | 8.49     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 3964     |
|    fps              | 1        |
|    time_elapsed     | 20867    |
|    total_timesteps  | 36440    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00411  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.63     |
|    ep_rew_mean      | 8.63     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 4024     |
|    fps              | 1        |
|    time_elapsed     | 21178    |
|    total_timesteps  | 36952    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00407  |
|    n_updates        | 8737     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.57     |
|    ep_rew_mean      | 8.57     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 4028     |
|    fps              | 1        |
|    time_elapsed     | 21198    |
|    total_timesteps  | 36985    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00258  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.39     |
|    ep_rew_mean      | 8.39     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 4088     |
|    fps              | 1        |
|    time_elapsed     | 21505    |
|    total_timesteps  | 37484    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0112   |
|    n_updates        | 8870     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.38     |
|    ep_rew_mean      | 8.38     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 4092     |
|    fps              | 1        |
|    time_elapsed     | 21526    |
|    total_timesteps  | 37521    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0035   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.64     |
|    ep_rew_mean      | 8.64     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 4152     |
|    fps              | 1        |
|    time_elapsed     | 21840    |
|    total_timesteps  | 38054    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0136   |
|    n_updates        | 9013     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.67     |
|    ep_rew_mean      | 8.67     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 4156     |
|    fps              | 1        |
|    time_elapsed     | 21863    |
|    total_timesteps  | 38095    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.032    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.11     |
|    ep_rew_mean      | 9.11     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 4216     |
|    fps              | 1        |
|    time_elapsed     | 22179    |
|    total_timesteps  | 38633    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00476  |
|    n_updates        | 9158     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.08     |
|    ep_rew_mean      | 9.08     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 4220     |
|    fps              | 1        |
|    time_elapsed     | 22199    |
|    total_timesteps  | 38664    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00104  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.79     |
|    ep_rew_mean      | 8.79     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 4280     |
|    fps              | 1        |
|    time_elapsed     | 22512    |
|    total_timesteps  | 39193    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0246   |
|    n_updates        | 9298     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.8      |
|    ep_rew_mean      | 8.8      |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 4284     |
|    fps              | 1        |
|    time_elapsed     | 22534    |
|    total_timesteps  | 39232    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0031   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.63     |
|    ep_rew_mean      | 8.63     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 4344     |
|    fps              | 1        |
|    time_elapsed     | 22841    |
|    total_timesteps  | 39736    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00828  |
|    n_updates        | 9433     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.6      |
|    ep_rew_mean      | 8.6      |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 4348     |
|    fps              | 1        |
|    time_elapsed     | 22861    |
|    total_timesteps  | 39769    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00629  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.65     |
|    ep_rew_mean      | 8.65     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 4408     |
|    fps              | 1        |
|    time_elapsed     | 23176    |
|    total_timesteps  | 40295    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0134   |
|    n_updates        | 9573     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.67     |
|    ep_rew_mean      | 8.67     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 4412     |
|    fps              | 1        |
|    time_elapsed     | 23196    |
|    total_timesteps  | 40325    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.028    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.68     |
|    ep_rew_mean      | 8.68     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 4472     |
|    fps              | 1        |
|    time_elapsed     | 23506    |
|    total_timesteps  | 40837    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0195   |
|    n_updates        | 9709     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.73     |
|    ep_rew_mean      | 8.73     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 4476     |
|    fps              | 1        |
|    time_elapsed     | 23527    |
|    total_timesteps  | 40873    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0204   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.02     |
|    ep_rew_mean      | 9.02     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 4536     |
|    fps              | 1        |
|    time_elapsed     | 23845    |
|    total_timesteps  | 41425    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00901  |
|    n_updates        | 9856     |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.06     |
|    ep_rew_mean      | 9.06     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 4540     |
|    fps              | 1        |
|    time_elapsed     | 23867    |
|    total_timesteps  | 41465    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00815  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.51     |
|    ep_rew_mean      | 9.51     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 4600     |
|    fps              | 1        |
|    time_elapsed     | 24190    |
|    total_timesteps  | 42032    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0103   |
|    n_updates        | 10007    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.41     |
|    ep_rew_mean      | 9.41     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 4604     |
|    fps              | 1        |
|    time_elapsed     | 24210    |
|    total_timesteps  | 42062    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00865  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.18     |
|    ep_rew_mean      | 9.18     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 4664     |
|    fps              | 1        |
|    time_elapsed     | 24525    |
|    total_timesteps  | 42603    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00749  |
|    n_updates        | 10150    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.24     |
|    ep_rew_mean      | 9.24     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 4668     |
|    fps              | 1        |
|    time_elapsed     | 24547    |
|    total_timesteps  | 42641    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00929  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.02     |
|    ep_rew_mean      | 9.02     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 4728     |
|    fps              | 1        |
|    time_elapsed     | 24864    |
|    total_timesteps  | 43185    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0132   |
|    n_updates        | 10296    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.09     |
|    ep_rew_mean      | 9.09     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 4732     |
|    fps              | 1        |
|    time_elapsed     | 24886    |
|    total_timesteps  | 43223    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0066   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.12     |
|    ep_rew_mean      | 9.12     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 4792     |
|    fps              | 1        |
|    time_elapsed     | 25208    |
|    total_timesteps  | 43788    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00798  |
|    n_updates        | 10446    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.16     |
|    ep_rew_mean      | 9.16     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 4796     |
|    fps              | 1        |
|    time_elapsed     | 25229    |
|    total_timesteps  | 43820    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0497   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.8      |
|    ep_rew_mean      | 8.8      |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 4856     |
|    fps              | 1        |
|    time_elapsed     | 25539    |
|    total_timesteps  | 44341    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0199   |
|    n_updates        | 10585    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.83     |
|    ep_rew_mean      | 8.83     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 4860     |
|    fps              | 1        |
|    time_elapsed     | 25559    |
|    total_timesteps  | 44372    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0243   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.78     |
|    ep_rew_mean      | 8.78     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 4920     |
|    fps              | 1        |
|    time_elapsed     | 25873    |
|    total_timesteps  | 44902    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0136   |
|    n_updates        | 10725    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.81     |
|    ep_rew_mean      | 8.81     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 4924     |
|    fps              | 1        |
|    time_elapsed     | 25893    |
|    total_timesteps  | 44933    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00895  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.99     |
|    ep_rew_mean      | 8.99     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 4984     |
|    fps              | 1        |
|    time_elapsed     | 26212    |
|    total_timesteps  | 45486    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00252  |
|    n_updates        | 10871    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9        |
|    ep_rew_mean      | 9        |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 4988     |
|    fps              | 1        |
|    time_elapsed     | 26233    |
|    total_timesteps  | 45524    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0119   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.23     |
|    ep_rew_mean      | 9.23     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 5048     |
|    fps              | 1        |
|    time_elapsed     | 26549    |
|    total_timesteps  | 46064    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0169   |
|    n_updates        | 11015    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.21     |
|    ep_rew_mean      | 9.21     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 5052     |
|    fps              | 1        |
|    time_elapsed     | 26571    |
|    total_timesteps  | 46105    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00874  |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.09     |
|    ep_rew_mean      | 9.09     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 5112     |
|    fps              | 1        |
|    time_elapsed     | 26885    |
|    total_timesteps  | 46641    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00939  |
|    n_updates        | 11160    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.12     |
|    ep_rew_mean      | 9.12     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 5116     |
|    fps              | 1        |
|    time_elapsed     | 26908    |
|    total_timesteps  | 46683    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0221   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.96     |
|    ep_rew_mean      | 8.96     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 5176     |
|    fps              | 1        |
|    time_elapsed     | 27224    |
|    total_timesteps  | 47229    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0124   |
|    n_updates        | 11307    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 8.88     |
|    ep_rew_mean      | 8.88     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 5180     |
|    fps              | 1        |
|    time_elapsed     | 27244    |
|    total_timesteps  | 47260    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0141   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.04     |
|    ep_rew_mean      | 9.04     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 5240     |
|    fps              | 1        |
|    time_elapsed     | 27563    |
|    total_timesteps  | 47809    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0103   |
|    n_updates        | 11452    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.08     |
|    ep_rew_mean      | 9.08     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 5244     |
|    fps              | 1        |
|    time_elapsed     | 27584    |
|    total_timesteps  | 47847    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0158   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.41     |
|    ep_rew_mean      | 9.41     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 5304     |
|    fps              | 1        |
|    time_elapsed     | 27908    |
|    total_timesteps  | 48412    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0057   |
|    n_updates        | 11602    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.44     |
|    ep_rew_mean      | 9.44     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 5308     |
|    fps              | 1        |
|    time_elapsed     | 27929    |
|    total_timesteps  | 48449    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0099   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.44     |
|    ep_rew_mean      | 9.44     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 5368     |
|    fps              | 1        |
|    time_elapsed     | 28251    |
|    total_timesteps  | 49017    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0138   |
|    n_updates        | 11754    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.46     |
|    ep_rew_mean      | 9.46     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 5372     |
|    fps              | 1        |
|    time_elapsed     | 28273    |
|    total_timesteps  | 49057    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0129   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.46     |
|    ep_rew_mean      | 9.46     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 5432     |
|    fps              | 1        |
|    time_elapsed     | 28592    |
|    total_timesteps  | 49609    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00864  |
|    n_updates        | 11902    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.42     |
|    ep_rew_mean      | 9.42     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 5436     |
|    fps              | 1        |
|    time_elapsed     | 28613    |
|    total_timesteps  | 49646    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0134   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.52     |
|    ep_rew_mean      | 9.52     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 5496     |
|    fps              | 1        |
|    time_elapsed     | 28938    |
|    total_timesteps  | 50219    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0677   |
|    n_updates        | 12054    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.52     |
|    ep_rew_mean      | 9.52     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 5500     |
|    fps              | 1        |
|    time_elapsed     | 28960    |
|    total_timesteps  | 50259    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0317   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.66     |
|    ep_rew_mean      | 9.66     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 5560     |
|    fps              | 1        |
|    time_elapsed     | 29291    |
|    total_timesteps  | 50852    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0365   |
|    n_updates        | 12212    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.77     |
|    ep_rew_mean      | 9.77     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 5564     |
|    fps              | 1        |
|    time_elapsed     | 29313    |
|    total_timesteps  | 50891    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0272   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.73     |
|    ep_rew_mean      | 9.73     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 5624     |
|    fps              | 1        |
|    time_elapsed     | 29639    |
|    total_timesteps  | 51470    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0359   |
|    n_updates        | 12367    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.69     |
|    ep_rew_mean      | 9.69     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 5628     |
|    fps              | 1        |
|    time_elapsed     | 29661    |
|    total_timesteps  | 51507    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0197   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.79     |
|    ep_rew_mean      | 9.79     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 5688     |
|    fps              | 1        |
|    time_elapsed     | 29989    |
|    total_timesteps  | 52102    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0273   |
|    n_updates        | 12525    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.79     |
|    ep_rew_mean      | 9.79     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 5692     |
|    fps              | 1        |
|    time_elapsed     | 30011    |
|    total_timesteps  | 52142    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0265   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.9      |
|    ep_rew_mean      | 9.9      |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 5752     |
|    fps              | 1        |
|    time_elapsed     | 30341    |
|    total_timesteps  | 52740    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0191   |
|    n_updates        | 12684    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.9      |
|    ep_rew_mean      | 9.9      |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 5756     |
|    fps              | 1        |
|    time_elapsed     | 30363    |
|    total_timesteps  | 52780    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0201   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.68     |
|    ep_rew_mean      | 9.68     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 5816     |
|    fps              | 1        |
|    time_elapsed     | 30685    |
|    total_timesteps  | 53344    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0327   |
|    n_updates        | 12835    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.64     |
|    ep_rew_mean      | 9.64     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 5820     |
|    fps              | 1        |
|    time_elapsed     | 30706    |
|    total_timesteps  | 53381    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0361   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.58     |
|    ep_rew_mean      | 9.58     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 5880     |
|    fps              | 1        |
|    time_elapsed     | 31035    |
|    total_timesteps  | 53974    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0292   |
|    n_updates        | 12993    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.58     |
|    ep_rew_mean      | 9.58     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 5884     |
|    fps              | 1        |
|    time_elapsed     | 31057    |
|    total_timesteps  | 54014    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0134   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.67     |
|    ep_rew_mean      | 9.67     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 5944     |
|    fps              | 1        |
|    time_elapsed     | 31381    |
|    total_timesteps  | 54583    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0267   |
|    n_updates        | 13145    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.66     |
|    ep_rew_mean      | 9.66     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 5948     |
|    fps              | 1        |
|    time_elapsed     | 31403    |
|    total_timesteps  | 54623    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0191   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.79     |
|    ep_rew_mean      | 9.79     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 6008     |
|    fps              | 1        |
|    time_elapsed     | 31733    |
|    total_timesteps  | 55223    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0221   |
|    n_updates        | 13305    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.8      |
|    ep_rew_mean      | 9.8      |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 6012     |
|    fps              | 1        |
|    time_elapsed     | 31755    |
|    total_timesteps  | 55263    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0357   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.79     |
|    ep_rew_mean      | 9.79     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 6072     |
|    fps              | 1        |
|    time_elapsed     | 32081    |
|    total_timesteps  | 55842    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0392   |
|    n_updates        | 13460    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.79     |
|    ep_rew_mean      | 9.79     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 6076     |
|    fps              | 1        |
|    time_elapsed     | 32103    |
|    total_timesteps  | 55883    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0108   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.64     |
|    ep_rew_mean      | 9.64     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 6136     |
|    fps              | 1        |
|    time_elapsed     | 32431    |
|    total_timesteps  | 56465    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0196   |
|    n_updates        | 13616    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.64     |
|    ep_rew_mean      | 9.64     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 6140     |
|    fps              | 1        |
|    time_elapsed     | 32453    |
|    total_timesteps  | 56505    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0106   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.75     |
|    ep_rew_mean      | 9.75     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 6200     |
|    fps              | 1        |
|    time_elapsed     | 32778    |
|    total_timesteps  | 57081    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0367   |
|    n_updates        | 13770    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.76     |
|    ep_rew_mean      | 9.76     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 6204     |
|    fps              | 1        |
|    time_elapsed     | 32800    |
|    total_timesteps  | 57122    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0805   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.6      |
|    ep_rew_mean      | 9.6      |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 6264     |
|    fps              | 1        |
|    time_elapsed     | 33125    |
|    total_timesteps  | 57699    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0187   |
|    n_updates        | 13924    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.66     |
|    ep_rew_mean      | 9.66     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 6268     |
|    fps              | 1        |
|    time_elapsed     | 33148    |
|    total_timesteps  | 57740    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0202   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.74     |
|    ep_rew_mean      | 9.74     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 6328     |
|    fps              | 1        |
|    time_elapsed     | 33475    |
|    total_timesteps  | 58330    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0272   |
|    n_updates        | 14082    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.74     |
|    ep_rew_mean      | 9.74     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 6332     |
|    fps              | 1        |
|    time_elapsed     | 33497    |
|    total_timesteps  | 58369    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0207   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.74     |
|    ep_rew_mean      | 9.74     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 6392     |
|    fps              | 1        |
|    time_elapsed     | 33824    |
|    total_timesteps  | 58952    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0263   |
|    n_updates        | 14237    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.74     |
|    ep_rew_mean      | 9.74     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 6396     |
|    fps              | 1        |
|    time_elapsed     | 33846    |
|    total_timesteps  | 58991    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0354   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.77     |
|    ep_rew_mean      | 9.77     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 6456     |
|    fps              | 1        |
|    time_elapsed     | 34175    |
|    total_timesteps  | 59582    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0533   |
|    n_updates        | 14395    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.79     |
|    ep_rew_mean      | 9.79     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 6460     |
|    fps              | 1        |
|    time_elapsed     | 34197    |
|    total_timesteps  | 59624    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0214   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.97     |
|    ep_rew_mean      | 9.97     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 6520     |
|    fps              | 1        |
|    time_elapsed     | 34526    |
|    total_timesteps  | 60217    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.113    |
|    n_updates        | 14554    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.96     |
|    ep_rew_mean      | 9.96     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 6524     |
|    fps              | 1        |
|    time_elapsed     | 34548    |
|    total_timesteps  | 60257    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0321   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.9      |
|    ep_rew_mean      | 9.9      |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 6584     |
|    fps              | 1        |
|    time_elapsed     | 34879    |
|    total_timesteps  | 60852    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0302   |
|    n_updates        | 14712    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.89     |
|    ep_rew_mean      | 9.89     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 6588     |
|    fps              | 1        |
|    time_elapsed     | 34901    |
|    total_timesteps  | 60891    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0414   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.96     |
|    ep_rew_mean      | 9.96     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 6648     |
|    fps              | 1        |
|    time_elapsed     | 35231    |
|    total_timesteps  | 61485    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0357   |
|    n_updates        | 14871    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.97     |
|    ep_rew_mean      | 9.97     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 6652     |
|    fps              | 1        |
|    time_elapsed     | 35253    |
|    total_timesteps  | 61525    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0218   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.96     |
|    ep_rew_mean      | 9.96     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 6712     |
|    fps              | 1        |
|    time_elapsed     | 35585    |
|    total_timesteps  | 62123    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0374   |
|    n_updates        | 15030    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.94     |
|    ep_rew_mean      | 9.94     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 6716     |
|    fps              | 1        |
|    time_elapsed     | 35607    |
|    total_timesteps  | 62161    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.025    |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.94     |
|    ep_rew_mean      | 9.94     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 6776     |
|    fps              | 1        |
|    time_elapsed     | 35938    |
|    total_timesteps  | 62759    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0197   |
|    n_updates        | 15189    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.94     |
|    ep_rew_mean      | 9.94     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 6780     |
|    fps              | 1        |
|    time_elapsed     | 35960    |
|    total_timesteps  | 62799    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0121   |
|    n_updates      

----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.93     |
|    ep_rew_mean      | 9.93     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 6840     |
|    fps              | 1        |
|    time_elapsed     | 36292    |
|    total_timesteps  | 63396    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0146   |
|    n_updates        | 15348    |
----------------------------------
----------------------------------
| rollout/            |          |
|    ep_len_mean      | 9.92     |
|    ep_rew_mean      | 9.92     |
|    exploration_rate | 0.04     |
| time/               |          |
|    episodes         | 6844     |
|    fps              | 1        |
|    time_elapsed     | 36314    |
|    total_timesteps  | 63435    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0197   |
|    n_updates      

KeyboardInterrupt: 

In [None]:
# Saving the final model alongside the periodic checkpoints.
# CHECKPOINT_DIR ('./train/') is the directory the training callback writes
# its 'best_model_<n>' snapshots to; building the path from it (instead of
# repeating the folder name as a literal) keeps both locations in sync if
# the constant is ever changed.
model.save(os.path.join(CHECKPOINT_DIR, "DQN-FlappyBird.zip"))