# Simulation 2.2 - Training the agents


## Importing libraries

In [1]:
import numpy as np
import matplotlib.pyplot as plt
from scipy.signal import savgol_filter as SGfilter
from IPython.display import clear_output, display
import datetime
import joblib
from tqdm import tqdm

import const
import utilities as ut


import gym
import ctfsql
from stable_baselines3.common.vec_env import DummyVecEnv
from stable_baselines3 import DQN
import evaluate as ev

## Defining the parameters of the simulations

In [2]:
# Sizing of the experiment.
# n_simulations: number of DQN agents that are created and trained.
n_simulations = 10
# n_episodes_training: length of the last axis of the `train_data` buffer.
# NOTE(review): the training cell passes its own hard-coded timestep budget to
# `learn()`, so changing this value alone does not change how long agents train.
n_episodes_training = 1_000_000
# n_episodes_test: length of the last axis of the `test_data` buffer.
n_episodes_test = 100

In [3]:
# Single environment instance handed to every agent created below.
# NOTE(review): all agents share this one object; that is only safe because they
# are trained one after another -- presumably each `learn()` call resets the
# environment before collecting experience; confirm for ctfsql.
env = gym.make('ctfsql-v0')

# One DQN agent per simulation run.
#   verbose : only the first agent (i == 0) logs its progress; passed as an int
#             because Stable-Baselines3 documents `verbose` as an integer level.
#   seed    : each agent gets its own fixed seed so that a "Restart & Run All"
#             repeats the same experiment instead of producing new random runs.
#             NOTE(review): this assumes the environment draws its randomness
#             from the generators Stable-Baselines3 seeds -- verify for ctfsql.
#   exploration_initial_eps == exploration_final_eps == 0.1 : the epsilon-greedy
#             exploration rate is held constant at 0.1 (no annealing).
dqn_models = [
    DQN(
        'MlpPolicy',
        env,
        verbose=int(i == 0),
        seed=i,
        exploration_initial_eps=0.1,
        exploration_final_eps=0.1,
    )
    for i in range(n_simulations)
]

Using cpu device
Wrapping the env in a DummyVecEnv.


## Running the simulations

In [4]:
# Zero-initialised result buffers: one slab per simulation, 3 rows each, and one
# column per training / test episode.
# NOTE(review): nothing in this cell writes to them -- presumably they are filled
# by a later cell; confirm, since `train_data` alone is a large float64 array.
train_data = np.zeros(shape=(n_simulations, 3, n_episodes_training))
test_data = np.zeros(shape=(n_simulations, 3, n_episodes_test))

# Train the agents one after another and persist each one right after training.
for i in tqdm(range(n_simulations)):
    # The timestep budget is a literal here, independent of n_episodes_training.
    dqn_models[i].learn(total_timesteps=10**6)

    # Microsecond-resolution timestamp taken after training finished; it makes
    # the file name unique across repeated executions of this cell.
    timestamp = f"{datetime.datetime.now():%Y%m%d%H%M%S%f}"

    # File name: <simulation index> + 'ignore_simul5_' + <timestamp>.
    dqn_models[i].save(f"{i}ignore_simul5_{timestamp}")


  0%|                                                                                           | 0/10 [00:00<?, ?it/s]

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 4        |
|    fps              | 20579    |
|    time_elapsed     | 0        |
|    total timesteps  | 103      |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 8        |
|    fps              | 20751    |
|    time_elapsed     | 0        |
|    total timesteps  | 270      |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 12       |
|    fps              | 20731    |
|    time_elapsed     | 0        |
|    total timesteps  | 498      |
----------------------------------
----------------------------------
| rollout/          

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 112      |
|    fps              | 22566    |
|    time_elapsed     | 0        |
|    total timesteps  | 6392     |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 116      |
|    fps              | 22555    |
|    time_elapsed     | 0        |
|    total timesteps  | 6502     |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 120      |
|    fps              | 22518    |
|    time_elapsed     | 0        |
|    total timesteps  | 6694     |
----------------------------------
----------------------------------
| rollout/          

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 220      |
|    fps              | 22558    |
|    time_elapsed     | 0        |
|    total timesteps  | 12825    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 224      |
|    fps              | 22537    |
|    time_elapsed     | 0        |
|    total timesteps  | 13061    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 228      |
|    fps              | 22575    |
|    time_elapsed     | 0        |
|    total timesteps  | 13490    |
----------------------------------
----------------------------------
| rollout/          

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 328      |
|    fps              | 22597    |
|    time_elapsed     | 0        |
|    total timesteps  | 18592    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 332      |
|    fps              | 22591    |
|    time_elapsed     | 0        |
|    total timesteps  | 18836    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 336      |
|    fps              | 22585    |
|    time_elapsed     | 0        |
|    total timesteps  | 18921    |
----------------------------------
----------------------------------
| rollout/          

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 436      |
|    fps              | 22477    |
|    time_elapsed     | 1        |
|    total timesteps  | 23915    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 440      |
|    fps              | 22469    |
|    time_elapsed     | 1        |
|    total timesteps  | 24064    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 444      |
|    fps              | 22492    |
|    time_elapsed     | 1        |
|    total timesteps  | 24427    |
----------------------------------
----------------------------------
| rollout/          

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 544      |
|    fps              | 22486    |
|    time_elapsed     | 1        |
|    total timesteps  | 29439    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 548      |
|    fps              | 22490    |
|    time_elapsed     | 1        |
|    total timesteps  | 29715    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 552      |
|    fps              | 22499    |
|    time_elapsed     | 1        |
|    total timesteps  | 29951    |
----------------------------------
----------------------------------
| rollout/          

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 652      |
|    fps              | 22474    |
|    time_elapsed     | 1        |
|    total timesteps  | 34867    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 656      |
|    fps              | 22458    |
|    time_elapsed     | 1        |
|    total timesteps  | 35000    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 660      |
|    fps              | 22457    |
|    time_elapsed     | 1        |
|    total timesteps  | 35133    |
----------------------------------
----------------------------------
| rollout/          

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 760      |
|    fps              | 22464    |
|    time_elapsed     | 1        |
|    total timesteps  | 39843    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 764      |
|    fps              | 22447    |
|    time_elapsed     | 1        |
|    total timesteps  | 40016    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 768      |
|    fps              | 22442    |
|    time_elapsed     | 1        |
|    total timesteps  | 40298    |
----------------------------------
----------------------------------
| rollout/          

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 868      |
|    fps              | 22444    |
|    time_elapsed     | 2        |
|    total timesteps  | 45199    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 872      |
|    fps              | 22435    |
|    time_elapsed     | 2        |
|    total timesteps  | 45405    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 876      |
|    fps              | 22429    |
|    time_elapsed     | 2        |
|    total timesteps  | 45484    |
----------------------------------
----------------------------------
| rollout/          

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 968      |
|    fps              | 4007     |
|    time_elapsed     | 13       |
|    total timesteps  | 55031    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00132  |
|    n_updates        | 1257     |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 972      |
|    fps              | 3614     |
|    time_elapsed     | 15       |
|    total timesteps  | 55781    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.322    |
|    n_updates        | 1445     |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 1044     |
|    fps              | 1364     |
|    time_elapsed     | 51       |
|    total timesteps  | 70540    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.377    |
|    n_updates        | 5134     |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 1048     |
|    fps              | 1342     |
|    time_elapsed     | 52       |
|    total timesteps  | 71015    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.373    |
|    n_updates        | 5253     |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 1120     |
|    fps              | 1095     |
|    time_elapsed     | 71       |
|    total timesteps  | 78649    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.373    |
|    n_updates        | 7162     |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 1124     |
|    fps              | 1077     |
|    time_elapsed     | 73       |
|    total timesteps  | 79400    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00114  |
|    n_updates        | 7349     |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 1196     |
|    fps              | 951      |
|    time_elapsed     | 90       |
|    total timesteps  | 86315    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00209  |
|    n_updates        | 9078     |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 1200     |
|    fps              | 949      |
|    time_elapsed     | 90       |
|    total timesteps  | 86417    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.000795 |
|    n_updates        | 9104     |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 1272     |
|    fps              | 873      |
|    time_elapsed     | 105      |
|    total timesteps  | 92276    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00197  |
|    n_updates        | 10568    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 1276     |
|    fps              | 868      |
|    time_elapsed     | 106      |
|    total timesteps  | 92724    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00188  |
|    n_updates        | 10680    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 1348     |
|    fps              | 819      |
|    time_elapsed     | 119      |
|    total timesteps  | 98091    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00162  |
|    n_updates        | 12022    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 1352     |
|    fps              | 817      |
|    time_elapsed     | 120      |
|    total timesteps  | 98416    |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0014   |
|    n_updates        | 12103    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 1424     |
|    fps              | 777      |
|    time_elapsed     | 133      |
|    total timesteps  | 103726   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00212  |
|    n_updates        | 13431    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 1428     |
|    fps              | 776      |
|    time_elapsed     | 133      |
|    total timesteps  | 103930   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.889    |
|    n_updates        | 13482    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 1500     |
|    fps              | 744      |
|    time_elapsed     | 146      |
|    total timesteps  | 109022   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00452  |
|    n_updates        | 14755    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 1504     |
|    fps              | 743      |
|    time_elapsed     | 146      |
|    total timesteps  | 109163   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00284  |
|    n_updates        | 14790    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 1576     |
|    fps              | 717      |
|    time_elapsed     | 158      |
|    total timesteps  | 114061   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00165  |
|    n_updates        | 16015    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 1580     |
|    fps              | 715      |
|    time_elapsed     | 159      |
|    total timesteps  | 114465   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00157  |
|    n_updates        | 16116    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 1652     |
|    fps              | 697      |
|    time_elapsed     | 169      |
|    total timesteps  | 118521   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.33     |
|    n_updates        | 17130    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 1656     |
|    fps              | 695      |
|    time_elapsed     | 170      |
|    total timesteps  | 118933   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00166  |
|    n_updates        | 17233    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 1728     |
|    fps              | 675      |
|    time_elapsed     | 184      |
|    total timesteps  | 124228   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.479    |
|    n_updates        | 18556    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 1732     |
|    fps              | 673      |
|    time_elapsed     | 185      |
|    total timesteps  | 124778   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.51     |
|    n_updates        | 18694    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 1804     |
|    fps              | 660      |
|    time_elapsed     | 194      |
|    total timesteps  | 128407   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0013   |
|    n_updates        | 19601    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 1808     |
|    fps              | 660      |
|    time_elapsed     | 194      |
|    total timesteps  | 128482   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00309  |
|    n_updates        | 19620    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 1880     |
|    fps              | 646      |
|    time_elapsed     | 205      |
|    total timesteps  | 133111   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.531    |
|    n_updates        | 20777    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 1884     |
|    fps              | 645      |
|    time_elapsed     | 206      |
|    total timesteps  | 133415   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00435  |
|    n_updates        | 20853    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 1956     |
|    fps              | 634      |
|    time_elapsed     | 216      |
|    total timesteps  | 137307   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00214  |
|    n_updates        | 21826    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 1960     |
|    fps              | 633      |
|    time_elapsed     | 216      |
|    total timesteps  | 137518   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00205  |
|    n_updates        | 21879    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 2032     |
|    fps              | 623      |
|    time_elapsed     | 227      |
|    total timesteps  | 141501   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00198  |
|    n_updates        | 22875    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 2036     |
|    fps              | 622      |
|    time_elapsed     | 227      |
|    total timesteps  | 141845   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.005    |
|    n_updates        | 22961    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 2108     |
|    fps              | 610      |
|    time_elapsed     | 240      |
|    total timesteps  | 146911   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00483  |
|    n_updates        | 24227    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 2112     |
|    fps              | 610      |
|    time_elapsed     | 241      |
|    total timesteps  | 147113   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00531  |
|    n_updates        | 24278    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 2184     |
|    fps              | 601      |
|    time_elapsed     | 251      |
|    total timesteps  | 151443   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.586    |
|    n_updates        | 25360    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 2188     |
|    fps              | 601      |
|    time_elapsed     | 252      |
|    total timesteps  | 151732   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.544    |
|    n_updates        | 25432    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 2260     |
|    fps              | 592      |
|    time_elapsed     | 264      |
|    total timesteps  | 156570   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.563    |
|    n_updates        | 26642    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 2264     |
|    fps              | 591      |
|    time_elapsed     | 265      |
|    total timesteps  | 157030   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.554    |
|    n_updates        | 26757    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 2336     |
|    fps              | 583      |
|    time_elapsed     | 277      |
|    total timesteps  | 161798   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00448  |
|    n_updates        | 27949    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 2340     |
|    fps              | 583      |
|    time_elapsed     | 278      |
|    total timesteps  | 162281   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0187   |
|    n_updates        | 28070    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 2412     |
|    fps              | 575      |
|    time_elapsed     | 290      |
|    total timesteps  | 167171   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0134   |
|    n_updates        | 29292    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 2416     |
|    fps              | 575      |
|    time_elapsed     | 290      |
|    total timesteps  | 167306   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.511    |
|    n_updates        | 29326    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 2488     |
|    fps              | 568      |
|    time_elapsed     | 305      |
|    total timesteps  | 173274   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.71     |
|    n_updates        | 30818    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 2492     |
|    fps              | 567      |
|    time_elapsed     | 306      |
|    total timesteps  | 173802   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00427  |
|    n_updates        | 30950    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 2564     |
|    fps              | 560      |
|    time_elapsed     | 320      |
|    total timesteps  | 179373   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0031   |
|    n_updates        | 32343    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 2568     |
|    fps              | 560      |
|    time_elapsed     | 320      |
|    total timesteps  | 179711   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0046   |
|    n_updates        | 32427    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 2640     |
|    fps              | 552      |
|    time_elapsed     | 337      |
|    total timesteps  | 186486   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00421  |
|    n_updates        | 34121    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 2644     |
|    fps              | 552      |
|    time_elapsed     | 337      |
|    total timesteps  | 186586   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.656    |
|    n_updates        | 34146    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 2716     |
|    fps              | 546      |
|    time_elapsed     | 351      |
|    total timesteps  | 192361   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.716    |
|    n_updates        | 35590    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 2720     |
|    fps              | 546      |
|    time_elapsed     | 352      |
|    total timesteps  | 192702   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00267  |
|    n_updates        | 35675    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 2792     |
|    fps              | 542      |
|    time_elapsed     | 363      |
|    total timesteps  | 197194   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.691    |
|    n_updates        | 36798    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 2796     |
|    fps              | 542      |
|    time_elapsed     | 364      |
|    total timesteps  | 197525   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.06     |
|    n_updates        | 36881    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 2868     |
|    fps              | 538      |
|    time_elapsed     | 375      |
|    total timesteps  | 202343   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00603  |
|    n_updates        | 38085    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 2872     |
|    fps              | 538      |
|    time_elapsed     | 376      |
|    total timesteps  | 202546   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.699    |
|    n_updates        | 38136    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 2944     |
|    fps              | 534      |
|    time_elapsed     | 387      |
|    total timesteps  | 207367   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.034    |
|    n_updates        | 39341    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 2948     |
|    fps              | 534      |
|    time_elapsed     | 388      |
|    total timesteps  | 207718   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.696    |
|    n_updates        | 39429    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 3020     |
|    fps              | 529      |
|    time_elapsed     | 401      |
|    total timesteps  | 212697   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0248   |
|    n_updates        | 40674    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 3024     |
|    fps              | 529      |
|    time_elapsed     | 402      |
|    total timesteps  | 212977   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.29     |
|    n_updates        | 40744    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 3096     |
|    fps              | 526      |
|    time_elapsed     | 412      |
|    total timesteps  | 217032   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0968   |
|    n_updates        | 41757    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 3100     |
|    fps              | 525      |
|    time_elapsed     | 413      |
|    total timesteps  | 217320   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.647    |
|    n_updates        | 41829    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 3172     |
|    fps              | 522      |
|    time_elapsed     | 424      |
|    total timesteps  | 221814   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.762    |
|    n_updates        | 42953    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 3176     |
|    fps              | 522      |
|    time_elapsed     | 425      |
|    total timesteps  | 222033   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0595   |
|    n_updates        | 43008    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 3248     |
|    fps              | 519      |
|    time_elapsed     | 434      |
|    total timesteps  | 225946   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0146   |
|    n_updates        | 43986    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 3252     |
|    fps              | 519      |
|    time_elapsed     | 434      |
|    total timesteps  | 226066   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.662    |
|    n_updates        | 44016    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 3324     |
|    fps              | 516      |
|    time_elapsed     | 446      |
|    total timesteps  | 230806   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00593  |
|    n_updates        | 45201    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 3328     |
|    fps              | 516      |
|    time_elapsed     | 446      |
|    total timesteps  | 230993   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00418  |
|    n_updates        | 45248    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 3400     |
|    fps              | 513      |
|    time_elapsed     | 460      |
|    total timesteps  | 236354   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.389    |
|    n_updates        | 46588    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 3404     |
|    fps              | 513      |
|    time_elapsed     | 460      |
|    total timesteps  | 236575   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.648    |
|    n_updates        | 46643    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 3476     |
|    fps              | 510      |
|    time_elapsed     | 471      |
|    total timesteps  | 240982   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.898    |
|    n_updates        | 47745    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 3480     |
|    fps              | 510      |
|    time_elapsed     | 472      |
|    total timesteps  | 241198   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0729   |
|    n_updates        | 47799    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 3552     |
|    fps              | 508      |
|    time_elapsed     | 483      |
|    total timesteps  | 245841   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.833    |
|    n_updates        | 48960    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 3556     |
|    fps              | 508      |
|    time_elapsed     | 484      |
|    total timesteps  | 246249   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00415  |
|    n_updates        | 49062    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 3628     |
|    fps              | 505      |
|    time_elapsed     | 495      |
|    total timesteps  | 250746   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00708  |
|    n_updates        | 50186    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 3632     |
|    fps              | 505      |
|    time_elapsed     | 495      |
|    total timesteps  | 250798   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.77     |
|    n_updates        | 50199    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 3704     |
|    fps              | 503      |
|    time_elapsed     | 505      |
|    total timesteps  | 254881   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.182    |
|    n_updates        | 51220    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 3708     |
|    fps              | 503      |
|    time_elapsed     | 506      |
|    total timesteps  | 255065   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.778    |
|    n_updates        | 51266    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 3780     |
|    fps              | 501      |
|    time_elapsed     | 517      |
|    total timesteps  | 259734   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.664    |
|    n_updates        | 52433    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 3784     |
|    fps              | 501      |
|    time_elapsed     | 519      |
|    total timesteps  | 260247   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0092   |
|    n_updates        | 52561    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 3856     |
|    fps              | 499      |
|    time_elapsed     | 529      |
|    total timesteps  | 264437   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0119   |
|    n_updates        | 53609    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 3860     |
|    fps              | 499      |
|    time_elapsed     | 529      |
|    total timesteps  | 264571   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.82     |
|    n_updates        | 53642    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 3932     |
|    fps              | 498      |
|    time_elapsed     | 537      |
|    total timesteps  | 267724   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00534  |
|    n_updates        | 54430    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 3936     |
|    fps              | 497      |
|    time_elapsed     | 537      |
|    total timesteps  | 267906   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0059   |
|    n_updates        | 54476    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 4008     |
|    fps              | 496      |
|    time_elapsed     | 548      |
|    total timesteps  | 272208   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.32     |
|    n_updates        | 55551    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 4012     |
|    fps              | 496      |
|    time_elapsed     | 548      |
|    total timesteps  | 272273   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0046   |
|    n_updates        | 55568    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 4084     |
|    fps              | 495      |
|    time_elapsed     | 558      |
|    total timesteps  | 276474   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00618  |
|    n_updates        | 56618    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 4088     |
|    fps              | 494      |
|    time_elapsed     | 559      |
|    total timesteps  | 276722   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0138   |
|    n_updates        | 56680    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 4160     |
|    fps              | 493      |
|    time_elapsed     | 570      |
|    total timesteps  | 281395   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00411  |
|    n_updates        | 57848    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 4164     |
|    fps              | 493      |
|    time_elapsed     | 571      |
|    total timesteps  | 281708   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0044   |
|    n_updates        | 57926    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 4236     |
|    fps              | 491      |
|    time_elapsed     | 580      |
|    total timesteps  | 285670   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00469  |
|    n_updates        | 58917    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 4240     |
|    fps              | 491      |
|    time_elapsed     | 581      |
|    total timesteps  | 285864   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.318    |
|    n_updates        | 58965    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 4312     |
|    fps              | 490      |
|    time_elapsed     | 589      |
|    total timesteps  | 289195   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00344  |
|    n_updates        | 59798    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 4316     |
|    fps              | 490      |
|    time_elapsed     | 589      |
|    total timesteps  | 289461   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00474  |
|    n_updates        | 59865    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 4388     |
|    fps              | 489      |
|    time_elapsed     | 601      |
|    total timesteps  | 294212   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.79     |
|    n_updates        | 61052    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 4392     |
|    fps              | 489      |
|    time_elapsed     | 601      |
|    total timesteps  | 294226   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0875   |
|    n_updates        | 61056    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 4464     |
|    fps              | 488      |
|    time_elapsed     | 610      |
|    total timesteps  | 297874   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.103    |
|    n_updates        | 61968    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 4468     |
|    fps              | 488      |
|    time_elapsed     | 610      |
|    total timesteps  | 298078   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00605  |
|    n_updates        | 62019    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 4540     |
|    fps              | 487      |
|    time_elapsed     | 619      |
|    total timesteps  | 301598   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0103   |
|    n_updates        | 62899    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 4544     |
|    fps              | 487      |
|    time_elapsed     | 619      |
|    total timesteps  | 301814   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.725    |
|    n_updates        | 62953    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 4616     |
|    fps              | 485      |
|    time_elapsed     | 631      |
|    total timesteps  | 306593   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.181    |
|    n_updates        | 64148    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 4620     |
|    fps              | 485      |
|    time_elapsed     | 631      |
|    total timesteps  | 306905   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00815  |
|    n_updates        | 64226    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 4692     |
|    fps              | 484      |
|    time_elapsed     | 640      |
|    total timesteps  | 310273   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.271    |
|    n_updates        | 65068    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 4696     |
|    fps              | 484      |
|    time_elapsed     | 640      |
|    total timesteps  | 310371   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.964    |
|    n_updates        | 65092    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 4768     |
|    fps              | 483      |
|    time_elapsed     | 649      |
|    total timesteps  | 314318   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.135    |
|    n_updates        | 66079    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 4772     |
|    fps              | 483      |
|    time_elapsed     | 650      |
|    total timesteps  | 314616   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0134   |
|    n_updates        | 66153    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 4844     |
|    fps              | 482      |
|    time_elapsed     | 660      |
|    total timesteps  | 318598   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00739  |
|    n_updates        | 67149    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 4848     |
|    fps              | 482      |
|    time_elapsed     | 660      |
|    total timesteps  | 318722   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0094   |
|    n_updates        | 67180    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 4920     |
|    fps              | 481      |
|    time_elapsed     | 670      |
|    total timesteps  | 322881   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.92     |
|    n_updates        | 68220    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 4924     |
|    fps              | 481      |
|    time_elapsed     | 670      |
|    total timesteps  | 323047   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.19     |
|    n_updates        | 68261    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 4996     |
|    fps              | 480      |
|    time_elapsed     | 679      |
|    total timesteps  | 326390   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00737  |
|    n_updates        | 69097    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 5000     |
|    fps              | 480      |
|    time_elapsed     | 679      |
|    total timesteps  | 326521   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.745    |
|    n_updates        | 69130    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 5072     |
|    fps              | 479      |
|    time_elapsed     | 689      |
|    total timesteps  | 330758   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0177   |
|    n_updates        | 70189    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 5076     |
|    fps              | 479      |
|    time_elapsed     | 689      |
|    total timesteps  | 330822   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.957    |
|    n_updates        | 70205    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 5148     |
|    fps              | 478      |
|    time_elapsed     | 697      |
|    total timesteps  | 334099   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00922  |
|    n_updates        | 71024    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 5152     |
|    fps              | 478      |
|    time_elapsed     | 698      |
|    total timesteps  | 334325   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.897    |
|    n_updates        | 71081    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 5224     |
|    fps              | 478      |
|    time_elapsed     | 706      |
|    total timesteps  | 337677   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.171    |
|    n_updates        | 71919    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 5228     |
|    fps              | 477      |
|    time_elapsed     | 706      |
|    total timesteps  | 337773   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00586  |
|    n_updates        | 71943    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 5300     |
|    fps              | 477      |
|    time_elapsed     | 715      |
|    total timesteps  | 341497   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.214    |
|    n_updates        | 72874    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 5304     |
|    fps              | 477      |
|    time_elapsed     | 715      |
|    total timesteps  | 341541   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0169   |
|    n_updates        | 72885    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 5376     |
|    fps              | 476      |
|    time_elapsed     | 723      |
|    total timesteps  | 344879   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00805  |
|    n_updates        | 73719    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 5380     |
|    fps              | 476      |
|    time_elapsed     | 724      |
|    total timesteps  | 345033   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.91     |
|    n_updates        | 73758    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 5452     |
|    fps              | 475      |
|    time_elapsed     | 732      |
|    total timesteps  | 348233   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.766    |
|    n_updates        | 74558    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 5456     |
|    fps              | 475      |
|    time_elapsed     | 732      |
|    total timesteps  | 348274   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.982    |
|    n_updates        | 74568    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 5528     |
|    fps              | 474      |
|    time_elapsed     | 740      |
|    total timesteps  | 351519   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.011    |
|    n_updates        | 75379    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 5532     |
|    fps              | 474      |
|    time_elapsed     | 741      |
|    total timesteps  | 352084   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00751  |
|    n_updates        | 75520    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 5604     |
|    fps              | 474      |
|    time_elapsed     | 748      |
|    total timesteps  | 355029   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.976    |
|    n_updates        | 76257    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 5608     |
|    fps              | 474      |
|    time_elapsed     | 749      |
|    total timesteps  | 355386   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0154   |
|    n_updates        | 76346    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 5680     |
|    fps              | 473      |
|    time_elapsed     | 759      |
|    total timesteps  | 359365   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00626  |
|    n_updates        | 77341    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 5684     |
|    fps              | 473      |
|    time_elapsed     | 759      |
|    total timesteps  | 359453   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.321    |
|    n_updates        | 77363    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 5756     |
|    fps              | 472      |
|    time_elapsed     | 768      |
|    total timesteps  | 363035   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.979    |
|    n_updates        | 78258    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 5760     |
|    fps              | 472      |
|    time_elapsed     | 768      |
|    total timesteps  | 363069   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.01     |
|    n_updates        | 78267    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 5832     |
|    fps              | 471      |
|    time_elapsed     | 778      |
|    total timesteps  | 367223   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00639  |
|    n_updates        | 79305    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 5836     |
|    fps              | 471      |
|    time_elapsed     | 778      |
|    total timesteps  | 367323   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.76     |
|    n_updates        | 79330    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 5908     |
|    fps              | 471      |
|    time_elapsed     | 784      |
|    total timesteps  | 369954   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00461  |
|    n_updates        | 79988    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 5912     |
|    fps              | 471      |
|    time_elapsed     | 785      |
|    total timesteps  | 370016   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.809    |
|    n_updates        | 80003    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 5984     |
|    fps              | 470      |
|    time_elapsed     | 791      |
|    total timesteps  | 372710   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00384  |
|    n_updates        | 80677    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 5988     |
|    fps              | 470      |
|    time_elapsed     | 792      |
|    total timesteps  | 373000   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.02     |
|    n_updates        | 80749    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 6060     |
|    fps              | 470      |
|    time_elapsed     | 798      |
|    total timesteps  | 375376   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 2.13     |
|    n_updates        | 81343    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 6064     |
|    fps              | 470      |
|    time_elapsed     | 798      |
|    total timesteps  | 375592   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0077   |
|    n_updates        | 81397    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 6136     |
|    fps              | 469      |
|    time_elapsed     | 805      |
|    total timesteps  | 378142   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.77     |
|    n_updates        | 82035    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 6140     |
|    fps              | 469      |
|    time_elapsed     | 805      |
|    total timesteps  | 378419   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.381    |
|    n_updates        | 82104    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 6212     |
|    fps              | 468      |
|    time_elapsed     | 815      |
|    total timesteps  | 382167   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.02     |
|    n_updates        | 83041    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 6216     |
|    fps              | 468      |
|    time_elapsed     | 815      |
|    total timesteps  | 382232   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.131    |
|    n_updates        | 83057    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 6288     |
|    fps              | 467      |
|    time_elapsed     | 824      |
|    total timesteps  | 386048   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.011    |
|    n_updates        | 84011    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 6292     |
|    fps              | 467      |
|    time_elapsed     | 825      |
|    total timesteps  | 386112   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0055   |
|    n_updates        | 84027    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 6364     |
|    fps              | 467      |
|    time_elapsed     | 835      |
|    total timesteps  | 390394   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 2        |
|    n_updates        | 85098    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 6368     |
|    fps              | 467      |
|    time_elapsed     | 836      |
|    total timesteps  | 390739   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.34     |
|    n_updates        | 85184    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 6440     |
|    fps              | 466      |
|    time_elapsed     | 844      |
|    total timesteps  | 394146   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.05     |
|    n_updates        | 86036    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 6444     |
|    fps              | 466      |
|    time_elapsed     | 845      |
|    total timesteps  | 394603   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 2.08     |
|    n_updates        | 86150    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 6516     |
|    fps              | 465      |
|    time_elapsed     | 854      |
|    total timesteps  | 398162   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.686    |
|    n_updates        | 87040    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 6520     |
|    fps              | 465      |
|    time_elapsed     | 855      |
|    total timesteps  | 398425   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0183   |
|    n_updates        | 87106    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 6592     |
|    fps              | 464      |
|    time_elapsed     | 865      |
|    total timesteps  | 402523   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.05     |
|    n_updates        | 88130    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 6596     |
|    fps              | 464      |
|    time_elapsed     | 866      |
|    total timesteps  | 402616   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00415  |
|    n_updates        | 88153    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 6668     |
|    fps              | 464      |
|    time_elapsed     | 872      |
|    total timesteps  | 405314   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0121   |
|    n_updates        | 88828    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 6672     |
|    fps              | 464      |
|    time_elapsed     | 873      |
|    total timesteps  | 405350   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.06     |
|    n_updates        | 88837    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 6744     |
|    fps              | 463      |
|    time_elapsed     | 883      |
|    total timesteps  | 409513   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00413  |
|    n_updates        | 89878    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 6748     |
|    fps              | 463      |
|    time_elapsed     | 883      |
|    total timesteps  | 409583   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.73     |
|    n_updates        | 89895    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 6820     |
|    fps              | 462      |
|    time_elapsed     | 893      |
|    total timesteps  | 413514   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.428    |
|    n_updates        | 90878    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 6824     |
|    fps              | 462      |
|    time_elapsed     | 894      |
|    total timesteps  | 413714   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.806    |
|    n_updates        | 90928    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 6896     |
|    fps              | 462      |
|    time_elapsed     | 902      |
|    total timesteps  | 417107   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00746  |
|    n_updates        | 91776    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 6900     |
|    fps              | 462      |
|    time_elapsed     | 902      |
|    total timesteps  | 417293   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.271    |
|    n_updates        | 91823    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 6972     |
|    fps              | 461      |
|    time_elapsed     | 912      |
|    total timesteps  | 421102   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00695  |
|    n_updates        | 92775    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 6976     |
|    fps              | 461      |
|    time_elapsed     | 912      |
|    total timesteps  | 421170   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.09     |
|    n_updates        | 92792    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 7048     |
|    fps              | 461      |
|    time_elapsed     | 918      |
|    total timesteps  | 423528   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.706    |
|    n_updates        | 93381    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 7052     |
|    fps              | 461      |
|    time_elapsed     | 918      |
|    total timesteps  | 423717   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 2.63     |
|    n_updates        | 93429    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 7124     |
|    fps              | 460      |
|    time_elapsed     | 927      |
|    total timesteps  | 427057   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.22     |
|    n_updates        | 94264    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 7128     |
|    fps              | 460      |
|    time_elapsed     | 927      |
|    total timesteps  | 427197   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.458    |
|    n_updates        | 94299    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 7200     |
|    fps              | 460      |
|    time_elapsed     | 934      |
|    total timesteps  | 430018   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0829   |
|    n_updates        | 95004    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 7204     |
|    fps              | 460      |
|    time_elapsed     | 934      |
|    total timesteps  | 430137   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.487    |
|    n_updates        | 95034    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 7276     |
|    fps              | 459      |
|    time_elapsed     | 943      |
|    total timesteps  | 433576   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.1      |
|    n_updates        | 95893    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 7280     |
|    fps              | 459      |
|    time_elapsed     | 944      |
|    total timesteps  | 433861   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.1      |
|    n_updates        | 95965    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 7352     |
|    fps              | 459      |
|    time_elapsed     | 950      |
|    total timesteps  | 436630   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.11     |
|    n_updates        | 96657    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 7356     |
|    fps              | 459      |
|    time_elapsed     | 951      |
|    total timesteps  | 436987   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.831    |
|    n_updates        | 96746    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 7428     |
|    fps              | 458      |
|    time_elapsed     | 961      |
|    total timesteps  | 440987   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0401   |
|    n_updates        | 97746    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 7432     |
|    fps              | 458      |
|    time_elapsed     | 961      |
|    total timesteps  | 441038   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.11     |
|    n_updates        | 97759    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 7504     |
|    fps              | 458      |
|    time_elapsed     | 968      |
|    total timesteps  | 443832   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.332    |
|    n_updates        | 98457    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 7508     |
|    fps              | 458      |
|    time_elapsed     | 968      |
|    total timesteps  | 443868   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.6      |
|    n_updates        | 98466    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 7580     |
|    fps              | 457      |
|    time_elapsed     | 977      |
|    total timesteps  | 447218   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0135   |
|    n_updates        | 99304    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 7584     |
|    fps              | 457      |
|    time_elapsed     | 978      |
|    total timesteps  | 447510   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.114    |
|    n_updates        | 99377    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 7656     |
|    fps              | 456      |
|    time_elapsed     | 984      |
|    total timesteps  | 449902   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0114   |
|    n_updates        | 99975    |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 7660     |
|    fps              | 456      |
|    time_elapsed     | 985      |
|    total timesteps  | 450182   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.63     |
|    n_updates        | 100045   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 7732     |
|    fps              | 456      |
|    time_elapsed     | 994      |
|    total timesteps  | 454041   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0104   |
|    n_updates        | 101010   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 7736     |
|    fps              | 456      |
|    time_elapsed     | 995      |
|    total timesteps  | 454344   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.13     |
|    n_updates        | 101085   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 7808     |
|    fps              | 455      |
|    time_elapsed     | 1003     |
|    total timesteps  | 457612   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.752    |
|    n_updates        | 101902   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 7812     |
|    fps              | 455      |
|    time_elapsed     | 1004     |
|    total timesteps  | 457798   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00825  |
|    n_updates        | 101949   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 7884     |
|    fps              | 455      |
|    time_elapsed     | 1010     |
|    total timesteps  | 460464   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0183   |
|    n_updates        | 102615   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 7888     |
|    fps              | 455      |
|    time_elapsed     | 1012     |
|    total timesteps  | 460958   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0171   |
|    n_updates        | 102739   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 7960     |
|    fps              | 455      |
|    time_elapsed     | 1018     |
|    total timesteps  | 463466   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.11     |
|    n_updates        | 103366   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 7964     |
|    fps              | 455      |
|    time_elapsed     | 1018     |
|    total timesteps  | 463657   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00709  |
|    n_updates        | 103414   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 8036     |
|    fps              | 454      |
|    time_elapsed     | 1025     |
|    total timesteps  | 466269   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00362  |
|    n_updates        | 104067   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 8040     |
|    fps              | 454      |
|    time_elapsed     | 1025     |
|    total timesteps  | 466338   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0105   |
|    n_updates        | 104084   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 8112     |
|    fps              | 454      |
|    time_elapsed     | 1033     |
|    total timesteps  | 469353   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00648  |
|    n_updates        | 104838   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 8116     |
|    fps              | 454      |
|    time_elapsed     | 1033     |
|    total timesteps  | 469499   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.747    |
|    n_updates        | 104874   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 8188     |
|    fps              | 453      |
|    time_elapsed     | 1038     |
|    total timesteps  | 471405   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0327   |
|    n_updates        | 105351   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 8192     |
|    fps              | 453      |
|    time_elapsed     | 1038     |
|    total timesteps  | 471459   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.396    |
|    n_updates        | 105364   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 8264     |
|    fps              | 453      |
|    time_elapsed     | 1044     |
|    total timesteps  | 473814   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.798    |
|    n_updates        | 105953   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 8268     |
|    fps              | 453      |
|    time_elapsed     | 1044     |
|    total timesteps  | 473970   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.82     |
|    n_updates        | 105992   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 8340     |
|    fps              | 453      |
|    time_elapsed     | 1052     |
|    total timesteps  | 476965   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00968  |
|    n_updates        | 106741   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 8344     |
|    fps              | 453      |
|    time_elapsed     | 1052     |
|    total timesteps  | 477100   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.1      |
|    n_updates        | 106774   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 8416     |
|    fps              | 452      |
|    time_elapsed     | 1062     |
|    total timesteps  | 481085   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0197   |
|    n_updates        | 107771   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 8420     |
|    fps              | 452      |
|    time_elapsed     | 1062     |
|    total timesteps  | 481142   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0135   |
|    n_updates        | 107785   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 8492     |
|    fps              | 452      |
|    time_elapsed     | 1072     |
|    total timesteps  | 485105   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00803  |
|    n_updates        | 108776   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 8496     |
|    fps              | 452      |
|    time_elapsed     | 1072     |
|    total timesteps  | 485318   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 3.02     |
|    n_updates        | 108829   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 8568     |
|    fps              | 451      |
|    time_elapsed     | 1082     |
|    total timesteps  | 489121   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.421    |
|    n_updates        | 109780   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 8572     |
|    fps              | 451      |
|    time_elapsed     | 1082     |
|    total timesteps  | 489290   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.656    |
|    n_updates        | 109822   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 8644     |
|    fps              | 451      |
|    time_elapsed     | 1089     |
|    total timesteps  | 492169   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.17     |
|    n_updates        | 110542   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 8648     |
|    fps              | 451      |
|    time_elapsed     | 1089     |
|    total timesteps  | 492188   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.542    |
|    n_updates        | 110546   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 8720     |
|    fps              | 451      |
|    time_elapsed     | 1096     |
|    total timesteps  | 495140   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.21     |
|    n_updates        | 111284   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 8724     |
|    fps              | 451      |
|    time_elapsed     | 1098     |
|    total timesteps  | 495936   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.61     |
|    n_updates        | 111483   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 8796     |
|    fps              | 451      |
|    time_elapsed     | 1105     |
|    total timesteps  | 498685   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0163   |
|    n_updates        | 112171   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 8800     |
|    fps              | 451      |
|    time_elapsed     | 1105     |
|    total timesteps  | 498714   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.557    |
|    n_updates        | 112178   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 8872     |
|    fps              | 450      |
|    time_elapsed     | 1114     |
|    total timesteps  | 502063   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.21     |
|    n_updates        | 113015   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 8876     |
|    fps              | 450      |
|    time_elapsed     | 1114     |
|    total timesteps  | 502201   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0239   |
|    n_updates        | 113050   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 8948     |
|    fps              | 450      |
|    time_elapsed     | 1122     |
|    total timesteps  | 505338   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.74     |
|    n_updates        | 113834   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 8952     |
|    fps              | 450      |
|    time_elapsed     | 1122     |
|    total timesteps  | 505485   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0119   |
|    n_updates        | 113871   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 9024     |
|    fps              | 449      |
|    time_elapsed     | 1130     |
|    total timesteps  | 508705   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0102   |
|    n_updates        | 114676   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 9028     |
|    fps              | 449      |
|    time_elapsed     | 1132     |
|    total timesteps  | 509158   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.288    |
|    n_updates        | 114789   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 9100     |
|    fps              | 449      |
|    time_elapsed     | 1140     |
|    total timesteps  | 512345   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0107   |
|    n_updates        | 115586   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 9104     |
|    fps              | 449      |
|    time_elapsed     | 1140     |
|    total timesteps  | 512381   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0199   |
|    n_updates        | 115595   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 9176     |
|    fps              | 448      |
|    time_elapsed     | 1148     |
|    total timesteps  | 515592   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00835  |
|    n_updates        | 116397   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 9180     |
|    fps              | 448      |
|    time_elapsed     | 1148     |
|    total timesteps  | 515726   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.2      |
|    n_updates        | 116431   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 9252     |
|    fps              | 448      |
|    time_elapsed     | 1154     |
|    total timesteps  | 518137   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.292    |
|    n_updates        | 117034   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 9256     |
|    fps              | 448      |
|    time_elapsed     | 1154     |
|    total timesteps  | 518160   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.582    |
|    n_updates        | 117039   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 9328     |
|    fps              | 448      |
|    time_elapsed     | 1163     |
|    total timesteps  | 521445   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.304    |
|    n_updates        | 117861   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 9332     |
|    fps              | 448      |
|    time_elapsed     | 1163     |
|    total timesteps  | 521602   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.22     |
|    n_updates        | 117900   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 9404     |
|    fps              | 447      |
|    time_elapsed     | 1170     |
|    total timesteps  | 524462   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00969  |
|    n_updates        | 118615   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 9408     |
|    fps              | 447      |
|    time_elapsed     | 1171     |
|    total timesteps  | 524699   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.37     |
|    n_updates        | 118674   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 9480     |
|    fps              | 447      |
|    time_elapsed     | 1179     |
|    total timesteps  | 527689   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00782  |
|    n_updates        | 119422   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 9484     |
|    fps              | 447      |
|    time_elapsed     | 1180     |
|    total timesteps  | 528140   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00491  |
|    n_updates        | 119534   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 9556     |
|    fps              | 447      |
|    time_elapsed     | 1188     |
|    total timesteps  | 531382   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.58     |
|    n_updates        | 120345   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 9560     |
|    fps              | 447      |
|    time_elapsed     | 1189     |
|    total timesteps  | 531685   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 3.67     |
|    n_updates        | 120421   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 9632     |
|    fps              | 446      |
|    time_elapsed     | 1198     |
|    total timesteps  | 535310   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 2.75     |
|    n_updates        | 121327   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 9636     |
|    fps              | 446      |
|    time_elapsed     | 1198     |
|    total timesteps  | 535441   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.26     |
|    n_updates        | 121360   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 9708     |
|    fps              | 446      |
|    time_elapsed     | 1207     |
|    total timesteps  | 538795   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00522  |
|    n_updates        | 122198   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 9712     |
|    fps              | 446      |
|    time_elapsed     | 1207     |
|    total timesteps  | 538819   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0145   |
|    n_updates        | 122204   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 9784     |
|    fps              | 446      |
|    time_elapsed     | 1215     |
|    total timesteps  | 542278   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0154   |
|    n_updates        | 123069   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 9788     |
|    fps              | 446      |
|    time_elapsed     | 1215     |
|    total timesteps  | 542294   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00792  |
|    n_updates        | 123073   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 9860     |
|    fps              | 445      |
|    time_elapsed     | 1224     |
|    total timesteps  | 545839   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00513  |
|    n_updates        | 123959   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 9864     |
|    fps              | 445      |
|    time_elapsed     | 1225     |
|    total timesteps  | 546015   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 2.46     |
|    n_updates        | 124003   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 9936     |
|    fps              | 445      |
|    time_elapsed     | 1231     |
|    total timesteps  | 548701   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.24     |
|    n_updates        | 124675   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 9940     |
|    fps              | 445      |
|    time_elapsed     | 1232     |
|    total timesteps  | 548794   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0135   |
|    n_updates        | 124698   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 10012    |
|    fps              | 444      |
|    time_elapsed     | 1242     |
|    total timesteps  | 552764   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.505    |
|    n_updates        | 125690   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 10016    |
|    fps              | 444      |
|    time_elapsed     | 1242     |
|    total timesteps  | 553010   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 2.19     |
|    n_updates        | 125752   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 10088    |
|    fps              | 444      |
|    time_elapsed     | 1250     |
|    total timesteps  | 556219   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.191    |
|    n_updates        | 126554   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 10092    |
|    fps              | 444      |
|    time_elapsed     | 1251     |
|    total timesteps  | 556330   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00961  |
|    n_updates        | 126582   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 10164    |
|    fps              | 444      |
|    time_elapsed     | 1260     |
|    total timesteps  | 559869   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.26     |
|    n_updates        | 127467   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 10168    |
|    fps              | 444      |
|    time_elapsed     | 1260     |
|    total timesteps  | 560075   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 2.53     |
|    n_updates        | 127518   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 10240    |
|    fps              | 444      |
|    time_elapsed     | 1266     |
|    total timesteps  | 562626   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.28     |
|    n_updates        | 128156   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 10244    |
|    fps              | 444      |
|    time_elapsed     | 1267     |
|    total timesteps  | 562724   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.157    |
|    n_updates        | 128180   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 10316    |
|    fps              | 443      |
|    time_elapsed     | 1273     |
|    total timesteps  | 565416   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.27     |
|    n_updates        | 128853   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 10320    |
|    fps              | 443      |
|    time_elapsed     | 1274     |
|    total timesteps  | 565565   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.578    |
|    n_updates        | 128891   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 10392    |
|    fps              | 443      |
|    time_elapsed     | 1283     |
|    total timesteps  | 569280   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0131   |
|    n_updates        | 129819   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 10396    |
|    fps              | 443      |
|    time_elapsed     | 1283     |
|    total timesteps  | 569313   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.07     |
|    n_updates        | 129828   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 10468    |
|    fps              | 443      |
|    time_elapsed     | 1292     |
|    total timesteps  | 572745   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.32     |
|    n_updates        | 130686   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 10472    |
|    fps              | 443      |
|    time_elapsed     | 1292     |
|    total timesteps  | 572819   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.117    |
|    n_updates        | 130704   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 10544    |
|    fps              | 442      |
|    time_elapsed     | 1303     |
|    total timesteps  | 577252   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.12     |
|    n_updates        | 131812   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 10548    |
|    fps              | 442      |
|    time_elapsed     | 1304     |
|    total timesteps  | 577526   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 2.6      |
|    n_updates        | 131881   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 10620    |
|    fps              | 442      |
|    time_elapsed     | 1314     |
|    total timesteps  | 581538   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.013    |
|    n_updates        | 132884   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 10624    |
|    fps              | 442      |
|    time_elapsed     | 1315     |
|    total timesteps  | 581740   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.872    |
|    n_updates        | 132934   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 10696    |
|    fps              | 442      |
|    time_elapsed     | 1324     |
|    total timesteps  | 585338   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.21     |
|    n_updates        | 133834   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 10700    |
|    fps              | 442      |
|    time_elapsed     | 1324     |
|    total timesteps  | 585427   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.014    |
|    n_updates        | 133856   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 10772    |
|    fps              | 441      |
|    time_elapsed     | 1333     |
|    total timesteps  | 589137   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.5      |
|    n_updates        | 134784   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 10776    |
|    fps              | 441      |
|    time_elapsed     | 1333     |
|    total timesteps  | 589241   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 2.53     |
|    n_updates        | 134810   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 10848    |
|    fps              | 441      |
|    time_elapsed     | 1343     |
|    total timesteps  | 593031   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0894   |
|    n_updates        | 135757   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 10852    |
|    fps              | 441      |
|    time_elapsed     | 1343     |
|    total timesteps  | 593098   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.33     |
|    n_updates        | 135774   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 10924    |
|    fps              | 441      |
|    time_elapsed     | 1352     |
|    total timesteps  | 596696   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.35     |
|    n_updates        | 136673   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 10928    |
|    fps              | 441      |
|    time_elapsed     | 1352     |
|    total timesteps  | 596809   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.34     |
|    n_updates        | 136702   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 11000    |
|    fps              | 440      |
|    time_elapsed     | 1361     |
|    total timesteps  | 600277   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.54     |
|    n_updates        | 137569   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 11004    |
|    fps              | 440      |
|    time_elapsed     | 1361     |
|    total timesteps  | 600470   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.024    |
|    n_updates        | 137617   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 11076    |
|    fps              | 440      |
|    time_elapsed     | 1371     |
|    total timesteps  | 604201   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0174   |
|    n_updates        | 138550   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 11080    |
|    fps              | 440      |
|    time_elapsed     | 1371     |
|    total timesteps  | 604494   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00582  |
|    n_updates        | 138623   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 11152    |
|    fps              | 440      |
|    time_elapsed     | 1378     |
|    total timesteps  | 607251   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0151   |
|    n_updates        | 139312   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 11156    |
|    fps              | 440      |
|    time_elapsed     | 1379     |
|    total timesteps  | 607420   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0128   |
|    n_updates        | 139354   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 11228    |
|    fps              | 440      |
|    time_elapsed     | 1387     |
|    total timesteps  | 610628   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.778    |
|    n_updates        | 140156   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 11232    |
|    fps              | 440      |
|    time_elapsed     | 1387     |
|    total timesteps  | 610861   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.011    |
|    n_updates        | 140215   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 11304    |
|    fps              | 439      |
|    time_elapsed     | 1398     |
|    total timesteps  | 615204   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0201   |
|    n_updates        | 141300   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 11308    |
|    fps              | 439      |
|    time_elapsed     | 1398     |
|    total timesteps  | 615369   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.301    |
|    n_updates        | 141342   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 11380    |
|    fps              | 439      |
|    time_elapsed     | 1408     |
|    total timesteps  | 619017   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.748    |
|    n_updates        | 142254   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 11384    |
|    fps              | 439      |
|    time_elapsed     | 1408     |
|    total timesteps  | 619113   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.36     |
|    n_updates        | 142278   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 11456    |
|    fps              | 439      |
|    time_elapsed     | 1418     |
|    total timesteps  | 623178   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0093   |
|    n_updates        | 143294   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 11460    |
|    fps              | 439      |
|    time_elapsed     | 1418     |
|    total timesteps  | 623204   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00556  |
|    n_updates        | 143300   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 11532    |
|    fps              | 439      |
|    time_elapsed     | 1428     |
|    total timesteps  | 627025   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0985   |
|    n_updates        | 144256   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 11536    |
|    fps              | 439      |
|    time_elapsed     | 1428     |
|    total timesteps  | 627210   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00946  |
|    n_updates        | 144302   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 11608    |
|    fps              | 438      |
|    time_elapsed     | 1437     |
|    total timesteps  | 630873   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00747  |
|    n_updates        | 145218   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 11612    |
|    fps              | 438      |
|    time_elapsed     | 1438     |
|    total timesteps  | 631326   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.38     |
|    n_updates        | 145331   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 11684    |
|    fps              | 438      |
|    time_elapsed     | 1448     |
|    total timesteps  | 635368   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0143   |
|    n_updates        | 146341   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 11688    |
|    fps              | 438      |
|    time_elapsed     | 1448     |
|    total timesteps  | 635401   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0208   |
|    n_updates        | 146350   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 11760    |
|    fps              | 438      |
|    time_elapsed     | 1459     |
|    total timesteps  | 639662   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.34     |
|    n_updates        | 147415   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 11764    |
|    fps              | 438      |
|    time_elapsed     | 1459     |
|    total timesteps  | 639810   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0118   |
|    n_updates        | 147452   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 11836    |
|    fps              | 437      |
|    time_elapsed     | 1470     |
|    total timesteps  | 643900   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.4      |
|    n_updates        | 148474   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 11840    |
|    fps              | 437      |
|    time_elapsed     | 1471     |
|    total timesteps  | 644224   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.38     |
|    n_updates        | 148555   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 11912    |
|    fps              | 437      |
|    time_elapsed     | 1483     |
|    total timesteps  | 649059   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.38     |
|    n_updates        | 149764   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 11916    |
|    fps              | 437      |
|    time_elapsed     | 1483     |
|    total timesteps  | 649211   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.44     |
|    n_updates        | 149802   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 11988    |
|    fps              | 437      |
|    time_elapsed     | 1490     |
|    total timesteps  | 652023   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 2.59     |
|    n_updates        | 150505   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 11992    |
|    fps              | 437      |
|    time_elapsed     | 1490     |
|    total timesteps  | 652173   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0131   |
|    n_updates        | 150543   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 12064    |
|    fps              | 437      |
|    time_elapsed     | 1503     |
|    total timesteps  | 657391   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.38     |
|    n_updates        | 151847   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 12068    |
|    fps              | 437      |
|    time_elapsed     | 1504     |
|    total timesteps  | 657580   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.019    |
|    n_updates        | 151894   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 12140    |
|    fps              | 436      |
|    time_elapsed     | 1515     |
|    total timesteps  | 662215   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0198   |
|    n_updates        | 153053   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 12144    |
|    fps              | 436      |
|    time_elapsed     | 1516     |
|    total timesteps  | 662653   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0155   |
|    n_updates        | 153163   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 12216    |
|    fps              | 436      |
|    time_elapsed     | 1526     |
|    total timesteps  | 666549   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.019    |
|    n_updates        | 154137   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 12220    |
|    fps              | 436      |
|    time_elapsed     | 1527     |
|    total timesteps  | 666863   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.015    |
|    n_updates        | 154215   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 12292    |
|    fps              | 436      |
|    time_elapsed     | 1539     |
|    total timesteps  | 671771   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0184   |
|    n_updates        | 155442   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 12296    |
|    fps              | 436      |
|    time_elapsed     | 1539     |
|    total timesteps  | 671828   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0212   |
|    n_updates        | 155456   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 12368    |
|    fps              | 435      |
|    time_elapsed     | 1551     |
|    total timesteps  | 676309   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.43     |
|    n_updates        | 156577   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 12372    |
|    fps              | 435      |
|    time_elapsed     | 1551     |
|    total timesteps  | 676468   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 2.2      |
|    n_updates        | 156616   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 12444    |
|    fps              | 435      |
|    time_elapsed     | 1560     |
|    total timesteps  | 680122   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0137   |
|    n_updates        | 157530   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 12448    |
|    fps              | 435      |
|    time_elapsed     | 1561     |
|    total timesteps  | 680225   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0134   |
|    n_updates        | 157556   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 12520    |
|    fps              | 435      |
|    time_elapsed     | 1570     |
|    total timesteps  | 684042   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.44     |
|    n_updates        | 158510   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 12524    |
|    fps              | 435      |
|    time_elapsed     | 1571     |
|    total timesteps  | 684300   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00915  |
|    n_updates        | 158574   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 12596    |
|    fps              | 435      |
|    time_elapsed     | 1584     |
|    total timesteps  | 689438   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0861   |
|    n_updates        | 159859   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 12600    |
|    fps              | 435      |
|    time_elapsed     | 1584     |
|    total timesteps  | 689485   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0196   |
|    n_updates        | 159871   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 12672    |
|    fps              | 434      |
|    time_elapsed     | 1595     |
|    total timesteps  | 693839   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.46     |
|    n_updates        | 160959   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 12676    |
|    fps              | 434      |
|    time_elapsed     | 1596     |
|    total timesteps  | 694101   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00731  |
|    n_updates        | 161025   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 12748    |
|    fps              | 434      |
|    time_elapsed     | 1605     |
|    total timesteps  | 697703   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0037   |
|    n_updates        | 161925   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 12752    |
|    fps              | 434      |
|    time_elapsed     | 1606     |
|    total timesteps  | 698218   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.45     |
|    n_updates        | 162054   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 12824    |
|    fps              | 434      |
|    time_elapsed     | 1617     |
|    total timesteps  | 702719   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00795  |
|    n_updates        | 163179   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 12828    |
|    fps              | 434      |
|    time_elapsed     | 1618     |
|    total timesteps  | 702838   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.52     |
|    n_updates        | 163209   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 12900    |
|    fps              | 434      |
|    time_elapsed     | 1627     |
|    total timesteps  | 706750   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.46     |
|    n_updates        | 164187   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 12904    |
|    fps              | 434      |
|    time_elapsed     | 1628     |
|    total timesteps  | 707083   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.825    |
|    n_updates        | 164270   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 12976    |
|    fps              | 433      |
|    time_elapsed     | 1643     |
|    total timesteps  | 712817   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0623   |
|    n_updates        | 165704   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 12980    |
|    fps              | 433      |
|    time_elapsed     | 1644     |
|    total timesteps  | 713323   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0147   |
|    n_updates        | 165830   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 13052    |
|    fps              | 433      |
|    time_elapsed     | 1654     |
|    total timesteps  | 717180   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00697  |
|    n_updates        | 166794   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 13056    |
|    fps              | 433      |
|    time_elapsed     | 1654     |
|    total timesteps  | 717431   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00987  |
|    n_updates        | 166857   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 13128    |
|    fps              | 433      |
|    time_elapsed     | 1668     |
|    total timesteps  | 722841   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.5      |
|    n_updates        | 168210   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 13132    |
|    fps              | 433      |
|    time_elapsed     | 1669     |
|    total timesteps  | 723038   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.42     |
|    n_updates        | 168259   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 13204    |
|    fps              | 432      |
|    time_elapsed     | 1679     |
|    total timesteps  | 727302   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.53     |
|    n_updates        | 169325   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 13208    |
|    fps              | 432      |
|    time_elapsed     | 1680     |
|    total timesteps  | 727634   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 2.99     |
|    n_updates        | 169408   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 13280    |
|    fps              | 432      |
|    time_elapsed     | 1689     |
|    total timesteps  | 731128   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0193   |
|    n_updates        | 170281   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 13284    |
|    fps              | 432      |
|    time_elapsed     | 1689     |
|    total timesteps  | 731251   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.48     |
|    n_updates        | 170312   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 13356    |
|    fps              | 432      |
|    time_elapsed     | 1701     |
|    total timesteps  | 735923   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 3.04     |
|    n_updates        | 171480   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 13360    |
|    fps              | 432      |
|    time_elapsed     | 1701     |
|    total timesteps  | 736102   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00883  |
|    n_updates        | 171525   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 13432    |
|    fps              | 432      |
|    time_elapsed     | 1715     |
|    total timesteps  | 741297   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.56     |
|    n_updates        | 172824   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 13436    |
|    fps              | 432      |
|    time_elapsed     | 1716     |
|    total timesteps  | 741970   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0171   |
|    n_updates        | 172992   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 13508    |
|    fps              | 431      |
|    time_elapsed     | 1727     |
|    total timesteps  | 746177   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0288   |
|    n_updates        | 174044   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 13512    |
|    fps              | 431      |
|    time_elapsed     | 1727     |
|    total timesteps  | 746193   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00885  |
|    n_updates        | 174048   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 13584    |
|    fps              | 431      |
|    time_elapsed     | 1741     |
|    total timesteps  | 751586   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0108   |
|    n_updates        | 175396   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 13588    |
|    fps              | 431      |
|    time_elapsed     | 1741     |
|    total timesteps  | 751822   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.51     |
|    n_updates        | 175455   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 13660    |
|    fps              | 431      |
|    time_elapsed     | 1753     |
|    total timesteps  | 756565   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00802  |
|    n_updates        | 176641   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 13664    |
|    fps              | 431      |
|    time_elapsed     | 1754     |
|    total timesteps  | 756936   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00588  |
|    n_updates        | 176733   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 13736    |
|    fps              | 431      |
|    time_elapsed     | 1762     |
|    total timesteps  | 760001   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.112    |
|    n_updates        | 177500   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 13740    |
|    fps              | 431      |
|    time_elapsed     | 1763     |
|    total timesteps  | 760296   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0135   |
|    n_updates        | 177573   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 13812    |
|    fps              | 430      |
|    time_elapsed     | 1775     |
|    total timesteps  | 765065   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00704  |
|    n_updates        | 178766   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 13816    |
|    fps              | 430      |
|    time_elapsed     | 1775     |
|    total timesteps  | 765098   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.49     |
|    n_updates        | 178774   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 13888    |
|    fps              | 430      |
|    time_elapsed     | 1785     |
|    total timesteps  | 769359   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.278    |
|    n_updates        | 179839   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 13892    |
|    fps              | 430      |
|    time_elapsed     | 1787     |
|    total timesteps  | 769995   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.5      |
|    n_updates        | 179998   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 13964    |
|    fps              | 430      |
|    time_elapsed     | 1800     |
|    total timesteps  | 775360   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 3.14     |
|    n_updates        | 181339   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 13968    |
|    fps              | 430      |
|    time_elapsed     | 1801     |
|    total timesteps  | 775460   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0134   |
|    n_updates        | 181364   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 14040    |
|    fps              | 430      |
|    time_elapsed     | 1812     |
|    total timesteps  | 779786   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00694  |
|    n_updates        | 182446   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 14044    |
|    fps              | 430      |
|    time_elapsed     | 1812     |
|    total timesteps  | 779887   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00509  |
|    n_updates        | 182471   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 14116    |
|    fps              | 430      |
|    time_elapsed     | 1823     |
|    total timesteps  | 784477   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00713  |
|    n_updates        | 183619   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 14120    |
|    fps              | 430      |
|    time_elapsed     | 1823     |
|    total timesteps  | 784563   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0141   |
|    n_updates        | 183640   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 14192    |
|    fps              | 429      |
|    time_elapsed     | 1836     |
|    total timesteps  | 789490   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 2.81     |
|    n_updates        | 184872   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 14196    |
|    fps              | 429      |
|    time_elapsed     | 1837     |
|    total timesteps  | 789693   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.012    |
|    n_updates        | 184923   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 14268    |
|    fps              | 429      |
|    time_elapsed     | 1846     |
|    total timesteps  | 793516   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0144   |
|    n_updates        | 185878   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 14272    |
|    fps              | 429      |
|    time_elapsed     | 1847     |
|    total timesteps  | 793607   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 3.15     |
|    n_updates        | 185901   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 14344    |
|    fps              | 429      |
|    time_elapsed     | 1856     |
|    total timesteps  | 797398   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 3.15     |
|    n_updates        | 186849   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 14348    |
|    fps              | 429      |
|    time_elapsed     | 1856     |
|    total timesteps  | 797421   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.59     |
|    n_updates        | 186855   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 14420    |
|    fps              | 429      |
|    time_elapsed     | 1868     |
|    total timesteps  | 802334   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.012    |
|    n_updates        | 188083   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 14424    |
|    fps              | 429      |
|    time_elapsed     | 1870     |
|    total timesteps  | 802965   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0072   |
|    n_updates        | 188241   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 14496    |
|    fps              | 429      |
|    time_elapsed     | 1881     |
|    total timesteps  | 807480   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.61     |
|    n_updates        | 189369   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 14500    |
|    fps              | 429      |
|    time_elapsed     | 1882     |
|    total timesteps  | 807584   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.55     |
|    n_updates        | 189395   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 14572    |
|    fps              | 428      |
|    time_elapsed     | 1896     |
|    total timesteps  | 813178   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00901  |
|    n_updates        | 190794   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 14576    |
|    fps              | 428      |
|    time_elapsed     | 1897     |
|    total timesteps  | 813490   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00578  |
|    n_updates        | 190872   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 14648    |
|    fps              | 428      |
|    time_elapsed     | 1908     |
|    total timesteps  | 817994   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 3.17     |
|    n_updates        | 191998   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 14652    |
|    fps              | 428      |
|    time_elapsed     | 1909     |
|    total timesteps  | 818426   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.44     |
|    n_updates        | 192106   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 14724    |
|    fps              | 428      |
|    time_elapsed     | 1917     |
|    total timesteps  | 821603   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 3.2      |
|    n_updates        | 192900   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 14728    |
|    fps              | 428      |
|    time_elapsed     | 1918     |
|    total timesteps  | 821814   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.64     |
|    n_updates        | 192953   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 14800    |
|    fps              | 428      |
|    time_elapsed     | 1928     |
|    total timesteps  | 826014   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00844  |
|    n_updates        | 194003   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 14804    |
|    fps              | 428      |
|    time_elapsed     | 1929     |
|    total timesteps  | 826417   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00636  |
|    n_updates        | 194104   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 14876    |
|    fps              | 428      |
|    time_elapsed     | 1941     |
|    total timesteps  | 831100   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0101   |
|    n_updates        | 195274   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 14880    |
|    fps              | 428      |
|    time_elapsed     | 1941     |
|    total timesteps  | 831163   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0162   |
|    n_updates        | 195290   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 14952    |
|    fps              | 427      |
|    time_elapsed     | 1953     |
|    total timesteps  | 835757   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00939  |
|    n_updates        | 196439   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 14956    |
|    fps              | 427      |
|    time_elapsed     | 1953     |
|    total timesteps  | 835862   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0103   |
|    n_updates        | 196465   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 15028    |
|    fps              | 427      |
|    time_elapsed     | 1967     |
|    total timesteps  | 841447   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00756  |
|    n_updates        | 197861   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 15032    |
|    fps              | 427      |
|    time_elapsed     | 1968     |
|    total timesteps  | 841634   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.62     |
|    n_updates        | 197908   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 15104    |
|    fps              | 427      |
|    time_elapsed     | 1979     |
|    total timesteps  | 846060   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00909  |
|    n_updates        | 199014   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 15108    |
|    fps              | 427      |
|    time_elapsed     | 1979     |
|    total timesteps  | 846120   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.011    |
|    n_updates        | 199029   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 15180    |
|    fps              | 427      |
|    time_elapsed     | 1995     |
|    total timesteps  | 852285   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0196   |
|    n_updates        | 200571   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 15184    |
|    fps              | 427      |
|    time_elapsed     | 1995     |
|    total timesteps  | 852362   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0104   |
|    n_updates        | 200590   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 15256    |
|    fps              | 427      |
|    time_elapsed     | 2006     |
|    total timesteps  | 856670   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.66     |
|    n_updates        | 201667   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 15260    |
|    fps              | 427      |
|    time_elapsed     | 2006     |
|    total timesteps  | 856978   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00609  |
|    n_updates        | 201744   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 15332    |
|    fps              | 426      |
|    time_elapsed     | 2021     |
|    total timesteps  | 862807   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.67     |
|    n_updates        | 203201   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 15336    |
|    fps              | 426      |
|    time_elapsed     | 2021     |
|    total timesteps  | 862985   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00605  |
|    n_updates        | 203246   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 15408    |
|    fps              | 426      |
|    time_elapsed     | 2034     |
|    total timesteps  | 867952   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 3.25     |
|    n_updates        | 204487   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 15412    |
|    fps              | 426      |
|    time_elapsed     | 2035     |
|    total timesteps  | 868340   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0048   |
|    n_updates        | 204584   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 15484    |
|    fps              | 426      |
|    time_elapsed     | 2046     |
|    total timesteps  | 872913   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0053   |
|    n_updates        | 205728   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 15488    |
|    fps              | 426      |
|    time_elapsed     | 2047     |
|    total timesteps  | 873062   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.019    |
|    n_updates        | 205765   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 15560    |
|    fps              | 426      |
|    time_elapsed     | 2056     |
|    total timesteps  | 876755   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.65     |
|    n_updates        | 206688   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 15564    |
|    fps              | 426      |
|    time_elapsed     | 2057     |
|    total timesteps  | 876919   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.64     |
|    n_updates        | 206729   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 15636    |
|    fps              | 426      |
|    time_elapsed     | 2067     |
|    total timesteps  | 880829   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.64     |
|    n_updates        | 207707   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 15640    |
|    fps              | 426      |
|    time_elapsed     | 2067     |
|    total timesteps  | 880973   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.67     |
|    n_updates        | 207743   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 15712    |
|    fps              | 425      |
|    time_elapsed     | 2078     |
|    total timesteps  | 885399   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0145   |
|    n_updates        | 208849   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 15716    |
|    fps              | 425      |
|    time_elapsed     | 2079     |
|    total timesteps  | 885457   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0122   |
|    n_updates        | 208864   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 15788    |
|    fps              | 425      |
|    time_elapsed     | 2093     |
|    total timesteps  | 891037   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00672  |
|    n_updates        | 210259   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 15792    |
|    fps              | 425      |
|    time_elapsed     | 2093     |
|    total timesteps  | 891187   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00647  |
|    n_updates        | 210296   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 15864    |
|    fps              | 425      |
|    time_elapsed     | 2106     |
|    total timesteps  | 896331   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.7      |
|    n_updates        | 211582   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 15868    |
|    fps              | 425      |
|    time_elapsed     | 2106     |
|    total timesteps  | 896469   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.69     |
|    n_updates        | 211617   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 15940    |
|    fps              | 425      |
|    time_elapsed     | 2119     |
|    total timesteps  | 901331   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0091   |
|    n_updates        | 212832   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 15944    |
|    fps              | 425      |
|    time_elapsed     | 2120     |
|    total timesteps  | 901685   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0172   |
|    n_updates        | 212921   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 16016    |
|    fps              | 425      |
|    time_elapsed     | 2133     |
|    total timesteps  | 907136   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00968  |
|    n_updates        | 214283   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 16020    |
|    fps              | 425      |
|    time_elapsed     | 2134     |
|    total timesteps  | 907274   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 3.35     |
|    n_updates        | 214318   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 16092    |
|    fps              | 424      |
|    time_elapsed     | 2146     |
|    total timesteps  | 912119   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 3.36     |
|    n_updates        | 215529   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 16096    |
|    fps              | 424      |
|    time_elapsed     | 2147     |
|    total timesteps  | 912482   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.65     |
|    n_updates        | 215620   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 16168    |
|    fps              | 424      |
|    time_elapsed     | 2159     |
|    total timesteps  | 917309   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00575  |
|    n_updates        | 216827   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 16172    |
|    fps              | 424      |
|    time_elapsed     | 2160     |
|    total timesteps  | 917455   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.74     |
|    n_updates        | 216863   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 16244    |
|    fps              | 424      |
|    time_elapsed     | 2171     |
|    total timesteps  | 921777   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0205   |
|    n_updates        | 217944   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 16248    |
|    fps              | 424      |
|    time_elapsed     | 2172     |
|    total timesteps  | 922262   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.71     |
|    n_updates        | 218065   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 16320    |
|    fps              | 424      |
|    time_elapsed     | 2181     |
|    total timesteps  | 925939   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00637  |
|    n_updates        | 218984   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 16324    |
|    fps              | 424      |
|    time_elapsed     | 2182     |
|    total timesteps  | 926150   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00668  |
|    n_updates        | 219037   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 16396    |
|    fps              | 424      |
|    time_elapsed     | 2195     |
|    total timesteps  | 931245   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 3.4      |
|    n_updates        | 220311   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 16400    |
|    fps              | 424      |
|    time_elapsed     | 2195     |
|    total timesteps  | 931582   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0101   |
|    n_updates        | 220395   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 16472    |
|    fps              | 424      |
|    time_elapsed     | 2206     |
|    total timesteps  | 935817   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0122   |
|    n_updates        | 221454   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 16476    |
|    fps              | 424      |
|    time_elapsed     | 2207     |
|    total timesteps  | 935948   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0149   |
|    n_updates        | 221486   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 16548    |
|    fps              | 423      |
|    time_elapsed     | 2216     |
|    total timesteps  | 939735   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.72     |
|    n_updates        | 222433   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 16552    |
|    fps              | 423      |
|    time_elapsed     | 2216     |
|    total timesteps  | 939827   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.73     |
|    n_updates        | 222456   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 16624    |
|    fps              | 423      |
|    time_elapsed     | 2229     |
|    total timesteps  | 944837   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00822  |
|    n_updates        | 223709   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 16628    |
|    fps              | 423      |
|    time_elapsed     | 2230     |
|    total timesteps  | 945079   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00581  |
|    n_updates        | 223769   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 16700    |
|    fps              | 423      |
|    time_elapsed     | 2242     |
|    total timesteps  | 950052   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.75     |
|    n_updates        | 225012   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 16704    |
|    fps              | 423      |
|    time_elapsed     | 2243     |
|    total timesteps  | 950508   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.72     |
|    n_updates        | 225126   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 16776    |
|    fps              | 423      |
|    time_elapsed     | 2257     |
|    total timesteps  | 955923   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.7      |
|    n_updates        | 226480   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 16780    |
|    fps              | 423      |
|    time_elapsed     | 2257     |
|    total timesteps  | 956111   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0109   |
|    n_updates        | 226527   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 16852    |
|    fps              | 423      |
|    time_elapsed     | 2269     |
|    total timesteps  | 960974   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.76     |
|    n_updates        | 227743   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 16856    |
|    fps              | 423      |
|    time_elapsed     | 2270     |
|    total timesteps  | 961286   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.69     |
|    n_updates        | 227821   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 16928    |
|    fps              | 423      |
|    time_elapsed     | 2281     |
|    total timesteps  | 965577   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.77     |
|    n_updates        | 228894   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 16932    |
|    fps              | 423      |
|    time_elapsed     | 2281     |
|    total timesteps  | 965893   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0137   |
|    n_updates        | 228973   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 17004    |
|    fps              | 423      |
|    time_elapsed     | 2296     |
|    total timesteps  | 971652   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00707  |
|    n_updates        | 230412   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 17008    |
|    fps              | 423      |
|    time_elapsed     | 2296     |
|    total timesteps  | 971864   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0112   |
|    n_updates        | 230465   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 17080    |
|    fps              | 423      |
|    time_elapsed     | 2307     |
|    total timesteps  | 976073   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00763  |
|    n_updates        | 231518   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 17084    |
|    fps              | 423      |
|    time_elapsed     | 2308     |
|    total timesteps  | 976473   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00824  |
|    n_updates        | 231618   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 17156    |
|    fps              | 422      |
|    time_elapsed     | 2318     |
|    total timesteps  | 980538   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.74     |
|    n_updates        | 232634   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 17160    |
|    fps              | 422      |
|    time_elapsed     | 2318     |
|    total timesteps  | 980722   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 1.75     |
|    n_updates        | 232680   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 17232    |
|    fps              | 422      |
|    time_elapsed     | 2332     |
|    total timesteps  | 986314   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0135   |
|    n_updates        | 234078   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 17236    |
|    fps              | 422      |
|    time_elapsed     | 2333     |
|    total timesteps  | 986454   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00375  |
|    n_updates        | 234113   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 17308    |
|    fps              | 422      |
|    time_elapsed     | 2346     |
|    total timesteps  | 991648   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.013    |
|    n_updates        | 235411   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 17312    |
|    fps              | 422      |
|    time_elapsed     | 2347     |
|    total timesteps  | 991966   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.0134   |
|    n_updates        | 235491   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 17384    |
|    fps              | 422      |
|    time_elapsed     | 2359     |
|    total timesteps  | 997093   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 0.00674  |
|    n_updates        | 236773   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rate | 0.1      |
| time/               |          |
|    episodes         | 17388    |
|    fps              | 422      |
|    time_elapsed     | 2361     |
|    total timesteps  | 997662   |
| train/              |          |
|    learning_rate    | 0.0001   |
|    loss             | 3.55     |
|    n_updates        | 236915   |
----------------------------------
----------------------------------
| rollout/            |          |
|    exploration rat

100%|██████████████████████████████████████████████████████████████████████████████| 10/10 [6:21:22<00:00, 2288.25s/it]


In [5]:
# Compare every trained DQN agent against a random-action baseline.
# The per-run means are kept in lists (not only printed) so that summary
# statistics can be computed from them instead of being re-typed by hand
# from the printed output.
n_eval_steps = 10**5  # value passed as num_steps to both evaluators
random_mean_rewards = []  # one entry per simulation, from ev.evaluate_random
dqn_mean_rewards = []     # one entry per simulation, from ev.evaluate_model

for i in tqdm(range(n_simulations)):
    # Baseline: a fresh 'ctfsql-v0' environment is created for each run.
    mean_reward, _ = ev.evaluate_random(gym.make('ctfsql-v0'), num_steps=n_eval_steps)
    random_mean_rewards.append(mean_reward)
    print('random Mean reward: {0}'.format(mean_reward))

    # Trained agent i, evaluated on the `env` object created in the setup cell.
    mean_reward, _ = ev.evaluate_model(dqn_models[i], env, num_steps=n_eval_steps)
    dqn_mean_rewards.append(mean_reward)
    print('dqn Mean reward: {0}'.format(mean_reward))

  0%|                                                                                           | 0/10 [00:00<?, ?it/s]

random Mean reward: -38.683


 10%|████████▏                                                                         | 1/10 [01:46<15:57, 106.42s/it]

dqn Mean reward: -102.391
random Mean reward: -38.658


 20%|████████████████▍                                                                 | 2/10 [03:32<14:08, 106.12s/it]

dqn Mean reward: 5.88
random Mean reward: -40.552


 30%|████████████████████████▌                                                         | 3/10 [05:17<12:20, 105.78s/it]

dqn Mean reward: -16.897
random Mean reward: -39.232


 40%|████████████████████████████████▊                                                 | 4/10 [07:03<10:34, 105.75s/it]

dqn Mean reward: -1.709
random Mean reward: -40.9


 50%|█████████████████████████████████████████                                         | 5/10 [08:49<08:48, 105.75s/it]

dqn Mean reward: 5.464
random Mean reward: -40.235


 60%|█████████████████████████████████████████████████▏                                | 6/10 [10:34<07:02, 105.69s/it]

dqn Mean reward: 5.241
random Mean reward: -40.579


 70%|█████████████████████████████████████████████████████████▍                        | 7/10 [12:20<05:17, 105.72s/it]

dqn Mean reward: -5.86
random Mean reward: -39.257


 80%|█████████████████████████████████████████████████████████████████▌                | 8/10 [14:15<03:37, 108.76s/it]

dqn Mean reward: 5.585
random Mean reward: -39.948


 90%|█████████████████████████████████████████████████████████████████████████▊        | 9/10 [16:10<01:50, 110.67s/it]

dqn Mean reward: -90.741
random Mean reward: -39.613


100%|█████████████████████████████████████████████████████████████████████████████████| 10/10 [18:05<00:00, 108.56s/it]

dqn Mean reward: -120.248





In [6]:
# Hand-entered flags, one per simulation: 1 marks a positive total score,
# 0 marks a negative one.
# NOTE(review): the signs of the "dqn Mean reward" values printed by the
# evaluation cell above read [0,1,0,0,1,1,0,1,0,0] (4 positives), which differs
# from this list at positions 6 and 9 -- confirm which run/metric these flags
# were transcribed from.
x = [
    0, 1, 0, 0, 1,
    1, 1, 1, 0, 1,
]
# Displayed as (number of simulations, number flagged positive).
(len(x), sum(x))

(10, 6)

In [7]:
# Run ev2.evaluate_model_deterministic on every trained DQN agent and print the
# first and third values it returns (bound to mean_reward / median_reward).
# NOTE(review): the recorded run of this cell stopped with
# "ModuleNotFoundError: No module named 'evaluate14'" -- confirm the module is
# available on the import path before re-running.
import evaluate14 as ev2

for sim_idx in tqdm(range(n_simulations)):
    agent = dqn_models[sim_idx]
    # Three values come back; the middle one is not used here.
    mean_reward, _, median_reward = ev2.evaluate_model_deterministic(
        agent, env, num_steps=10**5
    )
    report = 'dqn Mean reward: {0} median reward {1}'.format(mean_reward, median_reward)
    print(report)

ModuleNotFoundError: No module named 'evaluate14'

In [None]:
# Run ev2.evaluate_model_nondeter on every trained DQN agent and print the
# first and third values it returns (bound to mean_reward / median_reward).
# NOTE(review): this cell has no execution count or output in the saved
# notebook, and it rebinds the alias `ev2` to a different module (evaluate15)
# than the preceding cell -- confirm that module exists before running.
import evaluate15 as ev2

for sim_idx in tqdm(range(n_simulations)):
    agent = dqn_models[sim_idx]
    # Three values come back; the middle one is not used here.
    mean_reward, _, median_reward = ev2.evaluate_model_nondeter(
        agent, env, num_steps=10**5
    )
    report = 'dqn Mean reward: {0} median reward {1}'.format(mean_reward, median_reward)
    print(report)