In [1]:
import gymnasium as gym
from stable_baselines3 import SAC
from stable_baselines3.common.vec_env import DummyVecEnv, VecTransposeImage
from stable_baselines3.common.monitor import Monitor
from stable_baselines3.common.callbacks import CheckpointCallback, CallbackList
from stable_baselines3.common.logger import configure
from tqdm import trange

def make_env():
    """Build one monitored CarRacing-v3 environment.

    The environment is created with continuous actions and the
    ``rgb_array`` render mode, then wrapped in ``Monitor`` before being
    returned. Takes no arguments so it can be handed directly to a
    vectorised-env constructor as a factory.
    """
    return Monitor(
        gym.make("CarRacing-v3", render_mode="rgb_array", continuous=True)
    )

# One CarRacing instance behind the vectorised-env API, with its image
# observations passed through VecTransposeImage.
env = VecTransposeImage(DummyVecEnv([make_env]))

# Logger that prints to stdout and writes TensorBoard output under log_dir.
log_dir = "./sac_logs/"
new_logger = configure(folder=log_dir, format_strings=["stdout", "tensorboard"])

# Periodic model snapshots, written to ./checkpoints/ with the
# "sac_carracing" file-name prefix.
# NOTE(review): save_freq is presumably counted in callback calls (one per
# env step with a single env) -- confirm against the installed SB3 version.
checkpoint_callback = CheckpointCallback(
    name_prefix="sac_carracing",
    save_path="./checkpoints/",
    save_freq=100_000,
)

# Fixed seed so repeated runs start from the same RNG state. Without it every
# run of this multi-hour training is unrepeatable.
# NOTE(review): exact bit-for-bit reproducibility on GPU is not guaranteed.
SEED = 42

# SAC agent with a CNN policy operating on the image observations of `env`.
model = SAC(
    policy="CnnPolicy",
    env=env,
    seed=SEED,
    verbose=0,
    buffer_size=80_000,   # replay buffer capacity, in transitions
    learning_rate=3e-4,
    batch_size=64,
    train_freq=1,         # with gradient_steps=1: one update per env step
    gradient_steps=1,
    ent_coef="auto",      # entropy coefficient is tuned during training
    tensorboard_log=log_dir,
    device="cuda",
)

# Route all training metrics through the logger configured above.
# NOTE(review): per the SB3 docs a custom logger overrides the `verbose` and
# `tensorboard_log` settings passed to the constructor -- confirm.
model.set_logger(new_logger)

# Overall training budget and the size of each learn() chunk. One chunk is
# one tick of the tqdm progress bar.
total_timesteps = 250_000
steps_per_iter = 10_000

# Ceiling division: a plain floor division would silently drop the remainder
# whenever total_timesteps is not an exact multiple of steps_per_iter.
num_iters = -(-total_timesteps // steps_per_iter)

for chunk_idx in trange(num_iters, desc="Training Progress"):
    # The final chunk may be shorter so the total budget is hit exactly.
    steps_this_iter = min(
        steps_per_iter, total_timesteps - chunk_idx * steps_per_iter
    )
    # reset_num_timesteps=False keeps the global step counter running across
    # the successive learn() calls; the same callback object is reused.
    model.learn(
        total_timesteps=steps_this_iter,
        reset_num_timesteps=False,
        callback=checkpoint_callback,
    )

model.save("sac_carracing_sb3")
print("Training complete. Model saved as 'sac_carracing_sb3'.")


Logging to ./sac_logs/
Starting training with tqdm and TensorBoard logging...


Training Progress:   0%|                                                                        | 0/25 [00:00<?, ?it/s]

---------------------------------
| rollout/           |          |
|    ep_len_mean     | 1e+03    |
|    ep_rew_mean     | -33.5    |
| time/              |          |
|    episodes        | 4        |
|    fps             | 28       |
|    time_elapsed    | 142      |
|    total_timesteps | 4000     |
| train/             |          |
|    actor_loss      | -18      |
|    critic_loss     | 0.176    |
|    ent_coef        | 0.311    |
|    ent_coef_loss   | -5.93    |
|    learning_rate   | 0.0003   |
|    n_updates       | 3899     |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 1e+03    |
|    ep_rew_mean     | -29.7    |
| time/              |          |
|    episodes        | 8        |
|    fps             | 27       |
|    time_elapsed    | 286      |
|    total_timesteps | 8000     |
| train/             |          |
|    actor_loss      | -20.1    |
|    critic_loss     | 0.359    |
|    ent_coef 

Training Progress:   4%|██▍                                                          | 1/25 [05:57<2:23:10, 357.93s/it]

---------------------------------
| rollout/           |          |
|    ep_len_mean     | 1e+03    |
|    ep_rew_mean     | -31.4    |
| time/              |          |
|    episodes        | 12       |
|    fps             | 28       |
|    time_elapsed    | 71       |
|    total_timesteps | 12000    |
| train/             |          |
|    actor_loss      | -17      |
|    critic_loss     | 0.591    |
|    ent_coef        | 0.0282   |
|    ent_coef_loss   | -17.7    |
|    learning_rate   | 0.0003   |
|    n_updates       | 11899    |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 1e+03    |
|    ep_rew_mean     | -34.1    |
| time/              |          |
|    episodes        | 16       |
|    fps             | 27       |
|    time_elapsed    | 215      |
|    total_timesteps | 16000    |
| train/             |          |
|    actor_loss      | -13.5    |
|    critic_loss     | 0.431    |
|    ent_coef 

Training Progress:   8%|████▉                                                        | 2/25 [11:58<2:17:42, 359.24s/it]

---------------------------------
| rollout/           |          |
|    ep_len_mean     | 1e+03    |
|    ep_rew_mean     | -40.3    |
| time/              |          |
|    episodes        | 24       |
|    fps             | 27       |
|    time_elapsed    | 144      |
|    total_timesteps | 24000    |
| train/             |          |
|    actor_loss      | -7.78    |
|    critic_loss     | 0.0104   |
|    ent_coef        | 0.000935 |
|    ent_coef_loss   | -15.5    |
|    learning_rate   | 0.0003   |
|    n_updates       | 23899    |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 1e+03    |
|    ep_rew_mean     | -44.2    |
| time/              |          |
|    episodes        | 28       |
|    fps             | 27       |
|    time_elapsed    | 288      |
|    total_timesteps | 28000    |
| train/             |          |
|    actor_loss      | -5.71    |
|    critic_loss     | 0.0188   |
|    ent_coef 

Training Progress:  12%|███████▎                                                     | 3/25 [17:59<2:12:08, 360.36s/it]

---------------------------------
| rollout/           |          |
|    ep_len_mean     | 1e+03    |
|    ep_rew_mean     | -48.1    |
| time/              |          |
|    episodes        | 32       |
|    fps             | 27       |
|    time_elapsed    | 73       |
|    total_timesteps | 32000    |
| train/             |          |
|    actor_loss      | -4.03    |
|    critic_loss     | 0.272    |
|    ent_coef        | 0.0007   |
|    ent_coef_loss   | 5.56     |
|    learning_rate   | 0.0003   |
|    n_updates       | 31899    |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 1e+03    |
|    ep_rew_mean     | -49.4    |
| time/              |          |
|    episodes        | 36       |
|    fps             | 27       |
|    time_elapsed    | 217      |
|    total_timesteps | 36000    |
| train/             |          |
|    actor_loss      | -2.91    |
|    critic_loss     | 0.0242   |
|    ent_coef 

Training Progress:  16%|█████████▊                                                   | 4/25 [24:00<2:06:14, 360.68s/it]

---------------------------------
| rollout/           |          |
|    ep_len_mean     | 1e+03    |
|    ep_rew_mean     | -44.3    |
| time/              |          |
|    episodes        | 44       |
|    fps             | 28       |
|    time_elapsed    | 142      |
|    total_timesteps | 44000    |
| train/             |          |
|    actor_loss      | -0.582   |
|    critic_loss     | 0.165    |
|    ent_coef        | 0.000351 |
|    ent_coef_loss   | 2.19     |
|    learning_rate   | 0.0003   |
|    n_updates       | 43899    |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 1e+03    |
|    ep_rew_mean     | -46.8    |
| time/              |          |
|    episodes        | 48       |
|    fps             | 27       |
|    time_elapsed    | 286      |
|    total_timesteps | 48000    |
| train/             |          |
|    actor_loss      | 0.68     |
|    critic_loss     | 0.123    |
|    ent_coef 

Training Progress:  20%|████████████▏                                                | 5/25 [29:58<1:59:52, 359.63s/it]

---------------------------------
| rollout/           |          |
|    ep_len_mean     | 1e+03    |
|    ep_rew_mean     | -46.3    |
| time/              |          |
|    episodes        | 52       |
|    fps             | 27       |
|    time_elapsed    | 71       |
|    total_timesteps | 52000    |
| train/             |          |
|    actor_loss      | 1.22     |
|    critic_loss     | 0.301    |
|    ent_coef        | 0.00056  |
|    ent_coef_loss   | -11.2    |
|    learning_rate   | 0.0003   |
|    n_updates       | 51899    |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 1e+03    |
|    ep_rew_mean     | -46.3    |
| time/              |          |
|    episodes        | 56       |
|    fps             | 27       |
|    time_elapsed    | 214      |
|    total_timesteps | 56000    |
| train/             |          |
|    actor_loss      | 1.74     |
|    critic_loss     | 0.0946   |
|    ent_coef 

Training Progress:  24%|██████████████▋                                              | 6/25 [35:57<1:53:46, 359.29s/it]

---------------------------------
| rollout/           |          |
|    ep_len_mean     | 1e+03    |
|    ep_rew_mean     | -44.8    |
| time/              |          |
|    episodes        | 64       |
|    fps             | 27       |
|    time_elapsed    | 143      |
|    total_timesteps | 64000    |
| train/             |          |
|    actor_loss      | 3.67     |
|    critic_loss     | 0.0912   |
|    ent_coef        | 0.000416 |
|    ent_coef_loss   | 5.8      |
|    learning_rate   | 0.0003   |
|    n_updates       | 63899    |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 998      |
|    ep_rew_mean     | -47.4    |
| time/              |          |
|    episodes        | 68       |
|    fps             | 27       |
|    time_elapsed    | 282      |
|    total_timesteps | 67872    |
| train/             |          |
|    actor_loss      | 4.36     |
|    critic_loss     | 0.153    |
|    ent_coef 

Training Progress:  28%|█████████████████                                            | 7/25 [41:56<1:47:43, 359.10s/it]

---------------------------------
| rollout/           |          |
|    ep_len_mean     | 998      |
|    ep_rew_mean     | -46.9    |
| time/              |          |
|    episodes        | 72       |
|    fps             | 27       |
|    time_elapsed    | 67       |
|    total_timesteps | 71872    |
| train/             |          |
|    actor_loss      | 5.21     |
|    critic_loss     | 0.0476   |
|    ent_coef        | 0.00043  |
|    ent_coef_loss   | 15.7     |
|    learning_rate   | 0.0003   |
|    n_updates       | 71771    |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 995      |
|    ep_rew_mean     | -47.8    |
| time/              |          |
|    episodes        | 76       |
|    fps             | 27       |
|    time_elapsed    | 202      |
|    total_timesteps | 75655    |
| train/             |          |
|    actor_loss      | 5.45     |
|    critic_loss     | 0.125    |
|    ent_coef 

Training Progress:  32%|███████████████████▌                                         | 8/25 [47:54<1:41:38, 358.75s/it]

---------------------------------
| rollout/           |          |
|    ep_len_mean     | 996      |
|    ep_rew_mean     | -46.3    |
| time/              |          |
|    episodes        | 84       |
|    fps             | 28       |
|    time_elapsed    | 129      |
|    total_timesteps | 83655    |
| train/             |          |
|    actor_loss      | 6.84     |
|    critic_loss     | 0.0413   |
|    ent_coef        | 0.000565 |
|    ent_coef_loss   | -2.86    |
|    learning_rate   | 0.0003   |
|    n_updates       | 83554    |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 996      |
|    ep_rew_mean     | -47.1    |
| time/              |          |
|    episodes        | 88       |
|    fps             | 28       |
|    time_elapsed    | 272      |
|    total_timesteps | 87655    |
| train/             |          |
|    actor_loss      | 6.39     |
|    critic_loss     | 0.205    |
|    ent_coef 

Training Progress:  36%|█████████████████████▉                                       | 9/25 [53:50<1:35:26, 357.93s/it]

---------------------------------
| rollout/           |          |
|    ep_len_mean     | 996      |
|    ep_rew_mean     | -46.7    |
| time/              |          |
|    episodes        | 92       |
|    fps             | 28       |
|    time_elapsed    | 58       |
|    total_timesteps | 91655    |
| train/             |          |
|    actor_loss      | 6.66     |
|    critic_loss     | 0.0558   |
|    ent_coef        | 0.000362 |
|    ent_coef_loss   | 0.395    |
|    learning_rate   | 0.0003   |
|    n_updates       | 91554    |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 996      |
|    ep_rew_mean     | -45.4    |
| time/              |          |
|    episodes        | 96       |
|    fps             | 28       |
|    time_elapsed    | 200      |
|    total_timesteps | 95655    |
| train/             |          |
|    actor_loss      | 8.07     |
|    critic_loss     | 0.0831   |
|    ent_coef 

Training Progress:  40%|████████████████████████                                    | 10/25 [59:44<1:29:13, 356.92s/it]

---------------------------------
| rollout/           |          |
|    ep_len_mean     | 996      |
|    ep_rew_mean     | -46.3    |
| time/              |          |
|    episodes        | 104      |
|    fps             | 27       |
|    time_elapsed    | 129      |
|    total_timesteps | 103620   |
| train/             |          |
|    actor_loss      | 7.77     |
|    critic_loss     | 0.113    |
|    ent_coef        | 0.000288 |
|    ent_coef_loss   | 6.14     |
|    learning_rate   | 0.0003   |
|    n_updates       | 103519   |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 996      |
|    ep_rew_mean     | -47.1    |
| time/              |          |
|    episodes        | 108      |
|    fps             | 28       |
|    time_elapsed    | 271      |
|    total_timesteps | 107620   |
| train/             |          |
|    actor_loss      | 7.98     |
|    critic_loss     | 0.121    |
|    ent_coef 

Training Progress:  44%|█████████████████████████▌                                | 11/25 [1:05:41<1:23:16, 356.93s/it]

---------------------------------
| rollout/           |          |
|    ep_len_mean     | 994      |
|    ep_rew_mean     | -48.9    |
| time/              |          |
|    episodes        | 112      |
|    fps             | 27       |
|    time_elapsed    | 51       |
|    total_timesteps | 111450   |
| train/             |          |
|    actor_loss      | 9.15     |
|    critic_loss     | 0.0961   |
|    ent_coef        | 0.000398 |
|    ent_coef_loss   | 6.48     |
|    learning_rate   | 0.0003   |
|    n_updates       | 111349   |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 994      |
|    ep_rew_mean     | -48.7    |
| time/              |          |
|    episodes        | 116      |
|    fps             | 27       |
|    time_elapsed    | 195      |
|    total_timesteps | 115450   |
| train/             |          |
|    actor_loss      | 7.02     |
|    critic_loss     | 0.165    |
|    ent_coef 

Training Progress:  48%|███████████████████████████▊                              | 12/25 [1:11:39<1:17:22, 357.08s/it]

---------------------------------
| rollout/           |          |
|    ep_len_mean     | 994      |
|    ep_rew_mean     | -50.5    |
| time/              |          |
|    episodes        | 124      |
|    fps             | 27       |
|    time_elapsed    | 123      |
|    total_timesteps | 123450   |
| train/             |          |
|    actor_loss      | 8.82     |
|    critic_loss     | 0.384    |
|    ent_coef        | 0.00145  |
|    ent_coef_loss   | 27.7     |
|    learning_rate   | 0.0003   |
|    n_updates       | 123349   |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 994      |
|    ep_rew_mean     | -50.8    |
| time/              |          |
|    episodes        | 128      |
|    fps             | 28       |
|    time_elapsed    | 265      |
|    total_timesteps | 127450   |
| train/             |          |
|    actor_loss      | 8.91     |
|    critic_loss     | 0.198    |
|    ent_coef 

Training Progress:  52%|██████████████████████████████▏                           | 13/25 [1:17:36<1:11:26, 357.21s/it]

---------------------------------
| rollout/           |          |
|    ep_len_mean     | 994      |
|    ep_rew_mean     | -50.9    |
| time/              |          |
|    episodes        | 132      |
|    fps             | 28       |
|    time_elapsed    | 51       |
|    total_timesteps | 131450   |
| train/             |          |
|    actor_loss      | 9.33     |
|    critic_loss     | 0.134    |
|    ent_coef        | 0.000765 |
|    ent_coef_loss   | 27.2     |
|    learning_rate   | 0.0003   |
|    n_updates       | 131349   |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 994      |
|    ep_rew_mean     | -52.2    |
| time/              |          |
|    episodes        | 136      |
|    fps             | 27       |
|    time_elapsed    | 195      |
|    total_timesteps | 135450   |
| train/             |          |
|    actor_loss      | 8.5      |
|    critic_loss     | 0.246    |
|    ent_coef 

Training Progress:  56%|████████████████████████████████▍                         | 14/25 [1:23:34<1:05:30, 357.31s/it]

---------------------------------
| rollout/           |          |
|    ep_len_mean     | 994      |
|    ep_rew_mean     | -56.2    |
| time/              |          |
|    episodes        | 144      |
|    fps             | 28       |
|    time_elapsed    | 121      |
|    total_timesteps | 143450   |
| train/             |          |
|    actor_loss      | 9        |
|    critic_loss     | 0.135    |
|    ent_coef        | 0.000481 |
|    ent_coef_loss   | 8.75     |
|    learning_rate   | 0.0003   |
|    n_updates       | 143349   |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 994      |
|    ep_rew_mean     | -56.6    |
| time/              |          |
|    episodes        | 148      |
|    fps             | 28       |
|    time_elapsed    | 263      |
|    total_timesteps | 147450   |
| train/             |          |
|    actor_loss      | 8.98     |
|    critic_loss     | 0.0711   |
|    ent_coef 

Training Progress:  60%|████████████████████████████████████                        | 15/25 [1:29:28<59:23, 356.31s/it]

---------------------------------
| rollout/           |          |
|    ep_len_mean     | 994      |
|    ep_rew_mean     | -58.3    |
| time/              |          |
|    episodes        | 152      |
|    fps             | 28       |
|    time_elapsed    | 51       |
|    total_timesteps | 151450   |
| train/             |          |
|    actor_loss      | 8.56     |
|    critic_loss     | 0.0908   |
|    ent_coef        | 0.00108  |
|    ent_coef_loss   | -3.18    |
|    learning_rate   | 0.0003   |
|    n_updates       | 151349   |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 994      |
|    ep_rew_mean     | -59.6    |
| time/              |          |
|    episodes        | 156      |
|    fps             | 28       |
|    time_elapsed    | 194      |
|    total_timesteps | 155450   |
| train/             |          |
|    actor_loss      | 9.36     |
|    critic_loss     | 0.056    |
|    ent_coef 

Training Progress:  64%|██████████████████████████████████████▍                     | 16/25 [1:35:24<53:26, 356.30s/it]

---------------------------------
| rollout/           |          |
|    ep_len_mean     | 994      |
|    ep_rew_mean     | -63.5    |
| time/              |          |
|    episodes        | 164      |
|    fps             | 27       |
|    time_elapsed    | 123      |
|    total_timesteps | 163450   |
| train/             |          |
|    actor_loss      | 9.48     |
|    critic_loss     | 0.572    |
|    ent_coef        | 0.00192  |
|    ent_coef_loss   | 4.92     |
|    learning_rate   | 0.0003   |
|    n_updates       | 163349   |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 996      |
|    ep_rew_mean     | -63.5    |
| time/              |          |
|    episodes        | 168      |
|    fps             | 28       |
|    time_elapsed    | 265      |
|    total_timesteps | 167450   |
| train/             |          |
|    actor_loss      | 8.1      |
|    critic_loss     | 0.178    |
|    ent_coef 

Training Progress:  68%|████████████████████████████████████████▊                   | 17/25 [1:41:20<47:29, 356.22s/it]

---------------------------------
| rollout/           |          |
|    ep_len_mean     | 996      |
|    ep_rew_mean     | -65.2    |
| time/              |          |
|    episodes        | 172      |
|    fps             | 28       |
|    time_elapsed    | 51       |
|    total_timesteps | 171450   |
| train/             |          |
|    actor_loss      | 7.89     |
|    critic_loss     | 0.0491   |
|    ent_coef        | 0.00317  |
|    ent_coef_loss   | -12.4    |
|    learning_rate   | 0.0003   |
|    n_updates       | 171349   |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 998      |
|    ep_rew_mean     | -66      |
| time/              |          |
|    episodes        | 176      |
|    fps             | 28       |
|    time_elapsed    | 194      |
|    total_timesteps | 175450   |
| train/             |          |
|    actor_loss      | 9.09     |
|    critic_loss     | 0.14     |
|    ent_coef 

Training Progress:  72%|███████████████████████████████████████████▏                | 18/25 [1:47:17<41:35, 356.54s/it]

---------------------------------
| rollout/           |          |
|    ep_len_mean     | 998      |
|    ep_rew_mean     | -69.4    |
| time/              |          |
|    episodes        | 184      |
|    fps             | 27       |
|    time_elapsed    | 123      |
|    total_timesteps | 183450   |
| train/             |          |
|    actor_loss      | 9.11     |
|    critic_loss     | 0.134    |
|    ent_coef        | 0.000472 |
|    ent_coef_loss   | -10.8    |
|    learning_rate   | 0.0003   |
|    n_updates       | 183349   |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 998      |
|    ep_rew_mean     | -70.4    |
| time/              |          |
|    episodes        | 188      |
|    fps             | 27       |
|    time_elapsed    | 266      |
|    total_timesteps | 187450   |
| train/             |          |
|    actor_loss      | 8.62     |
|    critic_loss     | 0.0361   |
|    ent_coef 

Training Progress:  76%|█████████████████████████████████████████████▌              | 19/25 [1:53:15<35:40, 356.80s/it]

---------------------------------
| rollout/           |          |
|    ep_len_mean     | 998      |
|    ep_rew_mean     | -72.1    |
| time/              |          |
|    episodes        | 192      |
|    fps             | 27       |
|    time_elapsed    | 52       |
|    total_timesteps | 191450   |
| train/             |          |
|    actor_loss      | 8.99     |
|    critic_loss     | 0.0422   |
|    ent_coef        | 0.000973 |
|    ent_coef_loss   | -3.9     |
|    learning_rate   | 0.0003   |
|    n_updates       | 191349   |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 998      |
|    ep_rew_mean     | -74.8    |
| time/              |          |
|    episodes        | 196      |
|    fps             | 27       |
|    time_elapsed    | 196      |
|    total_timesteps | 195450   |
| train/             |          |
|    actor_loss      | 9.11     |
|    critic_loss     | 0.108    |
|    ent_coef 

Training Progress:  80%|████████████████████████████████████████████████            | 20/25 [1:59:15<29:49, 357.96s/it]

---------------------------------
| rollout/           |          |
|    ep_len_mean     | 998      |
|    ep_rew_mean     | -76.7    |
| time/              |          |
|    episodes        | 204      |
|    fps             | 27       |
|    time_elapsed    | 124      |
|    total_timesteps | 203450   |
| train/             |          |
|    actor_loss      | 9.37     |
|    critic_loss     | 0.155    |
|    ent_coef        | 0.00155  |
|    ent_coef_loss   | -0.158   |
|    learning_rate   | 0.0003   |
|    n_updates       | 203349   |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 998      |
|    ep_rew_mean     | -77.8    |
| time/              |          |
|    episodes        | 208      |
|    fps             | 27       |
|    time_elapsed    | 267      |
|    total_timesteps | 207450   |
| train/             |          |
|    actor_loss      | 9.85     |
|    critic_loss     | 0.0585   |
|    ent_coef 

Training Progress:  84%|██████████████████████████████████████████████████▍         | 21/25 [2:05:13<23:51, 357.82s/it]

---------------------------------
| rollout/           |          |
|    ep_len_mean     | 1e+03    |
|    ep_rew_mean     | -77.9    |
| time/              |          |
|    episodes        | 212      |
|    fps             | 28       |
|    time_elapsed    | 51       |
|    total_timesteps | 211450   |
| train/             |          |
|    actor_loss      | 9.89     |
|    critic_loss     | 0.105    |
|    ent_coef        | 0.0015   |
|    ent_coef_loss   | 5.86     |
|    learning_rate   | 0.0003   |
|    n_updates       | 211349   |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 1e+03    |
|    ep_rew_mean     | -79.8    |
| time/              |          |
|    episodes        | 216      |
|    fps             | 28       |
|    time_elapsed    | 194      |
|    total_timesteps | 215450   |
| train/             |          |
|    actor_loss      | 9.71     |
|    critic_loss     | 0.0545   |
|    ent_coef 

Training Progress:  88%|████████████████████████████████████████████████████▊       | 22/25 [2:11:10<17:52, 357.66s/it]

---------------------------------
| rollout/           |          |
|    ep_len_mean     | 1e+03    |
|    ep_rew_mean     | -80.3    |
| time/              |          |
|    episodes        | 224      |
|    fps             | 27       |
|    time_elapsed    | 123      |
|    total_timesteps | 223450   |
| train/             |          |
|    actor_loss      | 10.6     |
|    critic_loss     | 0.033    |
|    ent_coef        | 0.00123  |
|    ent_coef_loss   | 0.235    |
|    learning_rate   | 0.0003   |
|    n_updates       | 223349   |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 1e+03    |
|    ep_rew_mean     | -80.5    |
| time/              |          |
|    episodes        | 228      |
|    fps             | 27       |
|    time_elapsed    | 266      |
|    total_timesteps | 227450   |
| train/             |          |
|    actor_loss      | 11.2     |
|    critic_loss     | 0.0251   |
|    ent_coef 

Training Progress:  92%|███████████████████████████████████████████████████████▏    | 23/25 [2:17:08<11:55, 357.59s/it]

---------------------------------
| rollout/           |          |
|    ep_len_mean     | 1e+03    |
|    ep_rew_mean     | -79.7    |
| time/              |          |
|    episodes        | 232      |
|    fps             | 28       |
|    time_elapsed    | 51       |
|    total_timesteps | 231450   |
| train/             |          |
|    actor_loss      | 10.3     |
|    critic_loss     | 0.0936   |
|    ent_coef        | 0.00123  |
|    ent_coef_loss   | 6.69     |
|    learning_rate   | 0.0003   |
|    n_updates       | 231349   |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 1e+03    |
|    ep_rew_mean     | -79.3    |
| time/              |          |
|    episodes        | 236      |
|    fps             | 27       |
|    time_elapsed    | 195      |
|    total_timesteps | 235450   |
| train/             |          |
|    actor_loss      | 11       |
|    critic_loss     | 0.0133   |
|    ent_coef 

Training Progress:  96%|█████████████████████████████████████████████████████████▌  | 24/25 [2:23:06<05:57, 357.85s/it]

---------------------------------
| rollout/           |          |
|    ep_len_mean     | 1e+03    |
|    ep_rew_mean     | -80.2    |
| time/              |          |
|    episodes        | 244      |
|    fps             | 27       |
|    time_elapsed    | 123      |
|    total_timesteps | 243450   |
| train/             |          |
|    actor_loss      | 10       |
|    critic_loss     | 0.0595   |
|    ent_coef        | 0.00114  |
|    ent_coef_loss   | -0.75    |
|    learning_rate   | 0.0003   |
|    n_updates       | 243349   |
---------------------------------
---------------------------------
| rollout/           |          |
|    ep_len_mean     | 1e+03    |
|    ep_rew_mean     | -79.8    |
| time/              |          |
|    episodes        | 248      |
|    fps             | 28       |
|    time_elapsed    | 266      |
|    total_timesteps | 247450   |
| train/             |          |
|    actor_loss      | 10       |
|    critic_loss     | 0.00859  |
|    ent_coef 

Training Progress: 100%|████████████████████████████████████████████████████████████| 25/25 [2:29:03<00:00, 357.73s/it]

Training complete. Model saved as 'sac_carracing_sb3'.



