# Asynchronous Advantage Actor Critic (A3C)
---
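In this notebook, we train an agent with Asynchronous Advantage Actor-Critic (A3C): several worker processes run `train` in parallel against a single shared `ActorCritic` model, while a separate `test` process runs alongside them.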

### 1. Import the Necessary Packages

In [1]:
import os

import torch
import torch.multiprocessing as mp

import my_optim
from envs import create_atari_env
from model import ActorCritic
from test import test
from train import train

class args:
    """Static settings namespace passed to the `train` and `test` workers.

    The class itself is used as the settings object (it is never
    instantiated); values are read as class attributes, e.g. ``args.lr``.
    """

    # --- run setup ---------------------------------------------------------
    seed = 1               # passed to torch.manual_seed before the model is built
    env_name = None
    num_processes = 4      # number of `train` processes launched
    no_shared = False      # True -> no shared optimizer is built; workers receive None

    # --- rollout limits (presumably read inside train/test -- confirm there) --
    num_steps = 255
    max_episode_length = 10000

    # --- optimisation ------------------------------------------------------
    lr = 1e-4              # learning rate handed to my_optim.SharedAdam
    max_grad_norm = 50

    # --- loss terms (presumably discounting / loss weights -- confirm in train) --
    gamma = 0.99
    gae_lambda = 1.0
    entropy_coef = 0.01
    value_loss_coef = 0.5
    

### 2. Instantiate the Environment and Agent, then Launch Training

In [None]:
# Launch one `test` process plus `args.num_processes` `train` processes that
# all operate on the same shared-memory model, then block until they exit.

# Ask for a single OpenMP thread per process and hide every CUDA device.
# NOTE(review): these are set after `import torch`; confirm OMP_NUM_THREADS is
# still honoured at this point, otherwise set it before the import cell runs.
os.environ['OMP_NUM_THREADS'] = '1'
os.environ['CUDA_VISIBLE_DEVICES'] = ""
torch.manual_seed(args.seed)

# The parent builds an environment only to read the observation/action spaces
# needed to construct the network. Use the configured name rather than a
# hard-coded None so that changing `args.env_name` actually takes effect.
env = create_atari_env(args.env_name)
shared_model = ActorCritic(env.observation_space.shape[0], env.action_space)
shared_model.share_memory()  # parameters become visible to all child processes

if args.no_shared:
    # No shared optimizer: each worker is handed None instead.
    optimizer = None
else:
    optimizer = my_optim.SharedAdam(shared_model.parameters(), lr=args.lr)
    optimizer.share_memory()

processes = []

# Shared integer counter and the lock passed to the training workers.
counter = mp.Value('i', 0)
lock = mp.Lock()

try:
    # The test process is given rank `args.num_processes`, i.e. one past the
    # last training rank.
    p = mp.Process(target=test, args=(args.num_processes, args, shared_model, counter))
    p.start()
    processes.append(p)

    for rank in range(0, args.num_processes):
        p = mp.Process(target=train, args=(rank, args, shared_model, counter, lock, optimizer))
        p.start()
        processes.append(p)

    for p in processes:
        p.join()
finally:
    # Runs on normal completion, on a failed start, and when the cell is
    # interrupted from the notebook. Without it, interrupting the kernel would
    # leave the worker processes running in the background.
    for p in processes:
        if p.is_alive():
            p.terminate()
            p.join()

Time 00h 00m 00s, num steps 224, FPS 630, episode reward -2359.628501009234, episode length 100
Time 00h 01m 00s, num steps 25850, FPS 424, episode reward -2359.628501009234, episode length 100
Time 00h 02m 01s, num steps 51037, FPS 420, episode reward -2359.628501009234, episode length 100
Time 00h 03m 01s, num steps 76405, FPS 420, episode reward -2359.628501009234, episode length 100
Time 00h 04m 02s, num steps 101777, FPS 420, episode reward -2382.0316954362584, episode length 101
Time 00h 05m 02s, num steps 127235, FPS 420, episode reward -2359.628501009234, episode length 100
Time 00h 06m 03s, num steps 152856, FPS 421, episode reward -2496.3258534164647, episode length 106
Time 00h 07m 03s, num steps 178122, FPS 420, episode reward -2359.628501009234, episode length 100
Time 00h 08m 04s, num steps 203843, FPS 421, episode reward -2359.628501009234, episode length 100
Time 00h 09m 05s, num steps 229269, FPS 421, episode reward -2359.628501009234, episode length 100
Time 00h 10m 0

  action = 0.01 * action/np.linalg.norm(action, ord = 2)


Time 00h 43m 23s, num steps 1075207, FPS 413, episode reward nan, episode length 125
Time 00h 44m 24s, num steps 1099516, FPS 413, episode reward -2686.5007690862344, episode length 114
Time 00h 45m 24s, num steps 1123683, FPS 412, episode reward nan, episode length 138
Time 00h 46m 25s, num steps 1148387, FPS 412, episode reward nan, episode length 143
Time 00h 47m 26s, num steps 1172846, FPS 412, episode reward -3091.4665125086394, episode length 129
Time 00h 48m 26s, num steps 1197230, FPS 412, episode reward -3091.4665125086394, episode length 129
Time 00h 49m 27s, num steps 1221576, FPS 412, episode reward -2952.1027149632137, episode length 124
Time 00h 50m 28s, num steps 1246289, FPS 412, episode reward -3476.8914957715156, episode length 144
Time 00h 51m 28s, num steps 1271088, FPS 411, episode reward -2711.4744990542754, episode length 115
Time 00h 52m 29s, num steps 1295368, FPS 411, episode reward nan, episode length 100
Time 00h 53m 30s, num steps 1319838, FPS 411, episode 

Time 02h 09m 14s, num steps 3156653, FPS 407, episode reward -2359.628501009234, episode length 100
Time 02h 10m 15s, num steps 3181142, FPS 407, episode reward nan, episode length 103
Time 02h 11m 16s, num steps 3205676, FPS 407, episode reward -3277.171001143663, episode length 136
Time 02h 12m 16s, num steps 3230384, FPS 407, episode reward -2841.1340885832574, episode length 120
Time 02h 13m 17s, num steps 3254987, FPS 407, episode reward -3815.950733001962, episode length 159
Time 02h 14m 18s, num steps 3279442, FPS 407, episode reward -2895.9573846533494, episode length 122
Time 02h 15m 19s, num steps 3304002, FPS 407, episode reward -2359.628501009234, episode length 100
Time 02h 16m 19s, num steps 3328675, FPS 407, episode reward -2359.628501009234, episode length 100
Time 02h 17m 20s, num steps 3352890, FPS 407, episode reward -2359.628501009234, episode length 100
Time 02h 18m 20s, num steps 3377771, FPS 407, episode reward -2841.1340885832574, episode length 120
Time 02h 19m

Time 03h 34m 06s, num steps 5200218, FPS 405, episode reward nan, episode length 100
Time 03h 35m 06s, num steps 5225776, FPS 405, episode reward -2359.628501009234, episode length 100
Time 03h 36m 08s, num steps 5251908, FPS 405, episode reward -5426.763224821954, episode length 346
Time 03h 37m 08s, num steps 5277350, FPS 405, episode reward nan, episode length 100
Time 03h 38m 09s, num steps 5302850, FPS 405, episode reward -2496.3258534164647, episode length 106
Time 03h 39m 09s, num steps 5328409, FPS 405, episode reward nan, episode length 104
Time 03h 40m 10s, num steps 5353982, FPS 405, episode reward -2868.348401136659, episode length 121
Time 03h 41m 10s, num steps 5379583, FPS 405, episode reward -2762.40393871813, episode length 117
Time 03h 42m 11s, num steps 5404794, FPS 405, episode reward -2736.7841642573508, episode length 116
Time 03h 43m 12s, num steps 5430318, FPS 405, episode reward nan, episode length 100
Time 03h 44m 12s, num steps 5455941, FPS 406, episode rewar

Time 05h 01m 59s, num steps 7440730, FPS 411, episode reward -2359.628501009234, episode length 100
Time 05h 02m 59s, num steps 7466456, FPS 411, episode reward -2359.628501009234, episode length 100
Time 05h 04m 00s, num steps 7492435, FPS 411, episode reward -4005.997723275353, episode length 167
Time 05h 05m 01s, num steps 7518469, FPS 411, episode reward nan, episode length 100
Time 05h 06m 01s, num steps 7544057, FPS 411, episode reward nan, episode length 102
Time 05h 07m 02s, num steps 7569906, FPS 411, episode reward nan, episode length 103
Time 05h 08m 02s, num steps 7595928, FPS 411, episode reward -2473.2160182689036, episode length 105
Time 05h 09m 03s, num steps 7621593, FPS 411, episode reward nan, episode length 100
Time 05h 10m 03s, num steps 7646953, FPS 411, episode reward nan, episode length 100
Time 05h 11m 04s, num steps 7672882, FPS 411, episode reward nan, episode length 102
Time 05h 12m 04s, num steps 7699031, FPS 411, episode reward nan, episode length 100
Time

Time 06h 27m 50s, num steps 9639883, FPS 414, episode reward -2359.628501009234, episode length 100
Time 06h 28m 51s, num steps 9665131, FPS 414, episode reward -3658.7180934576277, episode length 152
Time 06h 29m 52s, num steps 9691405, FPS 414, episode reward nan, episode length 114
Time 06h 30m 53s, num steps 9717515, FPS 414, episode reward -3091.4665125086394, episode length 129
Time 06h 31m 53s, num steps 9743625, FPS 414, episode reward nan, episode length 106
Time 06h 32m 54s, num steps 9769593, FPS 414, episode reward nan, episode length 119
Time 06h 33m 54s, num steps 9795525, FPS 414, episode reward -2496.3258534164647, episode length 106
Time 06h 34m 55s, num steps 9821342, FPS 414, episode reward -2382.0316954362584, episode length 101
Time 06h 35m 56s, num steps 9847418, FPS 415, episode reward -4261.671250156531, episode length 177
Time 06h 36m 56s, num steps 9873078, FPS 415, episode reward -2359.628501009234, episode length 100
Time 06h 37m 57s, num steps 9899245, FPS 

Time 07h 52m 50s, num steps 11818518, FPS 417, episode reward -2359.628501009234, episode length 100
Time 07h 53m 51s, num steps 11844448, FPS 417, episode reward nan, episode length 131
Time 07h 54m 51s, num steps 11870105, FPS 417, episode reward -2359.628501009234, episode length 100
Time 07h 55m 52s, num steps 11896283, FPS 417, episode reward -2711.4744990542754, episode length 115
Time 07h 56m 52s, num steps 11922157, FPS 417, episode reward -2359.628501009234, episode length 100
Time 07h 57m 53s, num steps 11948480, FPS 417, episode reward -4604.927430982805, episode length 192
Time 07h 58m 54s, num steps 11974643, FPS 417, episode reward -4627.5380130946305, episode length 193
Time 07h 59m 55s, num steps 12000981, FPS 417, episode reward -2404.58579547247, episode length 102
Time 08h 00m 55s, num steps 12027161, FPS 417, episode reward -2736.7841642573508, episode length 116
Time 08h 01m 56s, num steps 12052909, FPS 417, episode reward -2762.40393871813, episode length 117
Time

Time 09h 18m 47s, num steps 14017397, FPS 418, episode reward -2895.9573846533494, episode length 122
Time 09h 19m 48s, num steps 14043074, FPS 418, episode reward -2359.628501009234, episode length 100
Time 09h 20m 48s, num steps 14068967, FPS 418, episode reward -2952.1027149632137, episode length 124
Time 09h 21m 49s, num steps 14094670, FPS 418, episode reward -2404.58579547247, episode length 102
Time 09h 22m 51s, num steps 14121217, FPS 418, episode reward -5433.230187636285, episode length 385
Time 09h 23m 51s, num steps 14147353, FPS 418, episode reward -3592.7193457545322, episode length 149
Time 09h 24m 52s, num steps 14172486, FPS 418, episode reward -2382.0316954362584, episode length 101
Time 09h 25m 52s, num steps 14198403, FPS 418, episode reward -2359.628501009234, episode length 100
Time 09h 26m 53s, num steps 14224471, FPS 418, episode reward -3570.3574395842074, episode length 148
Time 09h 27m 53s, num steps 14250289, FPS 418, episode reward nan, episode length 116
T

Time 10h 43m 39s, num steps 16191061, FPS 419, episode reward nan, episode length 100
Time 10h 44m 40s, num steps 16217033, FPS 419, episode reward -3277.171001143663, episode length 136
Time 10h 45m 40s, num steps 16242829, FPS 419, episode reward nan, episode length 100
Time 10h 46m 41s, num steps 16268333, FPS 419, episode reward nan, episode length 100
Time 10h 47m 41s, num steps 16294283, FPS 419, episode reward nan, episode length 100
Time 10h 48m 42s, num steps 16320133, FPS 419, episode reward nan, episode length 100
Time 10h 49m 42s, num steps 16346298, FPS 419, episode reward nan, episode length 101
Time 10h 50m 43s, num steps 16372110, FPS 419, episode reward -3036.374576158774, episode length 127
Time 10h 51m 44s, num steps 16398093, FPS 419, episode reward -3064.0276716425524, episode length 128
Time 10h 52m 44s, num steps 16424184, FPS 419, episode reward nan, episode length 100
Time 10h 53m 44s, num steps 16450335, FPS 419, episode reward -2359.628501009234, episode leng

Time 12h 09m 36s, num steps 18393219, FPS 420, episode reward -2895.9573846533494, episode length 122
Time 12h 10m 37s, num steps 18419215, FPS 420, episode reward -4400.235622540142, episode length 183
Time 12h 11m 37s, num steps 18445078, FPS 420, episode reward -2895.9573846533494, episode length 122
Time 12h 12m 40s, num steps 18471248, FPS 420, episode reward -5450.9959728535705, episode length 492
Time 12h 13m 42s, num steps 18497611, FPS 420, episode reward -5439.539197188287, episode length 423
Time 12h 14m 42s, num steps 18523879, FPS 420, episode reward -2736.7841642573508, episode length 116
Time 12h 15m 43s, num steps 18549753, FPS 420, episode reward -2359.628501009234, episode length 100
Time 12h 16m 43s, num steps 18575875, FPS 420, episode reward -2359.628501009234, episode length 100
Time 12h 17m 44s, num steps 18601873, FPS 420, episode reward -2359.628501009234, episode length 100
Time 12h 18m 44s, num steps 18628214, FPS 420, episode reward -2566.3532063447396, epis

Time 13h 34m 38s, num steps 20617305, FPS 422, episode reward -2566.3532063447396, episode length 109
Time 13h 35m 38s, num steps 20644494, FPS 422, episode reward -2359.628501009234, episode length 100
Time 13h 36m 39s, num steps 20671197, FPS 422, episode reward -2359.628501009234, episode length 100
Time 13h 37m 39s, num steps 20697586, FPS 422, episode reward nan, episode length 103
Time 13h 38m 40s, num steps 20724658, FPS 422, episode reward nan, episode length 102
Time 13h 39m 40s, num steps 20751172, FPS 422, episode reward -2359.628501009234, episode length 100
Time 13h 40m 41s, num steps 20777247, FPS 422, episode reward nan, episode length 104
Time 13h 41m 41s, num steps 20803202, FPS 422, episode reward nan, episode length 106
Time 13h 42m 42s, num steps 20829495, FPS 422, episode reward -4334.75905684863, episode length 180
Time 13h 43m 43s, num steps 20855615, FPS 422, episode reward -3118.7238517477576, episode length 130
Time 13h 44m 43s, num steps 20881483, FPS 422, ep

Time 15h 00m 44s, num steps 22820533, FPS 422, episode reward -5440.3694145497375, episode length 428
Time 15h 01m 45s, num steps 22846608, FPS 422, episode reward nan, episode length 122
Time 15h 02m 45s, num steps 22872939, FPS 422, episode reward -2542.8876875127985, episode length 108
Time 15h 03m 46s, num steps 22898702, FPS 422, episode reward -2519.5420729605826, episode length 107
Time 15h 04m 47s, num steps 22924460, FPS 422, episode reward -3302.5937644912797, episode length 137
Time 15h 05m 48s, num steps 22950822, FPS 422, episode reward -5426.597539168268, episode length 345
Time 15h 06m 49s, num steps 22976311, FPS 422, episode reward nan, episode length 126
Time 15h 07m 50s, num steps 23002163, FPS 422, episode reward -3932.181443029756, episode length 164
Time 15h 08m 51s, num steps 23028233, FPS 422, episode reward -2473.2160182689036, episode length 105
Time 15h 09m 51s, num steps 23053732, FPS 422, episode reward -2613.7270159203285, episode length 111
Time 15h 10m 5

Time 16h 27m 53s, num steps 25058140, FPS 423, episode reward -3199.2425101473264, episode length 133
Time 16h 28m 55s, num steps 25084415, FPS 423, episode reward -5426.928937178522, episode length 347
Time 16h 29m 55s, num steps 25110725, FPS 423, episode reward -2359.628501009234, episode length 100
Time 16h 30m 56s, num steps 25136738, FPS 423, episode reward -2359.628501009234, episode length 100
Time 16h 31m 56s, num steps 25162637, FPS 423, episode reward nan, episode length 125
Time 16h 32m 58s, num steps 25189168, FPS 423, episode reward -5428.918263655572, episode length 359
Time 16h 34m 00s, num steps 25215620, FPS 423, episode reward -5427.923585158258, episode length 353
Time 16h 35m 00s, num steps 25242025, FPS 423, episode reward -2762.40393871813, episode length 117
Time 16h 36m 01s, num steps 25267990, FPS 423, episode reward -2359.628501009234, episode length 100
Time 16h 37m 02s, num steps 25294717, FPS 423, episode reward -5427.260430556207, episode length 349
Time 

Time 17h 55m 12s, num steps 27290605, FPS 423, episode reward nan, episode length 101
Time 17h 56m 13s, num steps 27316729, FPS 423, episode reward nan, episode length 276
Time 17h 57m 14s, num steps 27342610, FPS 423, episode reward -3036.374576158774, episode length 127
Time 17h 58m 15s, num steps 27369157, FPS 423, episode reward -5434.0601608571105, episode length 390
Time 17h 59m 16s, num steps 27394505, FPS 423, episode reward -2359.628501009234, episode length 100
Time 18h 00m 17s, num steps 27420444, FPS 423, episode reward -5414.774192076593, episode length 277
Time 18h 01m 18s, num steps 27446067, FPS 423, episode reward nan, episode length 105
Time 18h 02m 18s, num steps 27471940, FPS 423, episode reward -2359.628501009234, episode length 100
Time 18h 03m 19s, num steps 27498129, FPS 423, episode reward nan, episode length 113
Time 18h 04m 19s, num steps 27523843, FPS 423, episode reward -2359.628501009234, episode length 100
Time 18h 05m 20s, num steps 27549573, FPS 423, ep

Time 19h 22m 17s, num steps 29515941, FPS 423, episode reward -2359.628501009234, episode length 100
Time 19h 23m 17s, num steps 29542141, FPS 423, episode reward -2566.3532063447396, episode length 109
Time 19h 24m 19s, num steps 29568307, FPS 423, episode reward -5425.934828978448, episode length 341
Time 19h 25m 21s, num steps 29594366, FPS 423, episode reward -5437.546712141901, episode length 411
Time 19h 26m 21s, num steps 29620252, FPS 423, episode reward -2359.628501009234, episode length 100
Time 19h 27m 22s, num steps 29646038, FPS 423, episode reward nan, episode length 100
Time 19h 28m 22s, num steps 29672155, FPS 423, episode reward -2359.628501009234, episode length 100
Time 19h 29m 22s, num steps 29697639, FPS 423, episode reward -2427.3117211560943, episode length 103
Time 19h 30m 23s, num steps 29723231, FPS 423, episode reward -2841.1340885832574, episode length 120
Time 19h 31m 23s, num steps 29749129, FPS 423, episode reward -2359.628501009234, episode length 100
Ti

Time 20h 48m 25s, num steps 31710997, FPS 423, episode reward -2359.628501009234, episode length 100
Time 20h 49m 27s, num steps 31737412, FPS 423, episode reward -5432.40038226214, episode length 380
Time 20h 50m 28s, num steps 31763758, FPS 423, episode reward -5432.40038226214, episode length 380
Time 20h 51m 30s, num steps 31790198, FPS 423, episode reward -5425.437464934259, episode length 338
Time 20h 52m 31s, num steps 31816622, FPS 423, episode reward -5432.234442931085, episode length 379
Time 20h 53m 33s, num steps 31843264, FPS 423, episode reward -5426.431864958673, episode length 344
Time 20h 54m 34s, num steps 31869343, FPS 423, episode reward -2382.0316954362584, episode length 101
Time 20h 55m 34s, num steps 31895203, FPS 423, episode reward nan, episode length 104
Time 20h 56m 36s, num steps 31921881, FPS 423, episode reward -5427.260430556207, episode length 349
Time 20h 57m 37s, num steps 31948521, FPS 423, episode reward -5427.426207762628, episode length 350
Time 2

Time 22h 13m 49s, num steps 33891629, FPS 423, episode reward -5430.078337889581, episode length 366
Time 22h 14m 49s, num steps 33917617, FPS 423, episode reward nan, episode length 104
Time 22h 15m 50s, num steps 33943071, FPS 423, episode reward -2788.274377651493, episode length 118
Time 22h 16m 50s, num steps 33968966, FPS 423, episode reward -2359.628501009234, episode length 100
Time 22h 17m 51s, num steps 33994791, FPS 423, episode reward -3251.518648333766, episode length 135
Time 22h 18m 51s, num steps 34020646, FPS 424, episode reward -2359.628501009234, episode length 100
Time 22h 19m 52s, num steps 34046471, FPS 424, episode reward -2359.628501009234, episode length 100
Time 22h 20m 52s, num steps 34072399, FPS 424, episode reward -3199.2425101473264, episode length 133
Time 22h 21m 54s, num steps 34098305, FPS 424, episode reward -5440.03732417193, episode length 426
Time 22h 22m 55s, num steps 34123752, FPS 423, episode reward -4081.8665172395836, episode length 170
Time

Time 23h 37m 51s, num steps 36033911, FPS 424, episode reward -3353.24075824756, episode length 139
Time 23h 38m 52s, num steps 36059479, FPS 424, episode reward -2359.628501009234, episode length 100
Time 23h 39m 53s, num steps 36085305, FPS 424, episode reward nan, episode length 282
Time 23h 40m 53s, num steps 36111338, FPS 424, episode reward -2359.628501009234, episode length 100
Time 23h 41m 54s, num steps 36137407, FPS 424, episode reward -2359.628501009234, episode length 100
Time 23h 42m 55s, num steps 36163418, FPS 424, episode reward -2359.628501009234, episode length 100
Time 23h 43m 55s, num steps 36188777, FPS 424, episode reward -2359.628501009234, episode length 100
Time 23h 44m 56s, num steps 36214587, FPS 424, episode reward -3064.0276716425524, episode length 128
Time 23h 45m 56s, num steps 36240252, FPS 424, episode reward nan, episode length 130
Time 23h 46m 57s, num steps 36265940, FPS 424, episode reward -2359.628501009234, episode length 100
Time 23h 47m 58s, nu

Time 01h 02m 53s, num steps 38196088, FPS 424, episode reward -2359.628501009234, episode length 100
Time 01h 03m 53s, num steps 38221743, FPS 424, episode reward -2359.628501009234, episode length 100
Time 01h 04m 55s, num steps 38247457, FPS 424, episode reward -5436.882565718561, episode length 407
Time 01h 05m 56s, num steps 38273167, FPS 424, episode reward -4558.935655233077, episode length 190
Time 01h 06m 56s, num steps 38298707, FPS 424, episode reward nan, episode length 100
Time 01h 07m 57s, num steps 38324652, FPS 424, episode reward nan, episode length 100
Time 01h 08m 57s, num steps 38350559, FPS 424, episode reward nan, episode length 100
Time 01h 09m 58s, num steps 38376400, FPS 424, episode reward -2359.628501009234, episode length 100
Time 01h 10m 59s, num steps 38402355, FPS 424, episode reward -3932.181443029756, episode length 164
Time 01h 12m 00s, num steps 38428926, FPS 424, episode reward -5428.089379530817, episode length 354
Time 01h 13m 01s, num steps 3845509

Time 02h 28m 58s, num steps 40394908, FPS 424, episode reward -2359.628501009234, episode length 100
Time 02h 29m 59s, num steps 40420841, FPS 424, episode reward -4604.927430982805, episode length 192
Time 02h 30m 59s, num steps 40446688, FPS 424, episode reward -2359.628501009234, episode length 100
Time 02h 32m 00s, num steps 40472558, FPS 424, episode reward -2450.2062561012713, episode length 104
Time 02h 33m 02s, num steps 40498751, FPS 424, episode reward -5432.234442931085, episode length 379
Time 02h 34m 02s, num steps 40524460, FPS 424, episode reward -2359.628501009234, episode length 100
Time 02h 35m 04s, num steps 40550545, FPS 424, episode reward -5430.741503935724, episode length 370
Time 02h 36m 05s, num steps 40576531, FPS 424, episode reward -5431.239041548639, episode length 373
Time 02h 37m 06s, num steps 40602311, FPS 424, episode reward -2980.3820980265286, episode length 125
Time 02h 38m 07s, num steps 40628367, FPS 424, episode reward nan, episode length 149
Tim

Time 03h 54m 15s, num steps 42538014, FPS 423, episode reward -5432.898242216974, episode length 383
Time 03h 55m 17s, num steps 42563985, FPS 423, episode reward -5431.404910307794, episode length 374
Time 03h 56m 19s, num steps 42589933, FPS 423, episode reward -5426.26620219317, episode length 343
Time 03h 57m 19s, num steps 42615829, FPS 423, episode reward -2519.5420729605826, episode length 107
Time 03h 58m 20s, num steps 42641561, FPS 423, episode reward -2427.3117211560943, episode length 103
Time 03h 59m 20s, num steps 42667235, FPS 423, episode reward -2404.58579547247, episode length 102
Time 04h 00m 21s, num steps 42692492, FPS 423, episode reward -2589.9653536757373, episode length 110
Time 04h 01m 21s, num steps 42718142, FPS 423, episode reward -3277.171001143663, episode length 136
Time 04h 02m 22s, num steps 42743477, FPS 423, episode reward -2359.628501009234, episode length 100
Time 04h 03m 23s, num steps 42769586, FPS 423, episode reward -5429.415402632623, episode 

Time 05h 21m 28s, num steps 44752644, FPS 423, episode reward nan, episode length 101
Time 05h 22m 29s, num steps 44778902, FPS 423, episode reward -5426.100529890924, episode length 342
Time 05h 23m 31s, num steps 44805166, FPS 423, episode reward -5425.105567198663, episode length 336
Time 05h 24m 32s, num steps 44830929, FPS 423, episode reward nan, episode length 102
Time 05h 25m 32s, num steps 44856169, FPS 423, episode reward nan, episode length 102
Time 05h 26m 33s, num steps 44881859, FPS 423, episode reward -2359.628501009234, episode length 100
Time 05h 27m 35s, num steps 44907950, FPS 423, episode reward -5435.886380415826, episode length 401
Time 05h 28m 35s, num steps 44933420, FPS 423, episode reward nan, episode length 106
Time 05h 29m 37s, num steps 44959442, FPS 423, episode reward -5424.607289534479, episode length 333
Time 05h 30m 38s, num steps 44985247, FPS 423, episode reward -5248.014735820421, episode length 224
Time 05h 31m 39s, num steps 45011201, FPS 423, epi

Time 06h 48m 45s, num steps 46974167, FPS 423, episode reward nan, episode length 100
Time 06h 49m 46s, num steps 46999656, FPS 423, episode reward -2359.628501009234, episode length 100
Time 06h 50m 46s, num steps 47025225, FPS 423, episode reward -2382.0316954362584, episode length 101
Time 06h 51m 47s, num steps 47050823, FPS 423, episode reward -2359.628501009234, episode length 100
Time 06h 52m 48s, num steps 47076904, FPS 423, episode reward nan, episode length 190
Time 06h 53m 49s, num steps 47102643, FPS 423, episode reward -3747.4030614471553, episode length 156
Time 06h 54m 49s, num steps 47128530, FPS 423, episode reward nan, episode length 119
Time 06h 55m 50s, num steps 47154391, FPS 423, episode reward -2868.348401136659, episode length 121
Time 06h 56m 50s, num steps 47180079, FPS 423, episode reward -2404.58579547247, episode length 102
Time 06h 57m 51s, num steps 47205588, FPS 423, episode reward nan, episode length 100
Time 06h 58m 52s, num steps 47231762, FPS 423, ep

Time 08h 14m 08s, num steps 49150098, FPS 424, episode reward -5423.444638472467, episode length 326
Time 08h 15m 10s, num steps 49176038, FPS 424, episode reward -5444.354397993951, episode length 452
Time 08h 16m 11s, num steps 49201741, FPS 424, episode reward -2359.628501009234, episode length 100
Time 08h 17m 11s, num steps 49227170, FPS 424, episode reward -2359.628501009234, episode length 100
Time 08h 18m 13s, num steps 49253110, FPS 424, episode reward -5431.239041548639, episode length 373
Time 08h 19m 14s, num steps 49278532, FPS 424, episode reward -2359.628501009234, episode length 100
Time 08h 20m 14s, num steps 49304391, FPS 424, episode reward -2450.2062561012713, episode length 104
Time 08h 21m 15s, num steps 49330139, FPS 424, episode reward nan, episode length 317
Time 08h 22m 18s, num steps 49356632, FPS 424, episode reward -5447.675189238458, episode length 472
Time 08h 23m 20s, num steps 49383038, FPS 424, episode reward -5454.316796523004, episode length 512
Time

Time 09h 39m 34s, num steps 51319018, FPS 424, episode reward -5428.4209644612365, episode length 356
Time 09h 40m 36s, num steps 51345146, FPS 424, episode reward -5465.2753631886535, episode length 578
Time 09h 41m 37s, num steps 51370474, FPS 424, episode reward -2359.628501009234, episode length 100
Time 09h 42m 40s, num steps 51396855, FPS 424, episode reward -5465.607440215021, episode length 580
Time 09h 43m 42s, num steps 51422868, FPS 424, episode reward -5427.923585158258, episode length 353
Time 09h 44m 44s, num steps 51449303, FPS 424, episode reward -5465.441401701837, episode length 579
Time 09h 45m 45s, num steps 51475387, FPS 424, episode reward nan, episode length 101
Time 09h 46m 45s, num steps 51500792, FPS 424, episode reward nan, episode length 101
Time 09h 47m 46s, num steps 51526771, FPS 424, episode reward -2359.628501009234, episode length 100
Time 09h 48m 47s, num steps 51553024, FPS 424, episode reward -5430.575690489679, episode length 369
Time 09h 49m 48s, 

Time 11h 05m 08s, num steps 53493476, FPS 424, episode reward -5431.073182326227, episode length 372
Time 11h 06m 09s, num steps 53518790, FPS 424, episode reward nan, episode length 100
Time 11h 07m 10s, num steps 53544448, FPS 424, episode reward nan, episode length 101
Time 11h 08m 10s, num steps 53570209, FPS 424, episode reward -3636.816938702446, episode length 151
Time 11h 09m 12s, num steps 53595967, FPS 424, episode reward -5432.234442931085, episode length 379
Time 11h 10m 14s, num steps 53621967, FPS 424, episode reward -5432.566329222589, episode length 381
Time 11h 11m 14s, num steps 53647466, FPS 424, episode reward -2473.2160182689036, episode length 105
Time 11h 12m 17s, num steps 53674174, FPS 424, episode reward nan, episode length 551
Time 11h 13m 18s, num steps 53700112, FPS 424, episode reward -3614.8425924234793, episode length 150
Time 11h 14m 20s, num steps 53726245, FPS 424, episode reward nan, episode length 361
Time 11h 15m 20s, num steps 53751883, FPS 424, e

Time 12h 30m 50s, num steps 55682924, FPS 424, episode reward -5466.603678923517, episode length 586
Time 12h 31m 51s, num steps 55708715, FPS 424, episode reward -3145.799187608007, episode length 131
Time 12h 32m 52s, num steps 55735542, FPS 424, episode reward -3064.0276716425524, episode length 128
Time 12h 33m 53s, num steps 55762157, FPS 424, episode reward -5426.26620219317, episode length 343
Time 12h 34m 55s, num steps 55789406, FPS 424, episode reward -5426.431864958673, episode length 344
Time 12h 35m 55s, num steps 55815574, FPS 424, episode reward -2359.628501009234, episode length 100
Time 12h 36m 57s, num steps 55842370, FPS 424, episode reward -5426.597539168268, episode length 345
Time 12h 37m 57s, num steps 55868869, FPS 424, episode reward nan, episode length 100
Time 12h 38m 59s, num steps 55895839, FPS 424, episode reward -5428.089379530817, episode length 354
Time 12h 40m 00s, num steps 55922884, FPS 424, episode reward -5430.741503935724, episode length 370
Time 

Time 13h 58m 27s, num steps 57921998, FPS 424, episode reward nan, episode length 101
Time 13h 59m 27s, num steps 57947955, FPS 424, episode reward nan, episode length 102
Time 14h 00m 29s, num steps 57974137, FPS 424, episode reward -5427.426207762628, episode length 350
Time 14h 01m 29s, num steps 57999865, FPS 424, episode reward nan, episode length 102
Time 14h 02m 31s, num steps 58025904, FPS 424, episode reward -5426.928937178522, episode length 347
Time 14h 03m 33s, num steps 58051623, FPS 424, episode reward -5426.928937178522, episode length 347
Time 14h 04m 34s, num steps 58077831, FPS 424, episode reward -5426.763224821954, episode length 346
Time 14h 05m 36s, num steps 58103803, FPS 424, episode reward -5426.763224821954, episode length 346
Time 14h 06m 36s, num steps 58129155, FPS 424, episode reward nan, episode length 101
Time 14h 07m 37s, num steps 58154744, FPS 424, episode reward nan, episode length 101
Time 14h 08m 37s, num steps 58180306, FPS 424, episode reward -31

Time 15h 26m 03s, num steps 60151366, FPS 424, episode reward nan, episode length 102
Time 15h 27m 03s, num steps 60177909, FPS 424, episode reward nan, episode length 103
Time 15h 28m 05s, num steps 60204622, FPS 424, episode reward -5430.078337889581, episode length 366
Time 15h 29m 06s, num steps 60231357, FPS 424, episode reward nan, episode length 150
Time 15h 30m 06s, num steps 60257749, FPS 424, episode reward nan, episode length 101
Time 15h 31m 07s, num steps 60284376, FPS 424, episode reward -2359.628501009234, episode length 100
Time 15h 32m 08s, num steps 60310595, FPS 424, episode reward -5430.409894209772, episode length 368
Time 15h 33m 09s, num steps 60336150, FPS 424, episode reward nan, episode length 102
Time 15h 34m 10s, num steps 60361835, FPS 424, episode reward -3793.010064300342, episode length 158
Time 15h 35m 11s, num steps 60387662, FPS 424, episode reward -5436.882565718561, episode length 407
Time 15h 36m 12s, num steps 60413345, FPS 424, episode reward -40

Time 16h 52m 29s, num steps 62347551, FPS 424, episode reward nan, episode length 353
Time 16h 53m 30s, num steps 62373408, FPS 424, episode reward nan, episode length 130
Time 16h 54m 31s, num steps 62399020, FPS 424, episode reward nan, episode length 196
Time 16h 55m 32s, num steps 62424859, FPS 424, episode reward nan, episode length 355
Time 16h 56m 34s, num steps 62450496, FPS 424, episode reward -5429.083985548883, episode length 360
Time 16h 57m 34s, num steps 62476482, FPS 424, episode reward -3378.4052898361065, episode length 140
Time 16h 58m 36s, num steps 62503023, FPS 424, episode reward -5428.255171996027, episode length 355
Time 16h 59m 38s, num steps 62529989, FPS 424, episode reward -5431.9025966939025, episode length 377
Time 17h 00m 38s, num steps 62556430, FPS 424, episode reward nan, episode length 118
Time 17h 01m 39s, num steps 62583039, FPS 424, episode reward nan, episode length 134
Time 17h 02m 40s, num steps 62609775, FPS 424, episode reward -3091.4665125086

Time 18h 20m 01s, num steps 64581108, FPS 424, episode reward -3327.9670707656865, episode length 138
Time 18h 21m 01s, num steps 64606577, FPS 424, episode reward -3251.518648333766, episode length 135
Time 18h 22m 02s, num steps 64632041, FPS 424, episode reward -4261.671250156531, episode length 177
Time 18h 23m 05s, num steps 64658501, FPS 424, episode reward -5459.297997694879, episode length 542
Time 18h 24m 07s, num steps 64684616, FPS 424, episode reward -5446.844992857843, episode length 467
Time 18h 25m 08s, num steps 64710270, FPS 424, episode reward -3353.24075824756, episode length 139
Time 18h 26m 08s, num steps 64735667, FPS 424, episode reward nan, episode length 132
Time 18h 27m 09s, num steps 64761466, FPS 424, episode reward nan, episode length 132
Time 18h 28m 11s, num steps 64787600, FPS 424, episode reward -5433.230187636285, episode length 385
Time 18h 29m 13s, num steps 64813547, FPS 424, episode reward -5446.014798384576, episode length 462
Time 18h 30m 14s, nu

Time 19h 45m 49s, num steps 66746644, FPS 424, episode reward -5446.346879225641, episode length 464
Time 19h 46m 49s, num steps 66772407, FPS 424, episode reward -2589.9653536757373, episode length 110
Time 19h 47m 50s, num steps 66797731, FPS 424, episode reward -3145.799187608007, episode length 131
Time 19h 48m 53s, num steps 66823845, FPS 424, episode reward -5447.343110304742, episode length 470
Time 19h 49m 54s, num steps 66848184, FPS 424, episode reward nan, episode length 106
Time 19h 50m 55s, num steps 66873538, FPS 424, episode reward -5430.575690489679, episode length 369
Time 19h 51m 56s, num steps 66898591, FPS 424, episode reward -3225.541353650318, episode length 134
Time 19h 52m 58s, num steps 66924337, FPS 424, episode reward -5437.214633208185, episode length 409
Time 19h 54m 00s, num steps 66949916, FPS 424, episode reward -3199.2425101473264, episode length 133
Time 19h 55m 02s, num steps 66975477, FPS 424, episode reward -5430.575690489679, episode length 369
Tim

Time 21h 13m 16s, num steps 68868085, FPS 423, episode reward -5430.907334547906, episode length 371
Time 21h 14m 17s, num steps 68893614, FPS 423, episode reward -2736.7841642573508, episode length 116
Time 21h 15m 17s, num steps 68919561, FPS 423, episode reward nan, episode length 126
Time 21h 16m 19s, num steps 68945934, FPS 423, episode reward -5431.404910307794, episode length 374
Time 21h 17m 21s, num steps 68972517, FPS 423, episode reward -5451.9921963032775, episode length 498
Time 21h 18m 22s, num steps 68997907, FPS 423, episode reward -3172.6484010889517, episode length 132
Time 21h 19m 22s, num steps 69023521, FPS 423, episode reward -3172.6484010889517, episode length 132
Time 21h 20m 24s, num steps 69049344, FPS 423, episode reward -5434.558196288019, episode length 393
Time 21h 21m 26s, num steps 69075187, FPS 423, episode reward -5431.9025966939025, episode length 377
Time 21h 22m 28s, num steps 69101266, FPS 423, episode reward -5431.570790511041, episode length 375


Time 22h 39m 51s, num steps 71066195, FPS 423, episode reward -3172.6484010889517, episode length 132
Time 22h 40m 52s, num steps 71092145, FPS 423, episode reward nan, episode length 102
Time 22h 41m 52s, num steps 71118210, FPS 423, episode reward -3145.799187608007, episode length 131
Time 22h 42m 53s, num steps 71144056, FPS 423, episode reward -3199.2425101473264, episode length 133
Time 22h 43m 54s, num steps 71170488, FPS 423, episode reward -4378.677792888102, episode length 182
Time 22h 44m 56s, num steps 71196892, FPS 423, episode reward -5425.769086104303, episode length 340
Time 22h 45m 56s, num steps 71223050, FPS 423, episode reward -4334.75905684863, episode length 180
Time 22h 46m 57s, num steps 71248729, FPS 423, episode reward nan, episode length 113
Time 22h 47m 59s, num steps 71274953, FPS 423, episode reward -5446.844992857843, episode length 467
Time 22h 49m 00s, num steps 71300790, FPS 423, episode reward nan, episode length 101
Time 22h 50m 02s, num steps 713269

Time 00h 03m 18s, num steps 73187561, FPS 423, episode reward -4357.063402251657, episode length 181
Time 00h 04m 20s, num steps 73213623, FPS 423, episode reward -5434.0601608571105, episode length 390
Time 00h 05m 21s, num steps 73239499, FPS 423, episode reward -5425.105567198663, episode length 336
Time 00h 06m 22s, num steps 73265109, FPS 423, episode reward -2427.3117211560943, episode length 103
Time 00h 07m 23s, num steps 73291171, FPS 423, episode reward -5427.923585158258, episode length 353
Time 00h 08m 24s, num steps 73316787, FPS 423, episode reward -3118.7238517477576, episode length 130
Time 00h 09m 25s, num steps 73342285, FPS 423, episode reward -3064.0276716425524, episode length 128
Time 00h 10m 26s, num steps 73368571, FPS 423, episode reward -5425.105567198663, episode length 336
Time 00h 11m 28s, num steps 73394824, FPS 423, episode reward -5428.089379530817, episode length 354
Time 00h 12m 29s, num steps 73420574, FPS 423, episode reward -3091.4665125086394, epis

Time 01h 27m 11s, num steps 75322771, FPS 423, episode reward -2762.40393871813, episode length 117
Time 01h 28m 12s, num steps 75348634, FPS 423, episode reward -3327.9670707656865, episode length 138
Time 01h 29m 12s, num steps 75373916, FPS 423, episode reward -2661.9179260210253, episode length 113
Time 01h 30m 13s, num steps 75399809, FPS 423, episode reward -2519.5420729605826, episode length 107
Time 01h 31m 14s, num steps 75425992, FPS 423, episode reward -5426.928937178522, episode length 347
Time 01h 32m 15s, num steps 75451553, FPS 423, episode reward -3064.0276716425524, episode length 128
Time 01h 33m 16s, num steps 75477304, FPS 423, episode reward -3702.56880944921, episode length 154
Time 01h 34m 16s, num steps 75502719, FPS 423, episode reward -3327.9670707656865, episode length 138
Time 01h 35m 17s, num steps 75528429, FPS 423, episode reward -3277.171001143663, episode length 136
Time 01h 36m 18s, num steps 75553688, FPS 423, episode reward -3353.24075824756, episode

Time 02h 50m 42s, num steps 77446624, FPS 423, episode reward -3592.7193457545322, episode length 149
Time 02h 51m 43s, num steps 77472128, FPS 423, episode reward -3592.7193457545322, episode length 149
Time 02h 52m 44s, num steps 77497066, FPS 423, episode reward -5430.741503935724, episode length 370
Time 02h 53m 46s, num steps 77522027, FPS 423, episode reward -5447.509148817926, episode length 471
Time 02h 54m 49s, num steps 77547471, FPS 423, episode reward -5461.12441943255, episode length 553
Time 02h 55m 49s, num steps 77572048, FPS 423, episode reward -2637.681960530777, episode length 112
Time 02h 56m 52s, num steps 77597459, FPS 423, episode reward -5472.249087553888, episode length 620
Time 02h 57m 55s, num steps 77623458, FPS 423, episode reward -5473.74343417254, episode length 629
Time 02h 58m 57s, num steps 77649190, FPS 423, episode reward -5439.207110625177, episode length 421
Time 02h 59m 59s, num steps 77675080, FPS 423, episode reward -5431.073182326227, episode l

Time 04h 14m 31s, num steps 79551043, FPS 423, episode reward -2359.628501009234, episode length 100
Time 04h 15m 33s, num steps 79577144, FPS 423, episode reward -5430.078337889581, episode length 366
Time 04h 16m 33s, num steps 79602733, FPS 423, episode reward -2359.628501009234, episode length 100
Time 04h 17m 34s, num steps 79627958, FPS 423, episode reward -2980.3820980265286, episode length 125
Time 04h 18m 35s, num steps 79654233, FPS 423, episode reward -5430.575690489679, episode length 369
Time 04h 19m 37s, num steps 79680277, FPS 423, episode reward -5430.575690489679, episode length 369
Time 04h 20m 39s, num steps 79706377, FPS 423, episode reward -5430.078337889581, episode length 366
Time 04h 21m 41s, num steps 79732541, FPS 423, episode reward -5429.083985548883, episode length 360
Time 04h 22m 42s, num steps 79758197, FPS 423, episode reward -5426.928937178522, episode length 347
Time 04h 23m 44s, num steps 79784328, FPS 423, episode reward -5429.2496921834045, episode

Time 05h 38m 03s, num steps 81672269, FPS 423, episode reward -2519.5420729605826, episode length 107
Time 05h 39m 04s, num steps 81698313, FPS 423, episode reward -3118.7238517477576, episode length 130
Time 05h 40m 05s, num steps 81724339, FPS 423, episode reward -5436.882565718561, episode length 407
Time 05h 41m 06s, num steps 81749932, FPS 423, episode reward -2519.5420729605826, episode length 107
Time 05h 42m 06s, num steps 81775695, FPS 423, episode reward -2841.1340885832574, episode length 120
Time 05h 43m 09s, num steps 81801863, FPS 423, episode reward -5465.2753631886535, episode length 578
Time 05h 44m 09s, num steps 81827665, FPS 423, episode reward -2496.3258534164647, episode length 106
Time 05h 45m 10s, num steps 81853388, FPS 423, episode reward -2542.8876875127985, episode length 108
Time 05h 46m 12s, num steps 81879423, FPS 423, episode reward -5447.675189238458, episode length 472
Time 05h 47m 13s, num steps 81905003, FPS 423, episode reward -3547.6787915895197, e

Time 07h 03m 18s, num steps 83836487, FPS 423, episode reward -5450.33181307879, episode length 488
Time 07h 04m 20s, num steps 83862293, FPS 423, episode reward -5426.26620219317, episode length 343
Time 07h 05m 22s, num steps 83888690, FPS 423, episode reward -5427.426207762628, episode length 350
Time 07h 06m 23s, num steps 83914378, FPS 423, episode reward -5427.757786971002, episode length 352
Time 07h 07m 25s, num steps 83940845, FPS 423, episode reward -5429.2496921834045, episode length 361
Time 07h 08m 26s, num steps 83967064, FPS 423, episode reward -4081.8665172395836, episode length 170
Time 07h 09m 28s, num steps 83993353, FPS 423, episode reward -5430.409894209772, episode length 368
Time 07h 10m 28s, num steps 84019364, FPS 423, episode reward -2359.628501009234, episode length 100
Time 07h 11m 30s, num steps 84045939, FPS 423, episode reward -5430.907334547906, episode length 371
Time 07h 12m 31s, num steps 84072365, FPS 423, episode reward -3500.912640399992, episode l

Time 08h 26m 47s, num steps 85957895, FPS 423, episode reward -2359.628501009234, episode length 100
Time 08h 27m 48s, num steps 85983511, FPS 423, episode reward -2841.1340885832574, episode length 120
Time 08h 28m 49s, num steps 86009913, FPS 423, episode reward -5430.907334547906, episode length 371
Time 08h 29m 51s, num steps 86036003, FPS 423, episode reward nan, episode length 289
Time 08h 30m 53s, num steps 86061873, FPS 423, episode reward -5436.716529112726, episode length 406
Time 08h 31m 53s, num steps 86087542, FPS 423, episode reward -3172.6484010889517, episode length 132
Time 08h 32m 55s, num steps 86113332, FPS 423, episode reward -5430.907334547906, episode length 371
Time 08h 33m 55s, num steps 86139089, FPS 423, episode reward -2788.274377651493, episode length 118
Time 08h 34m 56s, num steps 86165028, FPS 423, episode reward -3199.2425101473264, episode length 133
Time 08h 35m 58s, num steps 86190963, FPS 423, episode reward -5426.597539168268, episode length 345
Ti

Time 09h 52m 16s, num steps 88130563, FPS 423, episode reward -5430.575690489679, episode length 369
Time 09h 53m 17s, num steps 88155829, FPS 423, episode reward -3302.5937644912797, episode length 137
Time 09h 54m 19s, num steps 88182092, FPS 423, episode reward -5452.324273329645, episode length 500
Time 09h 55m 20s, num steps 88207851, FPS 423, episode reward -3476.8914957715156, episode length 144
Time 09h 56m 21s, num steps 88233886, FPS 423, episode reward -5426.26620219317, episode length 343
Time 09h 57m 22s, num steps 88259514, FPS 423, episode reward -2589.9653536757373, episode length 110
Time 09h 58m 22s, num steps 88285382, FPS 423, episode reward -3570.3574395842074, episode length 148
Time 09h 59m 25s, num steps 88311878, FPS 423, episode reward -5448.173300963312, episode length 475
Time 10h 00m 25s, num steps 88337177, FPS 423, episode reward -2404.58579547247, episode length 102
Time 10h 01m 27s, num steps 88363190, FPS 423, episode reward nan, episode length 292
Tim

Time 11h 18m 45s, num steps 90323300, FPS 423, episode reward -5425.934828978448, episode length 341
Time 11h 19m 47s, num steps 90349384, FPS 423, episode reward -5425.934828978448, episode length 341
Time 11h 20m 48s, num steps 90375384, FPS 423, episode reward -5416.8986904439025, episode length 286
Time 11h 21m 50s, num steps 90401154, FPS 423, episode reward -5416.76401255694, episode length 285
Time 11h 22m 50s, num steps 90426898, FPS 423, episode reward -2359.628501009234, episode length 100
Time 11h 23m 51s, num steps 90452659, FPS 423, episode reward -2359.628501009234, episode length 100
Time 11h 24m 53s, num steps 90478671, FPS 423, episode reward -5423.279273253351, episode length 325
Time 11h 25m 53s, num steps 90504285, FPS 423, episode reward -2359.628501009234, episode length 100
Time 11h 26m 54s, num steps 90529983, FPS 423, episode reward -2359.628501009234, episode length 100
Time 11h 27m 54s, num steps 90555352, FPS 423, episode reward nan, episode length 130
Time 

Time 12h 47m 05s, num steps 92565256, FPS 423, episode reward -2542.8876875127985, episode length 108
Time 12h 48m 05s, num steps 92590633, FPS 423, episode reward -2382.0316954362584, episode length 101
Time 12h 49m 07s, num steps 92616978, FPS 423, episode reward -5443.690228682428, episode length 448
Time 12h 50m 08s, num steps 92642552, FPS 423, episode reward nan, episode length 103
Time 12h 51m 09s, num steps 92668215, FPS 423, episode reward nan, episode length 218
Time 12h 52m 09s, num steps 92694103, FPS 423, episode reward nan, episode length 102
Time 12h 53m 10s, num steps 92719656, FPS 423, episode reward nan, episode length 112
Time 12h 54m 10s, num steps 92745214, FPS 423, episode reward -3091.4665125086394, episode length 129
Time 12h 55m 11s, num steps 92770588, FPS 423, episode reward nan, episode length 103
Time 12h 56m 12s, num steps 92795983, FPS 423, episode reward nan, episode length 215
Time 12h 57m 12s, num steps 92821567, FPS 423, episode reward -2404.585795472

Time 14h 15m 27s, num steps 94808318, FPS 423, episode reward nan, episode length 106
Time 14h 16m 27s, num steps 94834057, FPS 423, episode reward nan, episode length 106
Time 14h 17m 28s, num steps 94859749, FPS 423, episode reward nan, episode length 106
Time 14h 18m 30s, num steps 94885667, FPS 423, episode reward -5438.542948943048, episode length 417
Time 14h 19m 31s, num steps 94911031, FPS 423, episode reward nan, episode length 106
Time 14h 20m 31s, num steps 94936944, FPS 423, episode reward -3428.074237175142, episode length 142
Time 14h 21m 32s, num steps 94962450, FPS 423, episode reward nan, episode length 104
Time 14h 22m 32s, num steps 94987898, FPS 423, episode reward nan, episode length 104
Time 14h 23m 33s, num steps 95014446, FPS 423, episode reward -2359.628501009234, episode length 100
Time 14h 24m 35s, num steps 95041529, FPS 423, episode reward -5438.708991270929, episode length 418
Time 14h 25m 35s, num steps 95067855, FPS 423, episode reward nan, episode lengt

Time 15h 44m 42s, num steps 97078584, FPS 423, episode reward -2359.628501009234, episode length 100
Time 15h 45m 42s, num steps 97103933, FPS 423, episode reward -2359.628501009234, episode length 100
Time 15h 46m 44s, num steps 97129861, FPS 423, episode reward -5427.923585158258, episode length 353
Time 15h 47m 45s, num steps 97155206, FPS 423, episode reward nan, episode length 297
Time 15h 48m 47s, num steps 97180847, FPS 423, episode reward nan, episode length 292
Time 15h 49m 48s, num steps 97206199, FPS 423, episode reward -4378.677792888102, episode length 182
Time 15h 50m 48s, num steps 97231680, FPS 423, episode reward -2359.628501009234, episode length 100
Time 15h 51m 49s, num steps 97257462, FPS 423, episode reward nan, episode length 294
Time 15h 52m 50s, num steps 97283093, FPS 423, episode reward -2359.628501009234, episode length 100
Time 15h 53m 51s, num steps 97308815, FPS 423, episode reward nan, episode length 194
Time 15h 54m 53s, num steps 97334574, FPS 423, epi

Time 17h 13m 30s, num steps 99343626, FPS 423, episode reward nan, episode length 295
Time 17h 14m 30s, num steps 99369627, FPS 423, episode reward -3008.4865257218016, episode length 126
Time 17h 15m 31s, num steps 99395405, FPS 423, episode reward -2841.1340885832574, episode length 120
Time 17h 16m 34s, num steps 99422236, FPS 423, episode reward -5479.056695204645, episode length 661
Time 17h 17m 34s, num steps 99448588, FPS 423, episode reward -2427.3117211560943, episode length 103
Time 17h 18m 36s, num steps 99474258, FPS 423, episode reward -5437.878792982965, episode length 413
Time 17h 19m 37s, num steps 99499687, FPS 423, episode reward nan, episode length 276
Time 17h 20m 39s, num steps 99525351, FPS 423, episode reward nan, episode length 304
Time 17h 21m 39s, num steps 99550878, FPS 423, episode reward nan, episode length 148
Time 17h 22m 40s, num steps 99576507, FPS 423, episode reward -4378.677792888102, episode length 182
Time 17h 23m 41s, num steps 99602331, FPS 423, 

Time 18h 40m 59s, num steps 101555799, FPS 423, episode reward nan, episode length 126
Time 18h 42m 00s, num steps 101582413, FPS 423, episode reward nan, episode length 129
Time 18h 43m 02s, num steps 101608633, FPS 423, episode reward nan, episode length 305
Time 18h 44m 03s, num steps 101635114, FPS 423, episode reward -5431.9025966939025, episode length 377
Time 18h 45m 05s, num steps 101661395, FPS 423, episode reward -5431.570790511041, episode length 375
Time 18h 46m 06s, num steps 101687761, FPS 423, episode reward nan, episode length 143
Time 18h 47m 07s, num steps 101713979, FPS 423, episode reward -3277.171001143663, episode length 136
Time 18h 48m 07s, num steps 101739824, FPS 423, episode reward -3145.799187608007, episode length 131
Time 18h 49m 09s, num steps 101765450, FPS 423, episode reward nan, episode length 305
Time 18h 50m 10s, num steps 101790869, FPS 423, episode reward -3403.355944223571, episode length 141
Time 18h 51m 10s, num steps 101816699, FPS 423, episod

Time 20h 09m 11s, num steps 103542013, FPS 422, episode reward nan, episode length 134
Time 20h 10m 12s, num steps 103564019, FPS 422, episode reward nan, episode length 323
Time 20h 11m 13s, num steps 103586029, FPS 422, episode reward -4357.063402251657, episode length 181
Time 20h 12m 14s, num steps 103607702, FPS 422, episode reward nan, episode length 131
Time 20h 13m 15s, num steps 103629898, FPS 422, episode reward -5430.409894209772, episode length 368
Time 20h 14m 16s, num steps 103651568, FPS 422, episode reward nan, episode length 135
Time 20h 15m 16s, num steps 103673193, FPS 422, episode reward nan, episode length 131
Time 20h 16m 17s, num steps 103695042, FPS 422, episode reward nan, episode length 131
Time 20h 17m 18s, num steps 103716823, FPS 422, episode reward nan, episode length 135
Time 20h 18m 18s, num steps 103739039, FPS 422, episode reward nan, episode length 102
Time 20h 19m 19s, num steps 103760724, FPS 422, episode reward nan, episode length 129
Time 20h 20m 

Time 21h 34m 45s, num steps 105412429, FPS 421, episode reward -2382.0316954362584, episode length 101
Time 21h 35m 46s, num steps 105434474, FPS 421, episode reward -4870.9847189795055, episode length 204
Time 21h 36m 48s, num steps 105457274, FPS 421, episode reward -5434.724211913019, episode length 394
Time 21h 37m 48s, num steps 105479052, FPS 421, episode reward -2359.628501009234, episode length 100
Time 21h 38m 48s, num steps 105501154, FPS 421, episode reward -2359.628501009234, episode length 100
Time 21h 39m 49s, num steps 105522695, FPS 421, episode reward nan, episode length 126
Time 21h 40m 50s, num steps 105544724, FPS 421, episode reward -2359.628501009234, episode length 100
Time 21h 41m 50s, num steps 105566843, FPS 421, episode reward -3378.4052898361065, episode length 140
Time 21h 42m 51s, num steps 105589707, FPS 421, episode reward -2359.628501009234, episode length 100
Time 21h 43m 52s, num steps 105612156, FPS 421, episode reward -5446.844992857843, episode len

Time 22h 59m 15s, num steps 107266065, FPS 420, episode reward nan, episode length 149
Time 23h 00m 16s, num steps 107288358, FPS 420, episode reward -4334.75905684863, episode length 180
Time 23h 01m 16s, num steps 107310336, FPS 420, episode reward -3251.518648333766, episode length 135
Time 23h 02m 18s, num steps 107332958, FPS 420, episode reward -5427.923585158258, episode length 353
Time 23h 03m 19s, num steps 107355743, FPS 420, episode reward -5432.732281905084, episode length 382
Time 23h 04m 21s, num steps 107378239, FPS 420, episode reward -5449.335581999689, episode length 482
Time 23h 05m 22s, num steps 107400280, FPS 420, episode reward -2359.628501009234, episode length 100
Time 23h 06m 23s, num steps 107423177, FPS 420, episode reward -5432.234442931085, episode length 379
Time 23h 07m 25s, num steps 107445872, FPS 420, episode reward -5426.431864958673, episode length 344
Time 23h 08m 25s, num steps 107468117, FPS 420, episode reward -3428.074237175142, episode length 

Time 00h 23m 38s, num steps 109122055, FPS 419, episode reward -2359.628501009234, episode length 100
Time 00h 24m 38s, num steps 109143936, FPS 419, episode reward -3145.799187608007, episode length 131
Time 00h 25m 39s, num steps 109166261, FPS 419, episode reward -3981.033210450378, episode length 166
Time 00h 26m 40s, num steps 109188253, FPS 419, episode reward -2359.628501009234, episode length 100
Time 00h 27m 40s, num steps 109210305, FPS 419, episode reward -3199.2425101473264, episode length 133
Time 00h 28m 41s, num steps 109232379, FPS 419, episode reward nan, episode length 133
Time 00h 29m 42s, num steps 109254727, FPS 419, episode reward -5435.388308745294, episode length 398
Time 00h 30m 43s, num steps 109276882, FPS 419, episode reward nan, episode length 137
Time 00h 31m 43s, num steps 109299397, FPS 419, episode reward -2359.628501009234, episode length 100
Time 00h 32m 44s, num steps 109321356, FPS 419, episode reward nan, episode length 137
Time 00h 33m 45s, num st

Time 01h 47m 56s, num steps 110969157, FPS 418, episode reward -2359.628501009234, episode length 100
Time 01h 48m 56s, num steps 110991893, FPS 418, episode reward -3378.4052898361065, episode length 140
Time 01h 49m 57s, num steps 111015101, FPS 418, episode reward -2359.628501009234, episode length 100
Time 01h 50m 58s, num steps 111038303, FPS 418, episode reward -5438.210868101984, episode length 415
Time 01h 51m 59s, num steps 111061041, FPS 418, episode reward -3592.7193457545322, episode length 149
Time 01h 53m 00s, num steps 111082729, FPS 418, episode reward -2359.628501009234, episode length 100
Time 01h 54m 00s, num steps 111105020, FPS 418, episode reward -2359.628501009234, episode length 100
Time 01h 55m 01s, num steps 111127341, FPS 418, episode reward -3118.7238517477576, episode length 130
Time 01h 56m 01s, num steps 111149029, FPS 418, episode reward -2359.628501009234, episode length 100
Time 01h 57m 02s, num steps 111171379, FPS 418, episode reward nan, episode len

Time 03h 11m 31s, num steps 112813080, FPS 417, episode reward -5434.558196288019, episode length 393
Time 03h 12m 32s, num steps 112835847, FPS 417, episode reward -2382.0316954362584, episode length 101
Time 03h 13m 32s, num steps 112857916, FPS 417, episode reward -2473.2160182689036, episode length 105
Time 03h 14m 33s, num steps 112880226, FPS 417, episode reward nan, episode length 101
Time 03h 15m 33s, num steps 112902741, FPS 417, episode reward nan, episode length 102
Time 03h 16m 34s, num steps 112925269, FPS 417, episode reward -2359.628501009234, episode length 100
Time 03h 17m 34s, num steps 112947122, FPS 417, episode reward nan, episode length 102
Time 03h 18m 36s, num steps 112969012, FPS 417, episode reward -5433.728154402643, episode length 388
Time 03h 19m 37s, num steps 112991286, FPS 417, episode reward -5434.226170760065, episode length 391
Time 03h 20m 39s, num steps 113013358, FPS 417, episode reward -5434.392182570367, episode length 392
Time 03h 21m 40s, num s

Time 04h 35m 00s, num steps 114646376, FPS 416, episode reward -2359.628501009234, episode length 100
Time 04h 36m 02s, num steps 114668743, FPS 416, episode reward -5441.199610930353, episode length 433
Time 04h 37m 03s, num steps 114691161, FPS 416, episode reward -3547.6787915895197, episode length 147
Time 04h 38m 05s, num steps 114713857, FPS 416, episode reward -5440.203368407159, episode length 427
Time 04h 39m 06s, num steps 114736216, FPS 416, episode reward -5440.535456877618, episode length 429
Time 04h 40m 07s, num steps 114758417, FPS 416, episode reward -2359.628501009234, episode length 100
Time 04h 41m 09s, num steps 114780806, FPS 416, episode reward -5441.531691771417, episode length 435
Time 04h 42m 10s, num steps 114803308, FPS 416, episode reward -5445.018555861383, episode length 456
Time 04h 43m 12s, num steps 114825815, FPS 416, episode reward -5431.404910307794, episode length 374
Time 04h 44m 13s, num steps 114848135, FPS 416, episode reward -5431.239041548639

Time 05h 59m 34s, num steps 116491605, FPS 415, episode reward -4738.3498260679935, episode length 198
Time 06h 00m 35s, num steps 116514123, FPS 415, episode reward -5431.736685973077, episode length 376
Time 06h 01m 37s, num steps 116536883, FPS 415, episode reward -5441.86377451983, episode length 437
Time 06h 02m 38s, num steps 116559255, FPS 415, episode reward -5430.409894209772, episode length 368
Time 06h 03m 40s, num steps 116581369, FPS 415, episode reward -5430.575690489679, episode length 369
Time 06h 04m 41s, num steps 116603192, FPS 415, episode reward -4287.1203791415755, episode length 178
Time 06h 05m 42s, num steps 116625520, FPS 415, episode reward -4488.792569992787, episode length 187
Time 06h 06m 42s, num steps 116647528, FPS 415, episode reward -4210.404950313592, episode length 175
Time 06h 07m 44s, num steps 116669653, FPS 415, episode reward -5428.4209644612365, episode length 356
Time 06h 08m 45s, num steps 116692381, FPS 415, episode reward -5432.06851313677

Time 07h 22m 10s, num steps 118305154, FPS 414, episode reward -5440.535456877618, episode length 429
Time 07h 23m 12s, num steps 118327826, FPS 414, episode reward -5464.943286162286, episode length 576
Time 07h 24m 14s, num steps 118350586, FPS 414, episode reward -5440.701497298151, episode length 430
Time 07h 25m 14s, num steps 118372354, FPS 414, episode reward -3091.4665125086394, episode length 129
Time 07h 26m 16s, num steps 118394833, FPS 414, episode reward -5439.8712799367, episode length 425
Time 07h 27m 16s, num steps 118417136, FPS 414, episode reward -3724.853477893684, episode length 155
Time 07h 28m 19s, num steps 118440029, FPS 414, episode reward -5465.10932467547, episode length 577
Time 07h 29m 20s, num steps 118462524, FPS 414, episode reward -5371.802561041384, episode length 231
Time 07h 30m 21s, num steps 118484732, FPS 414, episode reward -4334.75905684863, episode length 180
Time 07h 31m 22s, num steps 118507093, FPS 414, episode reward -5431.570790511041, ep

Time 08h 46m 52s, num steps 120152031, FPS 413, episode reward nan, episode length 103
Time 08h 47m 53s, num steps 120174226, FPS 413, episode reward nan, episode length 104
Time 08h 48m 55s, num steps 120196613, FPS 413, episode reward -5438.8750297841125, episode length 419
Time 08h 49m 57s, num steps 120217443, FPS 413, episode reward -5432.068513136774, episode length 378
Time 08h 50m 59s, num steps 120237650, FPS 413, episode reward -5435.554331999689, episode length 399
Time 08h 52m 01s, num steps 120258282, FPS 413, episode reward -5431.239041548639, episode length 373
Time 08h 53m 01s, num steps 120276908, FPS 413, episode reward -2404.58579547247, episode length 102
Time 08h 54m 02s, num steps 120295954, FPS 413, episode reward -4287.1203791415755, episode length 178
Time 08h 55m 04s, num steps 120315539, FPS 413, episode reward -5447.343110304742, episode length 470
Time 08h 56m 05s, num steps 120335012, FPS 413, episode reward nan, episode length 106
Time 08h 57m 06s, num st

Time 10h 14m 41s, num steps 121680163, FPS 411, episode reward -5448.007264357477, episode length 474
Time 10h 15m 42s, num steps 121697724, FPS 411, episode reward -5445.018555861383, episode length 456
Time 10h 16m 45s, num steps 121715536, FPS 411, episode reward -5465.2753631886535, episode length 578
Time 10h 17m 45s, num steps 121732067, FPS 411, episode reward nan, episode length 135
Time 10h 18m 46s, num steps 121748906, FPS 411, episode reward nan, episode length 130
Time 10h 19m 47s, num steps 121766555, FPS 411, episode reward -5437.546712141901, episode length 411
Time 10h 20m 50s, num steps 121784379, FPS 411, episode reward -5464.113101225763, episode length 571
Time 10h 21m 50s, num steps 121801711, FPS 411, episode reward nan, episode length 135
Time 10h 22m 52s, num steps 121819671, FPS 411, episode reward -5463.614995222955, episode length 568
Time 10h 23m 53s, num steps 121837066, FPS 411, episode reward -3428.074237175142, episode length 142
Time 10h 24m 53s, num st

Time 11h 39m 58s, num steps 123147102, FPS 409, episode reward nan, episode length 103
Time 11h 40m 59s, num steps 123164472, FPS 409, episode reward -3251.518648333766, episode length 135
Time 11h 42m 00s, num steps 123182192, FPS 409, episode reward -5426.100529890924, episode length 342
Time 11h 43m 00s, num steps 123199416, FPS 409, episode reward nan, episode length 103
Time 11h 44m 01s, num steps 123217077, FPS 409, episode reward -5426.100529890924, episode length 342
Time 11h 45m 02s, num steps 123234639, FPS 409, episode reward -3302.5937644912797, episode length 137
Time 11h 46m 02s, num steps 123252221, FPS 409, episode reward -3327.9670707656865, episode length 138
Time 11h 47m 04s, num steps 123269893, FPS 409, episode reward -5426.100529890924, episode length 342
Time 11h 48m 04s, num steps 123287524, FPS 409, episode reward nan, episode length 134
Time 11h 49m 06s, num steps 123304659, FPS 409, episode reward -5428.586753111749, episode length 357
Time 11h 50m 07s, num s

Time 13h 02m 02s, num steps 124600873, FPS 407, episode reward -3452.5957993937895, episode length 143
Time 13h 03m 03s, num steps 124618615, FPS 407, episode reward -3428.074237175142, episode length 142
Time 13h 04m 04s, num steps 124635951, FPS 407, episode reward -3353.24075824756, episode length 139
Time 13h 05m 05s, num steps 124653749, FPS 407, episode reward -5435.720357161432, episode length 400
Time 13h 06m 06s, num steps 124671201, FPS 407, episode reward -3428.074237175142, episode length 142
Time 13h 07m 06s, num steps 124688596, FPS 407, episode reward -3403.355944223571, episode length 141
Time 13h 08m 07s, num steps 124705706, FPS 407, episode reward -3403.355944223571, episode length 141
Time 13h 09m 07s, num steps 124723241, FPS 407, episode reward -3428.074237175142, episode length 142
Time 13h 10m 08s, num steps 124740691, FPS 407, episode reward -5426.597539168268, episode length 345
Time 13h 11m 10s, num steps 124758337, FPS 407, episode reward -5430.741503935724,

Time 14h 24m 18s, num steps 126017376, FPS 405, episode reward -2637.681960530777, episode length 112
Time 14h 25m 19s, num steps 126034826, FPS 405, episode reward -3199.2425101473264, episode length 133
Time 14h 26m 19s, num steps 126052476, FPS 405, episode reward -3199.2425101473264, episode length 133
Time 14h 27m 20s, num steps 126069871, FPS 405, episode reward -3172.6484010889517, episode length 132
Time 14h 28m 20s, num steps 126086301, FPS 405, episode reward -3199.2425101473264, episode length 133
Time 14h 29m 21s, num steps 126103496, FPS 405, episode reward -3172.6484010889517, episode length 132
Time 14h 30m 21s, num steps 126119926, FPS 405, episode reward -3277.171001143663, episode length 136
Time 14h 31m 22s, num steps 126136101, FPS 405, episode reward -3199.2425101473264, episode length 133
Time 14h 32m 23s, num steps 126152847, FPS 405, episode reward -5435.388308745294, episode length 398
Time 14h 33m 25s, num steps 126169762, FPS 405, episode reward -5446.5129177

Time 15h 45m 13s, num steps 127393533, FPS 403, episode reward -3036.374576158774, episode length 127
Time 15h 46m 14s, num steps 127411807, FPS 403, episode reward -3036.374576158774, episode length 127
Time 15h 47m 15s, num steps 127430181, FPS 403, episode reward -5441.033574324518, episode length 432
Time 15h 48m 16s, num steps 127448145, FPS 403, episode reward -2427.3117211560943, episode length 103
Time 15h 49m 16s, num steps 127466086, FPS 403, episode reward nan, episode length 103
Time 15h 50m 18s, num steps 127484313, FPS 403, episode reward -5452.988438826471, episode length 504
Time 15h 51m 19s, num steps 127502764, FPS 403, episode reward -5448.007264357477, episode length 474
Time 15h 52m 20s, num steps 127520436, FPS 403, episode reward -2473.2160182689036, episode length 105
Time 15h 53m 21s, num steps 127538608, FPS 403, episode reward -4311.391180922448, episode length 179
Time 15h 54m 21s, num steps 127556315, FPS 403, episode reward -4334.75905684863, episode lengt

Time 17h 07m 06s, num steps 128797924, FPS 401, episode reward -3225.541353650318, episode length 134
Time 17h 08m 06s, num steps 128815362, FPS 401, episode reward -3225.541353650318, episode length 134
Time 17h 09m 07s, num steps 128832980, FPS 401, episode reward -3225.541353650318, episode length 134
Time 17h 10m 07s, num steps 128850385, FPS 401, episode reward -2519.5420729605826, episode length 107
Time 17h 11m 08s, num steps 128867831, FPS 401, episode reward -3199.2425101473264, episode length 133
Time 17h 12m 08s, num steps 128884917, FPS 401, episode reward -3225.541353650318, episode length 134
Time 17h 13m 09s, num steps 128902437, FPS 401, episode reward -3225.541353650318, episode length 134
Time 17h 14m 09s, num steps 128919975, FPS 401, episode reward -3251.518648333766, episode length 135
Time 17h 15m 10s, num steps 128937426, FPS 401, episode reward nan, episode length 118
Time 17h 16m 10s, num steps 128955122, FPS 401, episode reward -3251.518648333766, episode leng

### 4. Watch a Smart Agent!

In [None]:
# Load saved actor/critic weights, replay one (capped) episode with rendering,
# and display the final frame.
#
# NOTE(review): `agent` is not defined in any cell visible in this notebook (the
# setup cell builds `shared_model`), and `actor_local` / `critic_local` together
# with the checkpoint file names look carried over from a different template.
# Confirm where `agent` and the .pth files come from; as written this cell is
# expected to fail on a fresh kernel unless another cell defines them.

# The setup cell sets CUDA_VISIBLE_DEVICES to "", so force tensors onto the CPU
# while deserializing; otherwise checkpoints saved from a CUDA device cannot load.
agent.actor_local.load_state_dict(torch.load('checkpoint_actor.pth', map_location='cpu'))
agent.critic_local.load_state_dict(torch.load('checkpoint_critic.pth', map_location='cpu'))

# Upper bound on the number of rendered steps. The training log above reports
# episodes longer than this, so long episodes are cut short here.
MAX_RENDER_STEPS = 200

state = env.reset()
for _step in range(MAX_RENDER_STEPS):
    action = agent.act(state, add_noise=False)
    env.render()
    state, reward, done, _ = env.step(action)
    print(reward, done)
    if done:
        break

# assumes env.render() returns an image-like object exposing .show() — TODO confirm
img = env.render()
img.show()
# NOTE(review): env.close() was left disabled in the original; confirm whether the
# environment should be closed once the final frame has been shown.
#env.close()

### 5. Explore

In this exercise, we have provided a sample A3C agent and demonstrated how to use it to solve an OpenAI Gym environment.  To continue your learning, you are encouraged to complete any (or all!) of the following tasks:
- Amend the various hyperparameters and network architecture to see if you can get your agent to solve the environment faster than this benchmark implementation.  Once you build intuition for the hyperparameters that work well with this environment, try solving a different OpenAI Gym task!
- Write your own A3C implementation.  Use this code as reference only when needed -- try as much as you can to write your own algorithm from scratch.
- You may also like to implement prioritized experience replay, to see if it speeds learning.  
- The current implementation adds Ornstein-Uhlenbeck noise to the action space.  However, it has [been shown](https://blog.openai.com/better-exploration-with-parameter-noise/) that adding noise to the parameters of the neural network policy can improve performance.  Make this change to the code, to verify it for yourself!
- Write a blog post explaining the intuition behind the A3C algorithm and demonstrating how to use it to solve an RL environment of your choosing.  