In [1]:
import importlib
import importlib.util
import sys
from datetime import datetime
from pathlib import Path

import numpy as np
import pandas as pd
import pytz

# --- Locations ---------------------------------------------------------------
# Repository root; every other path below is derived from it.
MAIN_PATH = "/home/sequenzia/dev/repos/atari-rl"

# Name of the helper module under <MAIN_PATH>/utils that is loaded from file.
MODULE_NAME = "infer"

# --- Evaluation settings (all forwarded to infer.infer further down) ---------
N_ENVS = 5          # passed as n_envs
N_STEPS = 100_000   # passed as n_steps
NO_RENDER = True    # passed as no_render

# --- Experiment tracking (also forwarded to infer.infer) ---------------------
PROJECT = "Solen-Project-Eval"  # passed as project
WANDB_ON = True                 # passed as wandb_on

# --- Derived paths -----------------------------------------------------------
data_path = f"{MAIN_PATH}/data"        # evaluation results are written below this
agents_path = f"{MAIN_PATH}/agents"    # handed to infer.infer as agents_path
module_path = f"{MAIN_PATH}/utils/{MODULE_NAME}.py"  # source file of the helper module

# Load the helper module directly from its source file so it can be used
# without being installed as a package or being reachable via sys.path.
spec = importlib.util.spec_from_file_location(MODULE_NAME, module_path)

# spec_from_file_location returns None when no loader can handle the path, and
# a spec may carry no loader; fail here with a clear message instead of an
# AttributeError on None a few lines later.
if spec is None or spec.loader is None:
    raise ImportError(f"Cannot load module {MODULE_NAME!r} from {module_path}")

infer = importlib.util.module_from_spec(spec)

# Register the module before executing it so that any `import` of MODULE_NAME
# triggered while (or after) its code runs resolves to this same object.
sys.modules[MODULE_NAME] = infer
spec.loader.exec_module(infer)

# Algorithms to evaluate; each one is run against every entry in GAMES.
ALGOS = [
    "ppo",
]

# Atari titles to evaluate. The evaluation loop turns each name into the
# environment id "ALE/<name>-v5" and a lower-cased parquet file name.
GAMES = [
    "Breakout",
    "Pong",
    "SpaceInvaders",
    "Qbert",
    "Seaquest",
    "Centipede",
    "MsPacman",
    "Asterix",
    "Asteroids",
    "Assault",
]

# Single timestamp for the whole run, expressed in US/Eastern wall-clock time.
# It names the output directory and is stored in the "ts" column of every
# saved table, so all games evaluated in this run share the same value.
ts = (
    datetime.now(pytz.timezone('UTC'))
    .astimezone(pytz.timezone('US/Eastern'))
    .strftime("%Y-%m-%d-%H-%M-%S")
)

# Evaluate every (algorithm, game) pair and write one parquet file per pair to
# <data_path>/evals/<ALGO>_<ts>/<game>.parquet.
for algo in ALGOS:

    for game in GAMES:

        ENV_ID = f"ALE/{game}-v5"
        RUN_KEY = f"{algo.upper()}_{game}"

        output_path = f"{data_path}/evals/{algo.upper()}_{ts}/{game.lower()}.parquet"

        # Create the run directory before the evaluation starts so the save at
        # the end cannot fail on a missing parent directory.
        Path(output_path).parent.mkdir(parents=True, exist_ok=True)

        infer_logs = infer.infer(run_key=RUN_KEY,
                                 env_id=ENV_ID,
                                 algo=algo,
                                 game=game,
                                 agents_path=agents_path,
                                 n_envs=N_ENVS,
                                 n_steps=N_STEPS,
                                 no_render=NO_RENDER,
                                 project=PROJECT,
                                 wandb_on=WANDB_ON,
                                 debug_on=False)

        # Build one (n_rows, 5) array per returned log: the five per-log
        # sequences become the five columns after the transpose.
        # Index access is kept (rather than iterating infer_logs directly)
        # because the container type returned by infer.infer is not visible
        # in this file.
        log_arrays = [
            np.array([infer_logs[idx].scores,
                      infer_logs[idx].times,
                      infer_logs[idx].lengths,
                      infer_logs[idx].frame_numbers,
                      infer_logs[idx].run_frame_numbers]).T
            for idx in range(len(infer_logs))
        ]

        # Stack everything in a single call instead of re-copying a growing
        # array on every iteration. The leading empty float block keeps the
        # result a float array of shape (0, 5) when no logs were returned.
        infer_data_np = np.vstack([np.empty((0, 5)), *log_arrays])

        infer_data = pd.DataFrame(infer_data_np,
                                  columns=["scores",
                                           "times",
                                           "lengths",
                                           "frame_numbers",
                                           "run_frame_numbers"])

        # Tag every row with the run it came from so the per-game files can be
        # concatenated later without losing provenance.
        infer_data["run_key"] = RUN_KEY
        infer_data["game"] = game
        infer_data["algo"] = algo
        infer_data["ts"] = ts

        print(f"Saving to {output_path}")
        infer_data.to_parquet(output_path)
        



Loading ----> /home/sequenzia/dev/repos/atari-rl/agents/ppo/ALE-Breakout-v5_1/best_model.zip



A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]


Stacking 4 frames


PPO_Breakout: 1 EPISODE: 1
Episode Score: 32.00
Episode Length: 907


PPO_Breakout: 4 EPISODE: 1
Episode Score: 45.00
Episode Length: 1047


PPO_Breakout: 5 EPISODE: 1
Episode Score: 40.00
Episode Length: 1169


PPO_Breakout: 2 EPISODE: 1
Episode Score: 67.00
Episode Length: 1227


PPO_Breakout: 3 EPISODE: 1
Episode Score: 69.00
Episode Length: 1454


PPO_Breakout: 5 EPISODE: 2
Episode Score: 23.00
Episode Length: 870


PPO_Breakout: 1 EPISODE: 2
Episode Score: 40.00
Episode Length: 1159


PPO_Breakout: 2 EPISODE: 2
Episode Score: 23.00
Episode Length: 826


PPO_Breakout: 4 EPISODE: 2
Episode Score: 47.00
Episode Length: 1223


PPO_Breakout: 5 EPISODE: 3
Episode Score: 13.00
Episode Length: 503


PPO_Breakout: 3 EPISODE: 2
Episode Score: 58.00
Episode Length: 1289


PPO_Breakout: 1 EPISODE: 3
Episode Score: 21.00
Episode Length: 819


PPO_Breakout: 2 EPISODE: 3
Episode Score: 28.00
Episode Length: 1136


PPO_Breakout: 4 EPISODE: 3
Episode Score: 39.00
Episode Length

Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.
[34m[1mwandb[0m: Currently logged in as: [33mappliedtheta[0m. Use [1m`wandb login --relogin`[0m to force relogin


VBox(children=(Label(value='0.002 MB of 0.002 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
PPO_Breakout/episode_length,▄▆▁▄▁▁█▆▇▃██▄▂▄▆▇▄▆▅▇▅▆▄▆▆▇▃█▃▃▆▆▆▂▅▇▂▆▅
PPO_Breakout/episode_score,▃▃▁▃▁▁█▄▆▂▅▇▃▂▄▅▅▅▅▄▆▄▅▃▄▆▇▃▇▂▂▆▃▆▁▃▇▂▅▄
episode_length,▄▆▁▄▁▁█▆▇▃██▄▂▄▆▇▄▆▅▇▅▆▄▆▆▇▃█▃▃▆▆▆▂▅▇▂▆▅
episode_lives,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
episode_score,▃▃▁▃▁▁█▄▆▂▅▇▃▂▄▅▅▅▅▄▆▄▅▃▄▆▇▃▇▂▂▆▃▆▁▃▇▂▅▄
episode_time,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
run_frame_number,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███

0,1
PPO_Breakout/episode_length,1014.0
PPO_Breakout/episode_score,37.0
episode_length,1014.0
episode_lives,0.0
episode_score,37.0
episode_time,1249.17547
run_frame_number,1714492.0


Saving to /home/sequenzia/dev/repos/atari-rl/data/evals/PPO_2024-02-14-14-40-20/breakout.parquet

Loading ----> /home/sequenzia/dev/repos/atari-rl/agents/ppo/ALE-Pong-v5_1/best_model.zip



A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]


Stacking 4 frames


PPO_Pong: 1 EPISODE: 1
Episode Score: 9.00
Episode Length: 4478


PPO_Pong: 2 EPISODE: 1
Episode Score: -5.00
Episode Length: 5823


PPO_Pong: 5 EPISODE: 1
Episode Score: 5.00
Episode Length: 5973


PPO_Pong: 3 EPISODE: 1
Episode Score: 1.00
Episode Length: 6390


PPO_Pong: 4 EPISODE: 1
Episode Score: 5.00
Episode Length: 7082


PPO_Pong: 1 EPISODE: 2
Episode Score: -3.00
Episode Length: 6354


PPO_Pong: 3 EPISODE: 2
Episode Score: 7.00
Episode Length: 4683


PPO_Pong: 2 EPISODE: 2
Episode Score: 4.00
Episode Length: 5340


PPO_Pong: 4 EPISODE: 2
Episode Score: 9.00
Episode Length: 4333


PPO_Pong: 5 EPISODE: 2
Episode Score: 4.00
Episode Length: 5831


PPO_Pong: 5 EPISODE: 3
Episode Score: -10.00
Episode Length: 4503


PPO_Pong: 4 EPISODE: 3
Episode Score: 8.00
Episode Length: 4940


PPO_Pong: 3 EPISODE: 3
Episode Score: -5.00
Episode Length: 5305


PPO_Pong: 1 EPISODE: 3
Episode Score: 7.00
Episode Length: 5779


PPO_Pong: 2 EPISODE: 3
Episode Score: 8.00
Episode 

VBox(children=(Label(value='0.002 MB of 0.008 MB uploaded\r'), FloatProgress(value=0.2789665376735716, max=1.0…

0,1
PPO_Pong/episode_length,▆▃▇▆▂▆▃▅▂▂▂▅▁▃▂▅▄▆▅▇▅▁▇▂▇▅▆▂▃▃▄▃█▄▁▁▇▅▂▅
PPO_Pong/episode_score,▃▆▄▄▁▃▂▃▅▁▇▅▆▃█▂▃▄▆▃▂▇▃▄▅▅▃▅▅▅▆▃▃▂▆▆▃▅▆▇
episode_length,▆▃▇▆▂▆▃▅▂▂▂▅▁▃▂▅▄▆▅▇▅▁▇▂▇▅▆▂▃▃▄▃█▄▁▁▇▅▂▅
episode_lives,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
episode_score,▃▆▄▄▁▃▂▃▅▁▇▅▆▃█▂▃▄▆▃▂▇▃▄▅▅▃▅▅▅▆▃▃▂▆▆▃▅▆▇
episode_time,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
run_frame_number,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███

0,1
PPO_Pong/episode_length,5884.0
PPO_Pong/episode_score,11.0
episode_length,5884.0
episode_lives,0.0
episode_score,11.0
episode_time,1088.82102
run_frame_number,1606200.0


Saving to /home/sequenzia/dev/repos/atari-rl/data/evals/PPO_2024-02-14-14-40-20/pong.parquet

Loading ----> /home/sequenzia/dev/repos/atari-rl/agents/ppo/ALE-SpaceInvaders-v5_1/best_model.zip



A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]


Stacking 4 frames


PPO_SpaceInvaders: 3 EPISODE: 1
Episode Score: 600.00
Episode Length: 1077


PPO_SpaceInvaders: 1 EPISODE: 1
Episode Score: 1155.00
Episode Length: 1266


PPO_SpaceInvaders: 2 EPISODE: 1
Episode Score: 1115.00
Episode Length: 1468


PPO_SpaceInvaders: 5 EPISODE: 1
Episode Score: 1350.00
Episode Length: 1494


PPO_SpaceInvaders: 4 EPISODE: 1
Episode Score: 1100.00
Episode Length: 1832


PPO_SpaceInvaders: 5 EPISODE: 2
Episode Score: 580.00
Episode Length: 957


PPO_SpaceInvaders: 3 EPISODE: 2
Episode Score: 1340.00
Episode Length: 1415


PPO_SpaceInvaders: 1 EPISODE: 2
Episode Score: 1295.00
Episode Length: 1260


PPO_SpaceInvaders: 2 EPISODE: 2
Episode Score: 1155.00
Episode Length: 1483


PPO_SpaceInvaders: 5 EPISODE: 3
Episode Score: 550.00
Episode Length: 789


PPO_SpaceInvaders: 4 EPISODE: 2
Episode Score: 1350.00
Episode Length: 1383


PPO_SpaceInvaders: 1 EPISODE: 3
Episode Score: 1185.00
Episode Length: 1219


PPO_SpaceInvaders: 3 EPISODE: 3
Episode Score: 12

VBox(children=(Label(value='0.002 MB of 0.002 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
PPO_SpaceInvaders/episode_length,▂▆▅▃▁▄▅██▆▆▆▆▄▆▅▂▃▅▅▄▆▆▂▅▄▆▁▁▇▃▆▅▄▃▅▃▆▅▇
PPO_SpaceInvaders/episode_score,▄▅▆▂▂▄▅▆▇▄▆▆▅▇▇▄▃▂▇▅▄▅▇▂▆▅▆▁▁█▄▇▆▄▃▄▃▇▆▅
episode_length,▂▆▅▃▁▄▅██▆▆▆▆▄▆▅▂▃▅▅▄▆▆▂▅▄▆▁▁▇▃▆▅▄▃▅▃▆▅▇
episode_lives,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
episode_score,▄▅▆▂▂▄▅▆▇▄▆▆▅▇▇▄▃▂▇▅▄▅▇▂▆▅▆▁▁█▄▇▆▄▃▄▃▇▆▅
episode_time,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
run_frame_number,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███

0,1
PPO_SpaceInvaders/episode_length,1325.0
PPO_SpaceInvaders/episode_score,975.0
episode_length,1325.0
episode_lives,0.0
episode_score,975.0
episode_time,1132.5068
run_frame_number,1657828.0


Saving to /home/sequenzia/dev/repos/atari-rl/data/evals/PPO_2024-02-14-14-40-20/spaceinvaders.parquet

Loading ----> /home/sequenzia/dev/repos/atari-rl/agents/ppo/ALE-Qbert-v5_1/best_model.zip



A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]


Stacking 4 frames


PPO_Qbert: 2 EPISODE: 1
Episode Score: 7750.00
Episode Length: 1241


PPO_Qbert: 1 EPISODE: 1
Episode Score: 16825.00
Episode Length: 2170


PPO_Qbert: 3 EPISODE: 1
Episode Score: 28900.00
Episode Length: 3482


PPO_Qbert: 5 EPISODE: 1
Episode Score: 29075.00
Episode Length: 3680


PPO_Qbert: 4 EPISODE: 1
Episode Score: 28500.00
Episode Length: 3789


PPO_Qbert: 2 EPISODE: 2
Episode Score: 29425.00
Episode Length: 3620


PPO_Qbert: 1 EPISODE: 2
Episode Score: 29375.00
Episode Length: 3636


PPO_Qbert: 2 EPISODE: 3
Episode Score: 4375.00
Episode Length: 1005


PPO_Qbert: 3 EPISODE: 2
Episode Score: 16525.00
Episode Length: 2500


PPO_Qbert: 5 EPISODE: 2
Episode Score: 28775.00
Episode Length: 3395


PPO_Qbert: 4 EPISODE: 2
Episode Score: 29450.00
Episode Length: 3563


PPO_Qbert: 1 EPISODE: 3
Episode Score: 16425.00
Episode Length: 2395


PPO_Qbert: 3 EPISODE: 3
Episode Score: 19700.00
Episode Length: 2445


PPO_Qbert: 2 EPISODE: 4
Episode Score: 29425.00
Episode Len

VBox(children=(Label(value='0.002 MB of 0.002 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
PPO_Qbert/episode_length,▁▇▇▇▇▇▇▇▇█▇▆▇▇█▇▇▇▆▇▇▄▇▆▇██▄▇█▇██▆▆█▇▇▇▆
PPO_Qbert/episode_score,▁████▇█████▇██████▇██▅█▇███▄█████▅▆▇████
episode_length,▁▇▇▇▇▇▇▇▇█▇▆▇▇█▇▇▇▆▇▇▄▇▆▇██▄▇█▇██▆▆█▇▇▇▆
episode_lives,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
episode_score,▁████▇█████▇██████▇██▅█▇███▄█████▅▆▇████
episode_time,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
run_frame_number,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███

0,1
PPO_Qbert/episode_length,2775.0
PPO_Qbert/episode_score,23250.0
episode_length,2775.0
episode_lives,0.0
episode_score,23250.0
episode_time,1163.072
run_frame_number,1624621.0


Saving to /home/sequenzia/dev/repos/atari-rl/data/evals/PPO_2024-02-14-14-40-20/qbert.parquet

Loading ----> /home/sequenzia/dev/repos/atari-rl/agents/ppo/ALE-Seaquest-v5_1/best_model.zip



A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]


Stacking 4 frames


PPO_Seaquest: 2 EPISODE: 1
Episode Score: 1800.00
Episode Length: 2255


PPO_Seaquest: 5 EPISODE: 1
Episode Score: 2720.00
Episode Length: 2439


PPO_Seaquest: 4 EPISODE: 1
Episode Score: 2180.00
Episode Length: 2743


PPO_Seaquest: 1 EPISODE: 1
Episode Score: 3460.00
Episode Length: 3047


PPO_Seaquest: 3 EPISODE: 1
Episode Score: 3760.00
Episode Length: 3103


PPO_Seaquest: 2 EPISODE: 2
Episode Score: 2180.00
Episode Length: 2759


PPO_Seaquest: 4 EPISODE: 2
Episode Score: 2000.00
Episode Length: 2503


PPO_Seaquest: 5 EPISODE: 2
Episode Score: 3260.00
Episode Length: 2883


PPO_Seaquest: 3 EPISODE: 2
Episode Score: 3280.00
Episode Length: 2783


PPO_Seaquest: 1 EPISODE: 2
Episode Score: 4200.00
Episode Length: 3367


PPO_Seaquest: 4 EPISODE: 3
Episode Score: 1800.00
Episode Length: 2367


PPO_Seaquest: 2 EPISODE: 3
Episode Score: 3580.00
Episode Length: 3007


PPO_Seaquest: 5 EPISODE: 3
Episode Score: 4080.00
Episode Length: 3343


PPO_Seaquest: 3 EPISODE: 3
Epis

VBox(children=(Label(value='0.002 MB of 0.002 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
PPO_Seaquest/episode_length,▅▂▄▅▇▇▅▅▅▃▅▇▃▅▇▃▄▇▃▁▆▅█▇▇▇▆▇▇▃▃▆▂▆▃▇▅▂▅▅
PPO_Seaquest/episode_score,▅▃▅▆▇▇▅▃▃▂▆▇▂▅█▃▄█▂▁▆▃█▇▇▇▅▇▇▄▂▆▁▆▂▆▆▂▃▅
episode_length,▅▂▄▅▇▇▅▅▅▃▅▇▃▅▇▃▄▇▃▁▆▅█▇▇▇▆▇▇▃▃▆▂▆▃▇▅▂▅▅
episode_lives,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
episode_score,▅▃▅▆▇▇▅▃▃▂▆▇▂▅█▃▄█▂▁▆▃█▇▇▇▅▇▇▄▂▆▁▆▂▆▆▂▃▅
episode_time,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
run_frame_number,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███

0,1
PPO_Seaquest/episode_length,3191.0
PPO_Seaquest/episode_score,3680.0
episode_length,3191.0
episode_lives,0.0
episode_score,3680.0
episode_time,1167.31285
run_frame_number,1631390.0


Saving to /home/sequenzia/dev/repos/atari-rl/data/evals/PPO_2024-02-14-14-40-20/seaquest.parquet

Loading ----> /home/sequenzia/dev/repos/atari-rl/agents/ppo/ALE-Centipede-v5_1/best_model.zip



A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]


Stacking 4 frames


PPO_Centipede: 1 EPISODE: 1
Episode Score: 8017.00
Episode Length: 851


PPO_Centipede: 3 EPISODE: 1
Episode Score: 6922.00
Episode Length: 1182


PPO_Centipede: 4 EPISODE: 1
Episode Score: 14014.00
Episode Length: 1731


PPO_Centipede: 5 EPISODE: 1
Episode Score: 15661.00
Episode Length: 1891


PPO_Centipede: 1 EPISODE: 2
Episode Score: 7450.00
Episode Length: 1259


PPO_Centipede: 2 EPISODE: 1
Episode Score: 17460.00
Episode Length: 2248


PPO_Centipede: 4 EPISODE: 2
Episode Score: 5382.00
Episode Length: 695


PPO_Centipede: 5 EPISODE: 2
Episode Score: 5386.00
Episode Length: 1049


PPO_Centipede: 3 EPISODE: 2
Episode Score: 11181.00
Episode Length: 1808


PPO_Centipede: 1 EPISODE: 3
Episode Score: 6305.00
Episode Length: 1208


PPO_Centipede: 4 EPISODE: 3
Episode Score: 9979.00
Episode Length: 1060


PPO_Centipede: 2 EPISODE: 2
Episode Score: 5898.00
Episode Length: 1225


PPO_Centipede: 5 EPISODE: 3
Episode Score: 7865.00
Episode Length: 1403


PPO_Centipede: 3

VBox(children=(Label(value='0.002 MB of 0.002 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
PPO_Centipede/episode_length,▅▆▅▄▃▃▁█▄▃▄▇▄▃▃▃▅▄▄▅▃▆▅▆▂▇▄▂▂▃▄▅▂▃▄▆▄▃▄▂
PPO_Centipede/episode_score,▄▇▅▅▃▄▁█▃▄▃█▄▃▄▃▅▄▄▆▃█▆█▂▇▅▂▃▄▄▄▃▃▄▇▄▄▄▃
episode_length,▅▆▅▄▃▃▁█▄▃▄▇▄▃▃▃▅▄▄▅▃▆▅▆▂▇▄▂▂▃▄▅▂▃▄▆▄▃▄▂
episode_lives,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
episode_score,▄▇▅▅▃▄▁█▃▄▃█▄▃▄▃▅▄▄▆▃█▆█▂▇▅▂▃▄▄▄▃▃▄▇▄▄▄▃
episode_time,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
run_frame_number,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███

0,1
PPO_Centipede/episode_length,881.0
PPO_Centipede/episode_score,5316.0
episode_length,881.0
episode_lives,0.0
episode_score,5316.0
episode_time,1178.53798
run_frame_number,1653846.0


Saving to /home/sequenzia/dev/repos/atari-rl/data/evals/PPO_2024-02-14-14-40-20/centipede.parquet

Loading ----> /home/sequenzia/dev/repos/atari-rl/agents/ppo/ALE-MsPacman-v5_1/best_model.zip



A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]


Stacking 4 frames


PPO_MsPacman: 5 EPISODE: 1
Episode Score: 2890.00
Episode Length: 1109


PPO_MsPacman: 4 EPISODE: 1
Episode Score: 4870.00
Episode Length: 1637


PPO_MsPacman: 3 EPISODE: 1
Episode Score: 4770.00
Episode Length: 1701


PPO_MsPacman: 1 EPISODE: 1
Episode Score: 5310.00
Episode Length: 1881


PPO_MsPacman: 2 EPISODE: 1
Episode Score: 3530.00
Episode Length: 1867


PPO_MsPacman: 5 EPISODE: 2
Episode Score: 2490.00
Episode Length: 1139


PPO_MsPacman: 2 EPISODE: 2
Episode Score: 3040.00
Episode Length: 969


PPO_MsPacman: 3 EPISODE: 2
Episode Score: 2190.00
Episode Length: 1171


PPO_MsPacman: 4 EPISODE: 2
Episode Score: 2660.00
Episode Length: 1311


PPO_MsPacman: 1 EPISODE: 2
Episode Score: 5630.00
Episode Length: 1679


PPO_MsPacman: 5 EPISODE: 3
Episode Score: 4110.00
Episode Length: 1583


PPO_MsPacman: 3 EPISODE: 3
Episode Score: 4250.00
Episode Length: 1427


PPO_MsPacman: 4 EPISODE: 3
Episode Score: 4830.00
Episode Length: 1677


PPO_MsPacman: 2 EPISODE: 3
Episo

VBox(children=(Label(value='0.002 MB of 0.002 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
PPO_MsPacman/episode_length,▆▅▁▃▅▆▁▃▂▃▂█▇▃▂▃▁▄▆▆▃▅▆▂▅▅▁▄▄▆▆▄▁█▂▅▆▄▁▅
PPO_MsPacman/episode_score,▄▅▁▂▄▅▂▂▂▁▄▇▅▂▁▂▂▅█▅▂▅▅▂▆▄▁▄▄▄▅▅▂▇▂▅▅▂▁▄
episode_length,▆▅▁▃▅▆▁▃▂▃▂█▇▃▂▃▁▄▆▆▃▅▆▂▅▅▁▄▄▆▆▄▁█▂▅▆▄▁▅
episode_lives,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
episode_score,▄▅▁▂▄▅▂▂▂▁▄▇▅▂▁▂▂▅█▅▂▅▅▂▆▄▁▄▄▄▅▅▂▇▂▅▅▂▁▄
episode_time,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
run_frame_number,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███

0,1
PPO_MsPacman/episode_length,1857.0
PPO_MsPacman/episode_score,5290.0
episode_length,1857.0
episode_lives,0.0
episode_score,5290.0
episode_time,1215.10011
run_frame_number,1622628.0


Saving to /home/sequenzia/dev/repos/atari-rl/data/evals/PPO_2024-02-14-14-40-20/mspacman.parquet

Loading ----> /home/sequenzia/dev/repos/atari-rl/agents/ppo/ALE-Asterix-v5_1/best_model.zip



A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]


Stacking 4 frames


PPO_Asterix: 4 EPISODE: 1
Episode Score: 1550.00
Episode Length: 881


PPO_Asterix: 5 EPISODE: 1
Episode Score: 2600.00
Episode Length: 1067


PPO_Asterix: 2 EPISODE: 1
Episode Score: 2900.00
Episode Length: 1134


PPO_Asterix: 1 EPISODE: 1
Episode Score: 3300.00
Episode Length: 1346


PPO_Asterix: 3 EPISODE: 1
Episode Score: 6000.00
Episode Length: 1832


PPO_Asterix: 2 EPISODE: 2
Episode Score: 2600.00
Episode Length: 1183


PPO_Asterix: 5 EPISODE: 2
Episode Score: 3000.00
Episode Length: 1503


PPO_Asterix: 2 EPISODE: 3
Episode Score: 1250.00
Episode Length: 661


PPO_Asterix: 3 EPISODE: 2
Episode Score: 4100.00
Episode Length: 1282


PPO_Asterix: 4 EPISODE: 2
Episode Score: 8900.00
Episode Length: 2693


PPO_Asterix: 5 EPISODE: 3
Episode Score: 3400.00
Episode Length: 1246


PPO_Asterix: 1 EPISODE: 2
Episode Score: 8900.00
Episode Length: 2603


PPO_Asterix: 2 EPISODE: 4
Episode Score: 3200.00
Episode Length: 1127


PPO_Asterix: 3 EPISODE: 3
Episode Score: 3500.

VBox(children=(Label(value='0.002 MB of 0.002 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
PPO_Asterix/episode_length,▃▂▃▅▃▅▅▃▅▂▄▃▇▃▇▅▃▄▄▂▃▃▁▃▃▄▃▃▇▇▃▅█▇▅▃▃▁▃▅
PPO_Asterix/episode_score,▂▂▃▄▂▅▅▃▅▂▄▂▇▃▇▅▃▂▃▂▃▃▁▂▂▅▃▃█▇▄▆██▅▃▃▁▂▅
episode_length,▃▂▃▅▃▅▅▃▅▂▄▃▇▃▇▅▃▄▄▂▃▃▁▃▃▄▃▃▇▇▃▅█▇▅▃▃▁▃▅
episode_lives,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
episode_score,▂▂▃▄▂▅▅▃▅▂▄▂▇▃▇▅▃▂▃▂▃▃▁▂▂▅▃▃█▇▄▆██▅▃▃▁▂▅
episode_time,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇███
run_frame_number,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇███

0,1
PPO_Asterix/episode_length,1193.0
PPO_Asterix/episode_score,2900.0
episode_length,1193.0
episode_lives,0.0
episode_score,2900.0
episode_time,1136.67259
run_frame_number,1623581.0


Saving to /home/sequenzia/dev/repos/atari-rl/data/evals/PPO_2024-02-14-14-40-20/asterix.parquet

Loading ----> /home/sequenzia/dev/repos/atari-rl/agents/ppo/ALE-Asteroids-v5_1/best_model.zip



A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]


Stacking 4 frames


PPO_Asteroids: 2 EPISODE: 1
Episode Score: 2250.00
Episode Length: 863


PPO_Asteroids: 4 EPISODE: 1
Episode Score: 2300.00
Episode Length: 903


PPO_Asteroids: 1 EPISODE: 1
Episode Score: 1950.00
Episode Length: 918


PPO_Asteroids: 5 EPISODE: 1
Episode Score: 1950.00
Episode Length: 970


PPO_Asteroids: 3 EPISODE: 1
Episode Score: 2250.00
Episode Length: 1036


PPO_Asteroids: 5 EPISODE: 2
Episode Score: 980.00
Episode Length: 471


PPO_Asteroids: 1 EPISODE: 2
Episode Score: 1490.00
Episode Length: 882


PPO_Asteroids: 4 EPISODE: 2
Episode Score: 2280.00
Episode Length: 925


PPO_Asteroids: 2 EPISODE: 2
Episode Score: 2000.00
Episode Length: 1330


PPO_Asteroids: 5 EPISODE: 3
Episode Score: 1280.00
Episode Length: 994


PPO_Asteroids: 1 EPISODE: 3
Episode Score: 2850.00
Episode Length: 1059


PPO_Asteroids: 2 EPISODE: 3
Episode Score: 1590.00
Episode Length: 706


PPO_Asteroids: 3 EPISODE: 2
Episode Score: 4020.00
Episode Length: 1816


PPO_Asteroids: 4 EPISODE: 3


VBox(children=(Label(value='0.002 MB of 0.002 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
PPO_Asteroids/episode_length,▇▂▅▄▄▄▄▄▄▄▂▆▃▃█▆▅▄▃▄▂▄▄▂▃▅▆▂▂▁▂▃▄▃▄▄▆▄▅▄
PPO_Asteroids/episode_score,█▁▅▅▄▆▅▄▇▆▁▅▂▅▇▄▄▅▆▆▁▇▄▂▆▄▅▂▁▂▂▆▃▄▃▅▇▄▄▃
episode_length,▇▂▅▄▄▄▄▄▄▄▂▆▃▃█▆▅▄▃▄▂▄▄▂▃▅▆▂▂▁▂▃▄▃▄▄▆▄▅▄
episode_lives,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
episode_score,█▁▅▅▄▆▅▄▇▆▁▅▂▅▇▄▄▅▆▆▁▇▄▂▆▄▅▂▁▂▂▆▃▄▃▅▇▄▄▃
episode_time,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇████
run_frame_number,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███

0,1
PPO_Asteroids/episode_length,566.0
PPO_Asteroids/episode_score,1080.0
episode_length,566.0
episode_lives,0.0
episode_score,1080.0
episode_time,1220.29919
run_frame_number,1706678.0


Saving to /home/sequenzia/dev/repos/atari-rl/data/evals/PPO_2024-02-14-14-40-20/asteroids.parquet

Loading ----> /home/sequenzia/dev/repos/atari-rl/agents/ppo/ALE-Assault-v5_1/best_model.zip



A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]
A.L.E: Arcade Learning Environment (version 0.8.1+53f58b7)
[Powered by Stella]


Stacking 4 frames


PPO_Assault: 2 EPISODE: 1
Episode Score: 1182.00
Episode Length: 1697


PPO_Assault: 4 EPISODE: 1
Episode Score: 3092.00
Episode Length: 3682


PPO_Assault: 1 EPISODE: 1
Episode Score: 3258.00
Episode Length: 3780


PPO_Assault: 5 EPISODE: 1
Episode Score: 3731.00
Episode Length: 4582


PPO_Assault: 3 EPISODE: 1
Episode Score: 4866.00
Episode Length: 5278


PPO_Assault: 2 EPISODE: 2
Episode Score: 4501.00
Episode Length: 5249


PPO_Assault: 1 EPISODE: 2
Episode Score: 3080.00
Episode Length: 3750


PPO_Assault: 5 EPISODE: 2
Episode Score: 3152.00
Episode Length: 3875


PPO_Assault: 4 EPISODE: 2
Episode Score: 6861.00
Episode Length: 7346


PPO_Assault: 3 EPISODE: 2
Episode Score: 4953.00
Episode Length: 5761


PPO_Assault: 2 EPISODE: 3
Episode Score: 4401.00
Episode Length: 5025


PPO_Assault: 5 EPISODE: 3
Episode Score: 3559.00
Episode Length: 4197


PPO_Assault: 4 EPISODE: 3
Episode Score: 1541.00
Episode Length: 1953


PPO_Assault: 3 EPISODE: 3
Episode Score: 198

VBox(children=(Label(value='0.002 MB of 0.009 MB uploaded\r'), FloatProgress(value=0.26988137082601055, max=1.…

0,1
PPO_Assault/episode_length,▅▃▃▅▄▆▄▆▄▄▇▃▄▄▄▄█▄▆▄▃▅▄▄▄▆▅▅▄▆▅▃▁▆▆▅▂▄▅▄
PPO_Assault/episode_score,▄▃▃▅▃▆▃▅▃▄█▃▃▄▃▃█▄▅▃▃▅▄▄▄▅▄▅▄▅▅▃▁▅▅▅▁▃▄▄
episode_length,▅▃▃▅▄▆▄▆▄▄▇▃▄▄▄▄█▄▆▄▃▅▄▄▄▆▅▅▄▆▅▃▁▆▆▅▂▄▅▄
episode_lives,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
episode_score,▄▃▃▅▃▆▃▅▃▄█▃▃▄▃▃█▄▅▃▃▅▄▄▄▅▄▅▄▅▅▃▁▅▅▅▁▃▄▄
episode_time,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
run_frame_number,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███

0,1
PPO_Assault/episode_length,3781.0
PPO_Assault/episode_score,3007.0
episode_length,3781.0
episode_lives,0.0
episode_score,3007.0
episode_time,909.70243
run_frame_number,1620579.0


Saving to /home/sequenzia/dev/repos/atari-rl/data/evals/PPO_2024-02-14-14-40-20/assault.parquet
