
Example of using RLlib's debug callbacks.<br>
Here we use callbacks to track the average CartPole pole angle magnitude as a<br>
custom metric.<br>


In [1]:
from typing import Dict, Tuple
import argparse
import numpy as np
import os

In [2]:
import ray
from ray import air, tune
from ray.rllib.algorithms.callbacks import DefaultCallbacks
from ray.rllib.env import BaseEnv
from ray.rllib.evaluation import Episode, RolloutWorker
from ray.rllib.policy import Policy
from ray.rllib.policy.sample_batch import SampleBatch

In [3]:
parser = argparse.ArgumentParser()
parser.add_argument(
    "--framework",
    choices=["tf", "tf2", "torch"],
    default="torch",
    help="The DL framework specifier.",
)
parser.add_argument("--stop-iters", type=int, default=2000)

_StoreAction(option_strings=['--stop-iters'], dest='stop_iters', nargs=None, const=None, default=2000, type=<class 'int'>, choices=None, required=False, help=None, metavar=None)

In [4]:
class MyCallbacks(DefaultCallbacks):
    def on_episode_start(
        self,
        *,
        worker: RolloutWorker,
        base_env: BaseEnv,
        policies: Dict[str, Policy],
        episode: Episode,
        env_index: int,
        **kwargs
    ):
        # Make sure this episode has just been started (only initial obs
        # logged so far).
        assert episode.length == 0, (
            "ERROR: `on_episode_start()` callback should be called right "
            "after env reset!"
        )
        print("episode {} (env-idx={}) started.".format(episode.episode_id, env_index))
        episode.user_data["distance"] = []
        episode.hist_data["distance"] = []
    def on_episode_step(
        self,
        *,
        worker: RolloutWorker,
        base_env: BaseEnv,
        policies: Dict[str, Policy],
        episode: Episode,
        env_index: int,
        **kwargs
    ):
        # Make sure this episode is ongoing.
        assert episode.length > 0, (
            "ERROR: `on_episode_step()` callback should not be called right "
            "after env reset!"
        )
        pole_angle = abs(episode.last_observation_for()[2])
        raw_angle = abs(episode.last_raw_obs_for()[2])

        episode.user_data["distance"].append(pole_angle)
    def on_episode_end(
        self,
        *,
        worker: RolloutWorker,
        base_env: BaseEnv,
        policies: Dict[str, Policy],
        episode: Episode,
        env_index: int,
        **kwargs
    ):
        # Check if there are multiple episodes in a batch, i.e.
        # "batch_mode": "truncate_episodes".
        if worker.policy_config["batch_mode"] == "truncate_episodes":
            # Make sure this episode is really done.
            assert episode.batch_builder.policy_collectors["default_policy"].batches[
                -1
            ]["dones"][-1], (
                "ERROR: `on_episode_end()` should only be called "
                "after episode is done!"
            )
        pole_angle = np.mean(episode.user_data["distance"])
        print(
            "episode {} (env-idx={}) ended with length {} and pole "
            "angles {}".format(
                episode.episode_id, env_index, episode.length, pole_angle
            )
        )
        episode.custom_metrics["distance"] = pole_angle
        episode.hist_data["distance"] = episode.user_data["distance"]
    def on_sample_end(self, *, worker: RolloutWorker, samples: SampleBatch, **kwargs):
        print("returned sample batch of size {}".format(samples.count))
    def on_train_result(self, *, algorithm, result: dict, **kwargs):
        print(
            "Algorithm.train() result: {} -> {} episodes".format(
                algorithm, result["episodes_this_iter"]
            )
        )
        # you can mutate the result dict to add new fields to return
        result["callback_ok"] = True
    def on_learn_on_batch(
        self, *, policy: Policy, train_batch: SampleBatch, result: dict, **kwargs
    ) -> None:
        result["sum_actions_in_train_batch"] = train_batch["actions"].sum()
        print(
            "policy.learn_on_batch() result: {} -> sum actions: {}".format(
                policy, result["sum_actions_in_train_batch"]
            )
        )
    def on_postprocess_trajectory(
        self,
        *,
        worker: RolloutWorker,
        episode: Episode,
        agent_id: str,
        policy_id: str,
        policies: Dict[str, Policy],
        postprocessed_batch: SampleBatch,
        original_batches: Dict[str, Tuple[Policy, SampleBatch]],
        **kwargs
    ):
        print("postprocessed {} steps".format(postprocessed_batch.count))
        if "num_batches" not in episode.custom_metrics:
            episode.custom_metrics["num_batches"] = 0
        episode.custom_metrics["num_batches"] += 1

In [5]:
from cassie import CassieEnv
import constants as c 
import functions as f 
import numpy as np
import loader as l 
import caps as cp 
import torch
from ray.tune.registry import register_env
from ray.rllib.agents.ppo import PPOTrainer
import mediapy as media 
from loader import Loader

In [6]:
loader = Loader(logdir = "./custom_metrics/logs/", simdir = "./custom_metrics/sims/")

In [7]:
config = loader.load_config("../proto.yaml")

{'training': {'gamma': 0.99, 'lr': 0.01, 'train_batch_size': 1000, 'model': {'fcnet_hiddens': [64, 64], 'fcnet_activation': 'swish', 'vf_share_layers': False, 'free_log_std': True}, 'optimizer': {'type': 'adam', 'eps': '1e-06'}, 'use_critic': True, 'use_gae': True, 'lambda_': 0.95, 'kl_coeff': 0.2, 'sgd_minibatch_size': 200, 'num_sgd_iter': 10, 'vf_loss_coeff': 0.5, 'entropy_coeff': 0.01, 'clip_param': 0.2, 'kl_target': 0.01}, 'environment': {'env': 'cassie-v0', 'disable_env_checking': True}, 'framework': {'framework': 'torch'}, 'rollouts': {'recreate_failed_workers': True, 'num_workers': 1, 'num_envs_per_worker': 1, 'rollout_fragment_length': 'auto', 'batch_mode': 'truncate_episodes', 'observation_filter': 'NoFilter', 'reuse_actors': True}, 'evaluation': {'evaluation_interval': 2, 'evaluation_duration': 10}}


In [8]:
splitted = loader.split_config(config)

In [9]:
combined = {**splitted.get("environment",{}), **splitted.get("rollouts",{}), **splitted.get("checkpointing",{}), **splitted.get("debugging",{}), **splitted.get("training",{}), **splitted.get("framework",{}), **splitted.get("resources",{}), **splitted.get("evaluation",{})}
combined["callbacks"] = MyCallbacks

In [10]:
register_env("cassie-v0", lambda config: CassieEnv(config))

In [18]:
trainer = PPOTrainer(config=combined, env="CartPole-v1")
# trainer.callbacks = [MyCallbacks]



In [19]:
result = trainer.train()

[2m[36m(RolloutWorker pid=8196)[0m 2023-04-23 09:52:00,837	ERROR actor_manager.py:177 -- Worker exception, recreating: ERROR: `on_episode_start()` callback should be called right after env reset!
[2m[36m(RolloutWorker pid=8196)[0m Traceback (most recent call last):
[2m[36m(RolloutWorker pid=8196)[0m   File "c:\Users\Ajvendetta\AppData\Local\Programs\Python\Python310\lib\site-packages\ray\rllib\utils\actor_manager.py", line 174, in apply
[2m[36m(RolloutWorker pid=8196)[0m     return func(self, *args, **kwargs)
[2m[36m(RolloutWorker pid=8196)[0m   File "c:\Users\Ajvendetta\AppData\Local\Programs\Python\Python310\lib\site-packages\ray\rllib\execution\rollout_ops.py", line 86, in <lambda>
[2m[36m(RolloutWorker pid=8196)[0m     lambda w: w.sample(), local_worker=False, healthy_only=True
[2m[36m(RolloutWorker pid=8196)[0m   File "c:\Users\Ajvendetta\AppData\Local\Programs\Python\Python310\lib\site-packages\ray\util\tracing\tracing_helper.py", line 466, in _resume_span
[

KeyError: 'actions'

In [11]:
if __name__ == "__main__":

    ray.init(ignore_reinit_error=True)
    tuner = tune.Tuner(
        "PG",
        run_config=air.RunConfig(
            stop={
                "training_iteration": 10,
            },
        ),
        param_space={
            "env": "CartPole-v1",
            "num_envs_per_worker": 2,
            "callbacks": MyCallbacks,
            "framework": "torch",
            # Use GPUs iff `RLLIB_NUM_GPUS` env var set to > 0.
            "num_gpus": int(os.environ.get("RLLIB_NUM_GPUS", "0")),
            # TODO(avnishn): This example uses functions specific to episode v1
            # that is not compatible with episode v2. Needs to be updated
            "enable_connectors": False,
        },
    )
    # there is only one trial involved.
    result = tuner.fit().get_best_result()

    # Verify episode-related custom metrics are there.
    custom_metrics = result.metrics["custom_metrics"]
    print(custom_metrics)
    assert "pole_angle_mean" in custom_metrics
    assert "pole_angle_min" in custom_metrics
    assert "pole_angle_max" in custom_metrics
    assert "num_batches_mean" in custom_metrics
    assert "callback_ok" in result.metrics

2023-04-23 08:27:06,717	INFO worker.py:1382 -- Calling ray.init() again after it has already been called.


0,1
Current time:,2023-04-23 08:27:15
Running for:,00:00:08.52
Memory:,15.3/15.7 GiB

Trial name,status,loc,iter,total time (s),ts,reward,episode_reward_max,episode_reward_min,episode_len_mean
PG_CartPole-v1_de7e6_00000,TERMINATED,127.0.0.1:22772,10,1.24064,2000,26.5946,78,10,26.5946




[2m[36m(PG pid=22772)[0m episode 243690006713247071 (env-idx=0) started.
[2m[36m(PG pid=22772)[0m episode 474701696523161799 (env-idx=1) started.
[2m[36m(PG pid=22772)[0m postprocessed 14 steps
[2m[36m(PG pid=22772)[0m episode 474701696523161799 (env-idx=1) ended with length 14 and pole angles 0.11169251054525375
[2m[36m(PG pid=22772)[0m episode 900463818452346912 (env-idx=1) started.
[2m[36m(PG pid=22772)[0m postprocessed 23 steps
[2m[36m(PG pid=22772)[0m episode 243690006713247071 (env-idx=0) ended with length 23 and pole angles 0.10716638714075089
[2m[36m(PG pid=22772)[0m episode 931551982301474348 (env-idx=0) started.
[2m[36m(PG pid=22772)[0m postprocessed 29 steps
[2m[36m(PG pid=22772)[0m episode 900463818452346912 (env-idx=1) ended with length 29 and pole angles 0.06946299970149994
[2m[36m(PG pid=22772)[0m episode 46412943169667800 (env-idx=1) started.
[2m[36m(PG pid=22772)[0m postprocessed 24 steps
[2m[36m(PG pid=22772)[0m episode 931551982

Trial name,agent_timesteps_total,callback_ok,connector_metrics,counters,custom_metrics,date,done,episode_len_mean,episode_media,episode_reward_max,episode_reward_mean,episode_reward_min,episodes_this_iter,episodes_total,experiment_id,hostname,info,iterations_since_restore,node_ip,num_agent_steps_sampled,num_agent_steps_trained,num_env_steps_sampled,num_env_steps_sampled_this_iter,num_env_steps_trained,num_env_steps_trained_this_iter,num_faulty_episodes,num_healthy_workers,num_in_flight_async_reqs,num_remote_worker_restarts,num_steps_trained_this_iter,perf,pid,policy_reward_max,policy_reward_mean,policy_reward_min,sampler_perf,sampler_results,time_since_restore,time_this_iter_s,time_total_s,timers,timestamp,timesteps_since_restore,timesteps_total,training_iteration,trial_id,warmup_time
PG_CartPole-v1_de7e6_00000,2000,True,{},"{'num_env_steps_sampled': 2000, 'num_env_steps_trained': 2000, 'num_agent_steps_sampled': 2000, 'num_agent_steps_trained': 2000}","{'num_batches_mean': 1.2297297297297298, 'num_batches_min': 1, 'num_batches_max': 2, 'pole_angle_mean': 0.08164537, 'pole_angle_min': 0.03770415, 'pole_angle_max': 0.124951355}",2023-04-23_08-27-14,True,26.5946,{},78,26.5946,10,6,74,21b3001429664728806650d7e6654cf7,DESKTOP-U8A332F,"{'learner': {'default_policy': {'learner_stats': {'allreduce_latency': 0.0, 'policy_loss': 10.180950164794922, 'cur_lr': 0.0004}, 'model': {}, 'custom_metrics': {'sum_actions_in_train_batch': 98.0}, 'num_agent_steps_trained': 200.0, 'num_grad_updates_lifetime': 10.0, 'diff_num_grad_updates_vs_sampler_policy': 0.0}}, 'num_env_steps_sampled': 2000, 'num_env_steps_trained': 2000, 'num_agent_steps_sampled': 2000, 'num_agent_steps_trained': 2000}",10,127.0.0.1,2000,2000,2000,200,2000,200,0,0,0,0,200,{},22772,{},{},{},"{'mean_raw_obs_processing_ms': 0.28717190123902475, 'mean_inference_ms': 0.7847068388578435, 'mean_action_processing_ms': 0.11854633483138652, 'mean_env_wait_ms': 0.061531060757738516, 'mean_env_render_ms': 0.0}","{'episode_reward_max': 78.0, 'episode_reward_min': 10.0, 'episode_reward_mean': 26.594594594594593, 'episode_len_mean': 26.594594594594593, 'episode_media': {}, 'episodes_this_iter': 6, 'policy_reward_min': {}, 'policy_reward_max': {}, 'policy_reward_mean': {}, 'custom_metrics': {'num_batches_mean': 1.2297297297297298, 'num_batches_min': 1, 'num_batches_max': 2, 'pole_angle_mean': 0.08164537, 'pole_angle_min': 0.03770415, 'pole_angle_max': 0.124951355}, 'hist_stats': {'pole_angles': [0.028003916, 0.033767235, 0.045558188, 0.06341165, 0.07570471, 0.082556635, 0.095719814, 0.103571236, 0.11784789, 0.13859263, 0.16588207, 0.18824515, 0.20588036, 0.2189537, 0.023664033, 0.029359506, 0.02935245, 0.03538139, 0.047446202, 0.053884376, 0.054775532, 0.061850395, 0.07511406, 0.08292602, 0.09704575, 0.105856076, 0.12109897, 0.13119014, 0.1362373, 0.14790475, 0.15463515, 0.15651295, 0.1651347, 0.16896564, 0.1795943, 0.19703893, 0.20985813, 0.037160896, 0.031291228, 0.03150491, 0.037766375, 0.05007683, 0.056776233, 0.057946026, 0.05363096, 0.043838773, 0.04022842, 0.031047313, 0.027967943, 0.030934848, 0.02822715, 0.031565048, 0.029230021, 0.032944433, 0.04269402, 0.046801195, 0.057025153, 0.07339024, 0.084271014, 0.089778066, 0.10164566, 0.11990442, 0.14461961, 0.17588906, 0.20227261, 0.22399864, 0.04420556, 0.05000091, 0.05022786, 0.04492487, 0.034093335, 0.029391654, 0.019055234, 0.0030532554, 0.018681288, 0.034543045, 0.04466984, 0.060863946, 0.07149197, 0.08834446, 0.09980953, 0.11765769, 0.13031156, 0.13789673, 0.14050345, 0.1497664, 0.16569859, 0.17678931, 0.19467935, 0.21942201, 0.019804941, 0.025516666, 0.025500963, 0.019794777, 0.008397944, 0.0029781663, 0.0082420595, 0.013589891, 0.013136283, 0.0069153877, 0.005075735, 0.022876792, 0.04656333, 0.06454137, 0.08865836, 0.11901919, 0.15575978, 0.19904351, 0.24905609, 0.015950289, 0.02267978, 0.023657057, 0.0189255, 0.008491381, 0.004028985, 0.0054735737, 0.0010899822, 0.009112636, 0.01345473, 0.023707693, 0.039898504, 0.050386664, 0.0669745, 0.08972423, 0.118732214, 0.14247312, 0.17276236, 0.19815105, 0.2188601, 0.027991919, 0.021738986, 0.009811543, 0.007831036, 0.031265263, 0.06060204, 0.08428372, 0.10250365, 0.12708235, 0.14648326, 0.17247918, 0.19360563, 0.22156164, 0.017627543, 0.011716289, 6.3601576e-05, 0.005662075, 0.017241009, 0.034709167, 0.05813839, 0.087634794, 0.123336405, 0.16540979, 0.20244008, 0.24625339, 0.015087558, 0.02140937, 0.021973446, 0.028524723, 0.041066613, 0.04793721, 0.049218696, 0.044956554, 0.046850286, 0.04318067, 0.033960197, 0.019164408, 0.010432103, 0.0076730386, 0.00087349734, 0.015225117, 0.035435893, 0.06159516, 0.08212675, 0.09720384, 0.106965914, 0.11151729, 0.12255699, 0.14010935, 0.15262616, 0.17180939, 0.1977222, 0.2189481, 0.029048484, 0.0352837, 0.035851274, 0.04249091, 0.05520594, 0.074036084, 0.09905634, 0.13037509, 0.16813117, 0.20089637, 0.22894312, 0.022204533, 0.01717559, 0.018138712, 0.025062876, 0.03795398, 0.056854464, 0.0818422, 0.113028646, 0.15055613, 0.18297224, 0.21054393, 0.033215854, 0.03942207, 0.051687695, 0.07005, 0.094581686, 0.1137146, 0.12761687, 0.14804326, 0.17506714, 0.20879297, 0.24935262, 0.01622137, 0.02284668, 0.035427064, 0.04229943, 0.043545708, 0.050906446, 0.06438897, 0.08403682, 0.10992852, 0.14217551, 0.18091908, 0.21475402, 0.038438346, 0.03221198, 0.020379271, 0.0028992703, 0.020304866, 0.037637193, 0.049244914, 0.06693859, 0.079096176, 0.08583636, 0.09890733, 0.10668896, 0.10927193, 0.11834179, 0.13391225, 0.1560317, 0.18478149, 0.20872857, 0.23956443, 0.028447758, 0.035087384, 0.036055453, 0.043094397, 0.044511355, 0.04035269, 0.030627705, 0.027005171, 0.017725322, 0.014466893, 0.017172897, 0.014117224, 0.017022565, 0.014163986, 0.005560119, 0.0028985352, 0.0061255884, 0.015224561, 0.030215682, 0.0511555, 0.07813557, 0.09959064, 0.11570223, 0.12661844, 0.14407028, 0.15651524, 0.1640789, 0.16685197, 0.16488987, 0.16973437, 0.18137524, 0.18832064, 0.19065702, 0.18843617, 0.18167542, 0.1818284, 0.17737517, 0.17980345, 0.17759383, 0.18225585, 0.19377829, 0.2006971, 0.21455565, 0.015088615, 0.009775596, 0.010410649, 0.016960723, 0.029429754, 0.0478583, 0.060621038, 0.079531014, 0.092980266, 0.112762034, 0.12730196, 0.14836067, 0.17601493, 0.19881219, 0.2284557, 0.041974235, 0.036993314, 0.02642932, 0.010249319, 8.6873115e-05, 0.015864281, 0.03766855, 0.06542518, 0.0992662, 0.12767488, 0.16252331, 0.19236392, 0.21744777, 0.017874148, 0.024709927, 0.02580584, 0.032909267, 0.046026833, 0.065201625, 0.09051203, 0.110391, 0.12501118, 0.14613709, 0.16224347, 0.1850469, 0.20309584, 0.22803816, 0.016205817, 0.011251405, 0.012251996, 0.019176818, 0.020325754, 0.015743261, 0.0054367124, 0.0010822064, 0.00909156, 0.02511216, 0.04704334, 0.07498362, 0.097371675, 0.11439471, 0.12620683, 0.13292754, 0.13464081, 0.13139476, 0.12320149, 0.121629216, 0.12663442, 0.13820834, 0.15637709, 0.1812005, 0.21277, 0.012615274, 0.018095797, 0.01780277, 0.011771362, 3.558869e-07, 0.01755111, 0.029248208, 0.03520325, 0.035491947, 0.030153222, 0.03088775, 0.03766312, 0.050483707, 0.057692524, 0.05937441, 0.055577546, 0.046313133, 0.03155552, 0.022935731, 0.020365164, 0.023791192, 0.033197965, 0.036902934, 0.046667263, 0.050815035, 0.06110343, 0.077556886, 0.08855323, 0.10587109, 0.12957214, 0.1597513, 0.19653378, 0.24007112, 0.017236246, 0.022944177, 0.022908162, 0.01716502, 0.017418258, 0.023632474, 0.03580919, 0.042282965, 0.043133173, 0.03840242, 0.03979107, 0.04727067, 0.049152758, 0.045486797, 0.04797633, 0.056599453, 0.07137083, 0.08065527, 0.0845525, 0.094789654, 0.111388505, 0.13440588, 0.15230764, 0.16525753, 0.1849375, 0.19988644, 0.21025026, 0.04277667, 0.03657414, 0.024793781, 0.007394598, 0.003997107, 0.009488746, 0.009151993, 0.014728473, 0.0145093035, 0.008530139, 0.0032104624, 0.020750739, 0.03245758, 0.03844292, 0.03878282, 0.04521392, 0.057738155, 0.07639385, 0.101254605, 0.12075921, 0.13507907, 0.15596135, 0.18348071, 0.2061976, 0.22431484, 0.0018039389, 0.004649341, 0.0052375956, 0.011708775, 0.024066554, 0.042351283, 0.054935556, 0.061938826, 0.06344476, 0.05950039, 0.06179607, 0.058625083, 0.0616845, 0.059271373, 0.05140621, 0.0380726, 0.0309073, 0.029830817, 0.023098866, 0.010704342, 0.007396569, 0.031283464, 0.0610702, 0.096902646, 0.12727323, 0.16406964, 0.20745309, 0.24607925, 0.019378377, 0.024583664, 0.03576358, 0.041246746, 0.052804813, 0.058774695, 0.059233118, 0.06590419, 0.078790426, 0.0979304, 0.11173187, 0.12032699, 0.13543633, 0.15710557, 0.17382877, 0.18576312, 0.20453756, 0.21873127, 0.0139340535, 0.0077407993, 0.004217578, 0.010273733, 0.02221009, 0.040064473, 0.06391048, 0.093855806, 0.118359886, 0.13762672, 0.16344154, 0.1959046, 0.2236156, 0.00021112934, 0.0064237677, 0.0072036744, 0.013877637, 0.026450515, 0.044963814, 0.06949464, 0.10015397, 0.12540908, 0.14546996, 0.16051453, 0.18225299, 0.2107603, 0.016884068, 0.022078017, 0.03323117, 0.050375447, 0.0735786, 0.10294262, 0.12693019, 0.15737958, 0.18281858, 0.21500844, 0.00926911, 0.0034220526, 0.003486831, 0.0022804157, 0.0021720508, 0.007931717, 0.00785144, 0.013674662, 0.02540086, 0.031360175, 0.04333118, 0.06135006, 0.07379386, 0.09246478, 0.11743429, 0.13715687, 0.16342226, 0.19633317, 0.22449155, 0.029858042, 0.024264267, 0.024709461, 0.019456064, 0.008506908, 0.0035327307, 0.004465633, 0.00043278892, 0.0005505519, 0.0043224962, 0.0033384135, 0.0034719894, 0.016114958, 0.022926178, 0.023986239, 0.019339053, 0.020694897, 0.016320357, 0.006224144, 0.009621978, 0.031282466, 0.047149993, 0.05736392, 0.062028658, 0.061212372, 0.0666279, 0.07827031, 0.09617082, 0.120395824, 0.13939956, 0.15335208, 0.1623895, 0.16661319, 0.17762056, 0.19543189, 0.20860316, 0.21726762, 0.041857496, 0.04795421, 0.048467048, 0.043436375, 0.044557057, 0.040104378, 0.041779663, 0.049556177, 0.05174823, 0.06009822, 0.0629296, 0.0719814, 0.08726993, 0.10884718, 0.12514302, 0.13630767, 0.1540592, 0.17845547, 0.19803743, 0.21298459, 0.030755885, 0.03595038, 0.035488367, 0.029403817, 0.017693605, 0.012019366, 0.012309335, 0.006821973, 0.0072654053, 0.013605389, 0.014137714, 0.008902852, 0.009610157, 0.016227033, 0.017051172, 0.023830473, 0.03656999, 0.043607827, 0.04502705, 0.040874038, 0.04285182, 0.03923936, 0.03004964, 0.026955694, 0.018200677, 0.015466797, 0.006995202, 0.007231737, 0.015561144, 0.018082665, 0.014849521, 0.0058778995, 0.008853029, 0.017693419, 0.032443017, 0.041451365, 0.056514323, 0.06599016, 0.08166491, 0.09191541, 0.09684847, 0.09653485, 0.091008745, 0.08026779, 0.06427329, 0.054615103, 0.051201463, 0.05397582, 0.051228173, 0.04297697, 0.029203715, 0.009853473, 0.0034625256, 0.010863143, 0.012431976, 0.008216093, 0.00993178, 0.0058458773, 0.0076759607, 0.015396475, 0.029018853, 0.048591036, 0.06249465, 0.082549766, 0.09715647, 0.10645113, 0.12217892, 0.13275899, 0.14991002, 0.1620977, 0.16944611, 0.17204443, 0.18146244, 0.18620242, 0.18633437, 0.19336967, 0.20730834, 0.21672459, 0.0015375369, 0.0071083964, 0.006835304, 0.000753578, 0.011138537, 0.02887956, 0.04083737, 0.04712622, 0.047824472, 0.042973734, 0.032578547, 0.028301539, 0.018379916, 0.0027856708, 0.0068404027, 0.02230255, 0.04366124, 0.059307918, 0.081076466, 0.09737503, 0.1083512, 0.1257615, 0.13803683, 0.15690215, 0.17084105, 0.17999059, 0.19596592, 0.2188106, 0.0061715823, 0.0011940409, 0.009598099, 0.01452906, 0.013667219, 0.018750006, 0.029772038, 0.04676469, 0.06979523, 0.08727257, 0.1110256, 0.1294966, 0.15447581, 0.17446546, 0.20119388, 0.22325419, 0.041383337, 0.0350242, 0.034773882, 0.028894966, 0.017385729, 0.011909368, 0.00069002475, 0.016307462, 0.03915427, 0.06795611, 0.102851085, 0.1323302, 0.15663193, 0.18755469, 0.225221, 0.0133601995, 0.019823028, 0.020517059, 0.027188504, 0.039841585, 0.05851706, 0.0715945, 0.07919799, 0.08141592, 0.08996547, 0.10485897, 0.12614417, 0.14226903, 0.15338404, 0.17117722, 0.18415429, 0.19244604, 0.20763014, 0.21828452, 0.017929332, 0.013038666, 0.014113679, 0.009417876, 0.010664096, 0.0061163832, 0.0042173318, 0.008658966, 0.007273608, 8.9480534e-05, 0.012902258, 0.03174709, 0.044819903, 0.06394288, 0.077500425, 0.08562026, 0.100061595, 0.10921187, 0.12481157, 0.1352828, 0.15233923, 0.17603524, 0.19490492, 0.20912246, 0.23028308, 0.03211191, 0.038557652, 0.051056083, 0.06964597, 0.08271162, 0.10205278, 0.11608203, 0.13657098, 0.15197797, 0.17403188, 0.1912577, 0.20381747, 0.2118397, 0.026982907, 0.021568963, 0.010473985, 0.0063371947, 0.02893579, 0.05742766, 0.08024952, 0.09758869, 0.10959964, 0.12804574, 0.14136529, 0.16128686, 0.18787903, 0.20970765, 0.01728918, 0.011181164, 0.011034846, 0.0051058433, 0.005099693, 0.00072780985, 0.012376716, 0.018176552, 0.029907597, 0.0359006, 0.047932867, 0.06604056, 0.09029536, 0.109124586, 0.12269381, 0.13113442, 0.13454255, 0.13297851, 0.13805291, 0.13816811, 0.14494044, 0.14679036, 0.14376682, 0.14744636, 0.15781306, 0.17488523, 0.18717353, 0.19480383, 0.19786775, 0.19642244, 0.19049081, 0.19151193, 0.18799196, 0.19140121, 0.20172246, 0.2189711, 0.0088475635, 0.0032716158, 0.0036048729, 0.0018948481, 0.0015182146, 0.0070071844, 0.0066520805, 0.012194687, 0.023632765, 0.041000832, 0.064369276, 0.08214668, 0.10616815, 0.124872655, 0.15005852, 0.17022221, 0.18554488, 0.19617446, 0.20222488, 0.2037759, 0.21230806, 0.047829762, 0.042838644, 0.043995075, 0.0395742, 0.029583588, 0.025690721, 0.01613374, 0.0008872317, 0.020110535, 0.046956386, 0.07978037, 0.11874307, 0.1523673, 0.18092208, 0.20464799, 0.22375487, 0.042789806, 0.048368514, 0.0483695, 0.042829722, 0.043440696, 0.050169326, 0.063019134, 0.08202995, 0.10727674, 0.1272054, 0.15362118, 0.17503059, 0.19162405, 0.20355903, 0.21095937, 0.019380094, 0.025071876, 0.036738295, 0.042711098, 0.054764688, 0.07293477, 0.09729245, 0.11627081, 0.13003722, 0.13872492, 0.14243208, 0.15279979, 0.15827496, 0.15893297, 0.16635376, 0.1805401, 0.19000554, 0.2063452, 0.2181366, 0.03907157, 0.045816608, 0.046959434, 0.054237846, 0.05596598, 0.06387991, 0.06630332, 0.06328943, 0.054854527, 0.05265851, 0.0449648, 0.043447293, 0.048060257, 0.047099862, 0.052288484, 0.051927846, 0.046052452, 0.03465978, 0.029403672, 0.03021577, 0.025362615, 0.026550628, 0.03375016, 0.0469684, 0.054549284, 0.056579936, 0.053110864, 0.055841427, 0.053062674, 0.056479204, 0.06607452, 0.070182614, 0.08054616, 0.08551437, 0.09682181, 0.10283798, 0.10364123, 0.09927351, 0.089740284, 0.07501071, 0.05501823, 0.041331068, 0.02214657, 0.009069589, 0.0019840794, 0.00080914906, 0.0055003837, 0.004343067, 0.009074016, 0.019685958, 0.0245017, 0.023589263, 0.028683059, 0.028073851, 0.021794707, 0.0098415855, 0.007826314, 0.03128567, 0.06064755, 0.09605521, 0.137681, 0.17407675, 0.21711448, 0.008736902, 0.014687999, 0.014840802, 0.009233351, 0.009572429, 0.004116397, 0.004574099, 0.0007958252, 0.00028330734, 0.006077845, 0.0065835523, 0.012981147, 0.013566751, 0.008381173, 0.009134215, 0.0040867208, 0.006756532, 0.023427634, 0.03428773, 0.051147252, 0.07407208, 0.103162386, 0.13855018, 0.1687599, 0.1940413, 0.21461403, 0.019965485, 0.01418447, 0.002677061, 0.0028879996, 0.0142898075, 0.019856183, 0.019659718, 0.013736203, 0.0020843232, 0.015334045, 0.03859295, 0.056095134, 0.067991234, 0.074397355, 0.08707, 0.09437551, 0.10805739, 0.12815605, 0.14311695, 0.16468003, 0.1813518, 0.1932896, 0.20061696, 0.21488163, 0.048376936, 0.053580374, 0.053243008, 0.04739948, 0.04773572, 0.054217026, 0.06684526, 0.07397094, 0.08735642, 0.1070424, 0.13310425, 0.16564974, 0.193227, 0.2160716, 0.0012705617, 0.007981733, 0.02055457, 0.039031126, 0.0634891, 0.08234303, 0.095755406, 0.10385453, 0.118379064, 0.1277381, 0.14364767, 0.16615689, 0.19534755, 0.23133114, 0.0042613237, 0.010593403, 0.011098762, 0.017524248, 0.02987298, 0.036479462, 0.037423648, 0.03274876, 0.034158845, 0.029925464, 0.020057784, 0.01622934, 0.006675126, 0.008629568, 0.018038746, 0.021648914, 0.03122545, 0.035086352, 0.0449946, 0.049274404, 0.04799107, 0.041172966, 0.0405033, 0.034245368, 0.034090962, 0.028302865, 0.016879987, 0.00021556772, 0.011352272, 0.016636675, 0.027845915, 0.045012705, 0.056503523, 0.062430944, 0.062871546, 0.06954633, 0.07077685, 0.06660827, 0.057048816, 0.053747572, 0.044963248, 0.042361517, 0.045890234, 0.043838467, 0.047922716, 0.05813063, 0.062794454, 0.061982386, 0.067406625, 0.079062276, 0.08530372, 0.08621038, 0.08182511, 0.072154, 0.057166617, 0.03679659, 0.010942581, 0.008831988, 0.022684565, 0.042446144, 0.056498274, 0.064969905, 0.07964043, 0.10055902, 0.11614445, 0.12654132, 0.14347634, 0.15540408, 0.16244642, 0.17623618, 0.1852768, 0.20117031, 0.21248083, 0.009699267, 0.0035125688, 0.008466296, 0.014569416, 0.026579354, 0.044534016, 0.056804456, 0.06350829, 0.076412946, 0.08387706, 0.09765646, 0.11779319, 0.14436358, 0.177476, 0.21726748, 0.041687742, 0.03614519, 0.036713324, 0.0316602, 0.03268773, 0.0397653, 0.041198883, 0.04873165, 0.06237208, 0.07047349, 0.073127195, 0.08206206, 0.09729309, 0.11887082, 0.14687976, 0.18143591, 0.21111992, 0.014498949, 0.00944328, 0.010332025, 0.017133715, 0.029853867, 0.048534602, 0.06155225, 0.06902963, 0.07105386, 0.07935085, 0.09393205, 0.103179425, 0.1071936, 0.10603906, 0.11137427, 0.1231926, 0.14152266, 0.15482138, 0.1747938, 0.20150673, 0.22355397, 0.036077186, 0.042595685, 0.043492366, 0.03881014, 0.04024948, 0.04778224, 0.04972049, 0.04611408, 0.048666548, 0.05735637, 0.060507126, 0.058176864, 0.05038667, 0.037120726, 0.018326744, 0.0056150067, 0.012833843, 0.02539385, 0.032181583, 0.03327795, 0.040427525, 0.053636853, 0.061252497, 0.06336213, 0.07169899, 0.07459479, 0.07210599, 0.06425223, 0.051016353, 0.04402452, 0.031509303, 0.025118414, 0.024776543, 0.030444693, 0.042120706, 0.04813794, 0.048573032, 0.055157606, 0.05620261, 0.06343887, 0.07687237, 0.084864795, 0.08750741, 0.0965141, 0.10024345, 0.11040283, 0.1270125, 0.13850176, 0.14498849, 0.14655524, 0.14324889, 0.14664435, 0.15672429, 0.17350556, 0.1854952, 0.19281684, 0.20703766, 0.22819144, 0.009127646, 0.0026779028, 0.0021391078, 0.0074708452, 0.0069624335, 0.012354635, 0.01193726, 0.017450988, 0.017186835, 0.02288543, 0.022839764, 0.017086588, 0.0056255567, 0.00012485261, 0.011193918, 0.016658243, 0.028046416, 0.033686817, 0.033653073, 0.027981997, 0.016673282, 0.00031018798, 0.02304153, 0.039921157, 0.05109381, 0.06836622, 0.080114834, 0.09813167, 0.11081923, 0.12994486, 0.14395224, 0.16457164, 0.1803061, 0.19130617, 0.2091789, 0.23397565, 0.045125186, 0.051244088, 0.0634943, 0.070222266, 0.07151016, 0.0674035, 0.057910938, 0.054681227, 0.0459742, 0.03176804, 0.023697732, 0.021677963, 0.02565948, 0.03562983, 0.03991044, 0.038566362, 0.043322343, 0.05417021, 0.05944359, 0.070902266, 0.076893345, 0.07749431, 0.07274595, 0.06265224, 0.047180526, 0.0379432, 0.034849335, 0.02614596, 0.023511821, 0.015191264, 0.0011671298, 0.0069084833, 0.009123083, 0.017234772, 0.019550607, 0.027827844, 0.030375965, 0.0389507, 0.04186635, 0.0391791, 0.042603686, 0.05212389, 0.056064956, 0.066179216, 0.08248969, 0.10505503, 0.12230613, 0.14603284, 0.16471998, 0.19010265, 0.2222735, 0.040903293, 0.046202194, 0.057607066, 0.063456394, 0.06382628, 0.07043635, 0.071608596, 0.06738774, 0.06945457, 0.06610773, 0.069036074, 0.0665421, 0.058645543, 0.045329317, 0.038224228, 0.0255581, 0.0189814, 0.01841734, 0.023825496, 0.023497302, 0.029171184, 0.040845074, 0.058553513, 0.08236672, 0.10070452, 0.11372829, 0.12156506, 0.12430638, 0.13361624, 0.13790487, 0.14882682, 0.16640393, 0.19069156, 0.2217765, 0.00283442, 0.008204803, 0.019446697, 0.03659372, 0.04801064, 0.053808887, 0.054063875, 0.048814226, 0.03806153, 0.033461943, 0.034951188, 0.04250143, 0.05612157, 0.07585681, 0.10178743, 0.12235798, 0.13774714, 0.15970711, 0.1883178, 0.21215227, 0.028588096, 0.035199687, 0.036140632, 0.031454127, 0.032844823, 0.028583614, 0.030379605, 0.026505006, 0.028672596, 0.036858704, 0.03937467, 0.047972225, 0.0626664, 0.07181643, 0.08720163, 0.09720185, 0.11357887, 0.12474397, 0.13081205, 0.13186245, 0.13953133, 0.14223278, 0.14002195, 0.13291822, 0.13248155, 0.12708549, 0.12831661, 0.124546915, 0.1273822, 0.1368022, 0.15282144, 0.16390647, 0.18172474, 0.20633094, 0.22632343, 0.028278042, 0.034419533, 0.034888376, 0.029724665, 0.030630555, 0.037574667, 0.0388614, 0.034536235, 0.02460756, 0.009046846, 0.012210673, 0.02755802, 0.03712905, 0.041022647, 0.039301388, 0.04368689, 0.054168724, 0.0590785, 0.05848594, 0.06410782, 0.06425613, 0.07064847, 0.083285496, 0.090530045, 0.10412938, 0.12412384, 0.1389533, 0.14875904, 0.1536475, 0.16524915, 0.17203861, 0.174101, 0.17148636, 0.17571487, 0.17526215, 0.17015941, 0.16040301, 0.15746883, 0.14977276, 0.14883466, 0.14305788, 0.1439946, 0.14004438, 0.1427825, 0.14061202, 0.14512362, 0.15630567, 0.16261432, 0.16413102, 0.16090198, 0.15293816, 0.14021543, 0.13422614, 0.13490507, 0.14222077, 0.1445907, 0.14206766, 0.13466859, 0.13394733, 0.12827915, 0.12924595, 0.13681765, 0.1509989, 0.1602466, 0.16466354, 0.17585316, 0.1823105, 0.18411833, 0.19281025, 0.20839429, 0.23091069, 0.0012662128, 0.0075884494, 0.00806502, 0.014442939, 0.015018286, 0.021537725, 0.022298979, 0.029048229, 0.041790087, 0.060565695, 0.085451625, 0.11655802, 0.14236748, 0.17471264, 0.213727, 0.029170077, 0.023853749, 0.024572197, 0.0195894, 0.020613223, 0.027613018, 0.040595032, 0.059602022, 0.08471213, 0.10435354, 0.13035582, 0.15119256, 0.1670476, 0.1780715, 0.19590156, 0.20909485, 0.21778479, 0.029508086, 0.02420619, 0.024941137, 0.019977115, 0.009318838, 0.004638763, 0.005870843, 0.0012786078, 0.0025769526, 0.0019702876, 0.00064763415, 0.006516232, 0.01952967, 0.026730632, 0.028202366, 0.02399148, 0.02580948, 0.033630572, 0.047465812, 0.06736261, 0.08171128, 0.09064511, 0.10592455, 0.11594717, 0.120819554, 0.1322297, 0.13859363, 0.15158328, 0.17123124, 0.18604937, 0.20769359, 0.2362342, 0.03042327, 0.025667757, 0.02695468, 0.034254994, 0.035874043, 0.043558903, 0.04562057, 0.053804263, 0.06812214, 0.08862245, 0.10371196, 0.11353084, 0.12981938, 0.15263048, 0.17045528, 0.18345854, 0.19177118, 0.19548988, 0.1946768, 0.18935972, 0.17953224, 0.17662232, 0.18058266, 0.19139864, 0.20908868, 0.23370332, 0.042436436, 0.03658406, 0.036846865, 0.03149128, 0.020518953, 0.0155953495, 0.00494893, 0.0002536287, 0.0014431245, 0.0032194376, 0.013726547, 0.030107569, 0.040721912, 0.04567533, 0.056733638, 0.062232953, 0.062247, 0.05681272, 0.045930065, 0.04124798, 0.042702086, 0.038568415, 0.028856488, 0.013538917, 0.00425377, 0.0009070124, 0.0034406912, 0.00012643707, 0.0026875106, 0.00060427655, 0.0019745273, 0.010403176, 0.024697918, 0.044911448, 0.059428453, 0.08007492, 0.10693605, 0.12846532, 0.14484857, 0.16783524, 0.18594229, 0.19933772, 0.20815605, 0.2239406, 0.015818365, 0.011004414, 0.00043742932, 0.015913459, 0.026407938, 0.031149892, 0.030207096, 0.023610411, 0.0230548, 0.01679637, 0.004831458, 0.001174934, 0.0012972712, 0.0072806766, 0.019125918, 0.025163544, 0.037174232, 0.04349188, 0.055892948, 0.07441516, 0.08744522, 0.10677842, 0.13248807, 0.16468003, 0.20348959, 0.23755065, 0.036635958, 0.04316592, 0.044077717, 0.051109187, 0.06426565, 0.071898885, 0.074097164, 0.08258488, 0.08570391, 0.08351236, 0.07603158, 0.07490686, 0.08009554, 0.09159096, 0.109422415, 0.13365412, 0.16438323, 0.20173696, 0.23434138, 0.00014140175, 0.0064533027, 0.0069124373, 0.013265812, 0.013809287, 0.0085833995, 0.00929764, 0.015919454, 0.01674654, 0.0118212635, 0.0011489092, 0.0035957617, 0.0024795304, 0.007239604, 0.0061616823, 0.00072404, 0.013424433, 0.02027573, 0.03306474, 0.040129166, 0.041552067, 0.037379835, 0.027621776, 0.012250283, 0.002903679, 0.012218858, 0.02146949, 0.02494399, 0.022701822, 0.0147654535, 0.0011202861, 0.0065789865, 0.00841754, 0.004444094, 0.0063771745, 0.0024847046, 0.0072210534, 0.022764787, 0.044207443, 0.059941046, 0.08179978, 0.09819274, 0.12093067, 0.13846174, 0.16255529, 0.18172319, 0.19614068, 0.21743669, 0.020749433, 0.026643563, 0.038520776, 0.044714533, 0.04530249, 0.040325522, 0.041480973, 0.03704258, 0.027017888, 0.011377538, 0.0017583745, 0.013642297, 0.023178255, 0.03865324, 0.060125917, 0.075992465, 0.08639546, 0.091442406, 0.091204755, 0.09736861, 0.10993239, 0.117286175, 0.11951802, 0.11667986, 0.108787395, 0.107436374, 0.112583905, 0.12422233, 0.14237916, 0.16711605, 0.18695484, 0.202076, 0.21262686, 0.0042674034, 0.01083356, 0.023280228, 0.02994187, 0.03089848, 0.026193338, 0.027533533, 0.023187626, 0.02486651, 0.020839835, 0.022821603, 0.03078706, 0.03304449, 0.041346617, 0.055707037, 0.064479716, 0.06776009, 0.06560716, 0.0697196, 0.06840629, 0.07336978, 0.07292634, 0.07878091, 0.07925906, 0.07440074, 0.06420906, 0.06032079, 0.06267706, 0.07125507, 0.08606837, 0.10716626, 0.13463235, 0.15695176, 0.17431915, 0.1984391, 0.21789156, 0.014388011, 0.019758815, 0.01936741, 0.013248329, 0.0013989961, 0.004513806, 0.0045641325, 0.010496532, 0.010604131, 0.016631253, 0.01687198, 0.023070376, 0.023522481, 0.018268272, 0.0073106284, 0.0023206307, 0.0032302297, 0.0016991679, 0.012461811, 0.017381513, 0.028232966, 0.033341296, 0.04447868, 0.04997617, 0.06160112, 0.06769547, 0.06833708, 0.07524369, 0.0767428, 0.07288138, 0.06366953, 0.049080696, 0.029052183, 0.0034861846, 0.016047087, 0.041412074, 0.061024766, 0.08674541, 0.11868902, 0.14534414, 0.16693307, 0.18364659, 0.1956425, 0.20304488, 0.20594361, 0.21582736, 0.00036131078, 0.005699436, 0.017611563, 0.023706045, 0.024058986, 0.018709725, 0.0076604933, 0.0091233365, 0.031712446, 0.048505407, 0.059647493, 0.07694081, 0.08876718, 0.09524376, 0.0964519, 0.09243646, 0.09485069, 0.09202194, 0.09561391, 0.10561059, 0.11038555, 0.121641316, 0.12777773, 0.14048281, 0.14819054, 0.16256765, 0.18365306, 0.19998722, 0.21172626, 0.015815545, 0.020994399, 0.032125838, 0.03753737, 0.0490017, 0.05485353, 0.06685988, 0.07336797, 0.07445863, 0.08184727, 0.09553993, 0.1039159, 0.11871603, 0.13998605, 0.15619229, 0.16748694, 0.18553221, 0.19886334, 0.20761438, 0.22332937, 0.048690245, 0.05435591, 0.05448282, 0.04910874, 0.038234394, 0.021823764, 0.011502318, 0.007170461, 0.008764382, 0.004550064, 0.006244439, 0.013821114, 0.015583639, 0.02328639, 0.025234558, 0.021477805, 0.012028716, 0.0085671125, 0.0110345725, 0.019409502, 0.033707254, 0.042274784, 0.05690463, 0.077648126, 0.10459144, 0.13785337, 0.16594814, 0.20069112, 0.24222179, 0.012738592, 0.018386653, 0.018261952, 0.01240074, 0.0125072505, 0.018545153, 0.018808808, 0.025041984, 0.025541311, 0.032050192, 0.03286867, 0.028039128, 0.017566849, 0.0014202264, 0.008763266, 0.013084155, 0.011606928, 0.004359176, 0.003037826, 0.0075975778, 0.0063228663, 0.010949561, 0.02146967, 0.026205523, 0.025224695, 0.018557847, 0.01790159, 0.011509923, 0.011083742, 0.016583402, 0.028006224, 0.03368079, 0.033680953, 0.03974345, 0.05186818, 0.058394827, 0.059403762, 0.0666231, 0.068374924, 0.07638547, 0.07898869, 0.087907314, 0.09149042, 0.101454906, 0.10616928, 0.10570293, 0.100088805, 0.10095592, 0.09663299, 0.09876495, 0.10732767, 0.11069065, 0.120544046, 0.12528044, 0.1365797, 0.15446655, 0.16741696, 0.17556073, 0.19051318, 0.20081168, 0.20656782, 0.2192979], 'episode_reward': [14.0, 23.0, 29.0, 24.0, 19.0, 20.0, 13.0, 12.0, 28.0, 11.0, 11.0, 11.0, 12.0, 19.0, 43.0, 15.0, 13.0, 14.0, 25.0, 33.0, 27.0, 25.0, 28.0, 18.0, 13.0, 13.0, 10.0, 19.0, 37.0, 20.0, 78.0, 28.0, 16.0, 15.0, 19.0, 25.0, 13.0, 14.0, 36.0, 21.0, 16.0, 15.0, 19.0, 63.0, 26.0, 24.0, 14.0, 14.0, 73.0, 15.0, 17.0, 21.0, 58.0, 36.0, 51.0, 34.0, 20.0, 35.0, 71.0, 15.0, 17.0, 32.0, 26.0, 44.0, 26.0, 19.0, 48.0, 33.0, 36.0, 46.0, 29.0, 20.0, 29.0, 62.0], 'episode_lengths': [14, 23, 29, 24, 19, 20, 13, 12, 28, 11, 11, 11, 12, 19, 43, 15, 13, 14, 25, 33, 27, 25, 28, 18, 13, 13, 10, 19, 37, 20, 78, 28, 16, 15, 19, 25, 13, 14, 36, 21, 16, 15, 19, 63, 26, 24, 14, 14, 73, 15, 17, 21, 58, 36, 51, 34, 20, 35, 71, 15, 17, 32, 26, 44, 26, 19, 48, 33, 36, 46, 29, 20, 29, 62]}, 'sampler_perf': {'mean_raw_obs_processing_ms': 0.28717190123902475, 'mean_inference_ms': 0.7847068388578435, 'mean_action_processing_ms': 0.11854633483138652, 'mean_env_wait_ms': 0.061531060757738516, 'mean_env_render_ms': 0.0}, 'num_faulty_episodes': 0, 'connector_metrics': {}}",1.24064,0.145749,1.24064,"{'training_iteration_time_ms': 123.265, 'load_time_ms': 0.3, 'load_throughput': 666291.342, 'learn_time_ms': 5.038, 'learn_throughput': 39700.554, 'synch_weights_time_ms': 0.0}",1682231234,0,2000,10,de7e6_00000,0.0624025


[2m[36m(PG pid=22772)[0m postprocessed 12 steps
[2m[36m(PG pid=22772)[0m episode 224906159115926065 (env-idx=1) ended with length 12 and pole angles 0.08085270971059799
[2m[36m(PG pid=22772)[0m episode 546051817624544973 (env-idx=1) started.
[2m[36m(PG pid=22772)[0m postprocessed 28 steps
[2m[36m(PG pid=22772)[0m episode 849675155454027208 (env-idx=0) ended with length 28 and pole angles 0.06950537860393524
[2m[36m(PG pid=22772)[0m episode 901692773908464672 (env-idx=0) started.
[2m[36m(PG pid=22772)[0m postprocessed 11 steps
[2m[36m(PG pid=22772)[0m episode 546051817624544973 (env-idx=1) ended with length 11 and pole angles 0.0999380424618721
[2m[36m(PG pid=22772)[0m episode 493934757727956784 (env-idx=1) started.
[2m[36m(PG pid=22772)[0m postprocessed 5 steps
[2m[36m(PG pid=22772)[0m postprocessed 2 steps
[2m[36m(PG pid=22772)[0m returned sample batch of size 200
[2m[36m(PG pid=22772)[0m policy.learn_on_batch() result: PGTorchPolicy -> sum actio

2023-04-23 08:27:15,335	INFO tune.py:798 -- Total run time: 8.61 seconds (8.36 seconds for the tuning loop).


{'num_batches_mean': 1.2297297297297298, 'num_batches_min': 1, 'num_batches_max': 2, 'pole_angle_mean': 0.08164537, 'pole_angle_min': 0.03770415, 'pole_angle_max': 0.124951355}
