## Installation and Imports

In [1]:
# Print the current working directory.
!pwd

/home/daniel/DARM/darm_mujoco/darm_training


In [2]:
# Configure env variables

# DARM_MUJOCO_PATH is used later in this notebook as the root under which
# darm_training/results is written. A value already present in the environment
# wins, so the notebook can move between machines without editing this cell;
# the literal below is only the fallback.
# TODO: change the fallback path if the variable is not set externally
import os
os.environ.setdefault("DARM_MUJOCO_PATH", "/workspace/darm-mujoco")
os.getenv('DARM_MUJOCO_PATH')

'/home/daniel/DARM/darm_mujoco'

In [3]:
# Check if GCC is installed: prints the compiler version when it is available
!gcc --version

gcc (Ubuntu 7.5.0-3ubuntu1~18.04) 7.5.0
Copyright (C) 2017 Free Software Foundation, Inc.
This is free software; see the source for copying conditions.  There is NO
warranty; not even for MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.



In [None]:
# Install GCC if absent
# Refresh the apt package index, then install build-essential without prompting (-y).
!sudo apt update
!sudo apt install build-essential -y

In [None]:
# # Setup Mujoco for gym - If needed
# !apt-get install -y \
#     libgl1-mesa-dev \
#     libgl1-mesa-glx \
#     libglew-dev \
#     libosmesa6-dev \
#     software-properties-common

# !apt-get install -y patchelf

# !pip install gym

# !pip install free-mujoco-py

# import mujoco_py
# import gym

In [3]:
!pip install ray[rllib] torch
!pip install wandb
!pip install tensorflow_probability



In [4]:
%%bash
# Move one directory up from the notebook and run the setup.py found there
# (the captured output shows it installing the darm_gym_env package).
cd ..
python setup.py install

/home/daniel/DARM/darm_mujoco
running install
running bdist_egg
running egg_info
writing darm_gym_env.egg-info/PKG-INFO
writing dependency_links to darm_gym_env.egg-info/dependency_links.txt
writing requirements to darm_gym_env.egg-info/requires.txt
writing top-level names to darm_gym_env.egg-info/top_level.txt
reading manifest file 'darm_gym_env.egg-info/SOURCES.txt'
writing manifest file 'darm_gym_env.egg-info/SOURCES.txt'
installing library code to build/bdist.linux-x86_64/egg
running install_lib
running build_py
creating build/bdist.linux-x86_64/egg
creating build/bdist.linux-x86_64/egg/darm_gym_env
copying build/lib/darm_gym_env/darm_sf_gym.py -> build/bdist.linux-x86_64/egg/darm_gym_env
copying build/lib/darm_gym_env/__init__.py -> build/bdist.linux-x86_64/egg/darm_gym_env
copying build/lib/darm_gym_env/multi_darm_gym.py -> build/bdist.linux-x86_64/egg/darm_gym_env
copying build/lib/darm_gym_env/darm_gym.py -> build/bdist.linux-x86_64/egg/darm_gym_env
copying build/lib/darm_gym_e

In [None]:
# Check if mujoco import is successful
import mujoco

In [None]:
# If mujoco import fails, update pandas and restart runtime
!pip install pandas -U

In [None]:
# # If GLFW is absent
# %%bash
# sudo apt-get install libglfw3 -y
# sudo apt-get install libglfw3-dev -y
# pip install --user glfw

In [1]:
import ray
from ray.rllib.algorithms.sac import SACConfig
from ray.tune.registry import register_env
from ray.tune.logger import pretty_print

from ray import air, tune
from ray.air import session
from ray.air.integrations.wandb import setup_wandb
from ray.air.integrations.wandb import WandbLoggerCallback

import gym
from darm_gym_env import DARMEnv

### TODO:
- Change `single_finger_env=False` (in the environment registration and the config)
- Change `run_local_dir`
- Change the run name, notes, and tags

## Register Environment with RLlib

In [2]:
def make_env(env_config):
    """Build the DARM hand environment used for training.

    Args:
        env_config: Accepted so the function can be used as an env creator,
            but not read; every setting is fixed below.

    Returns:
        A DARMEnv (hand "hand1", single_finger_env=False, no rendering)
        wrapped in a 200-step TimeLimit and an observation transform that
        multiplies each observation by 100.
    """
    def scale_obs(obs):
        # Same scaling the notes describe as converting m, m/s to cm, cm/s.
        return obs*100

    base_env = DARMEnv(
        render_mode=None,
        action_time=0.08,
        hand_name="hand1",
        single_finger_env=False,
    )
    time_limited = gym.wrappers.TimeLimit(env=base_env, max_episode_steps=200)
    return gym.wrappers.TransformObservation(time_limited, scale_obs)

# make_env already takes a single env_config argument, so it is used directly
# as the creator registered under the id referenced by the SAC config.
env_creator = make_env
register_env("darm/DarmHand-v0", env_creator)

## Configure Run

In [5]:
# TODO:
# change: rollout_workers
# change: gpu

# SAC configuration for the registered "darm/DarmHand-v0" environment.
# The Q-network and the policy network use the same layer sizes and activation.
config = (
    SACConfig()
    .environment(
        env="darm/DarmHand-v0",
        normalize_actions=True
    )
    .training(
        q_model_config={
            "fcnet_activation": "relu",
            "fcnet_hiddens": [128, 256, 256, 128] # [256, 256]
        },
        policy_model_config={
            "fcnet_activation": "relu",
            "fcnet_hiddens": [128, 256, 256, 128] # [256, 256]
        },
        tau=0.005,
        target_entropy="auto",
        n_step=1,  # N-step return length for the Q targets, not a number of SGD steps (see RLlib SACConfig docs)
        train_batch_size=256,
        target_network_update_freq=1,
        replay_buffer_config={"type":"MultiAgentPrioritizedReplayBuffer"},
        num_steps_sampled_before_learning_starts=40_000, # timesteps (transitions)
        optimization_config={
          "actor_learning_rate": 0.0003,
          "critic_learning_rate": 0.0003,
          "entropy_learning_rate": 0.0003,
        },
        clip_actions=False
    )
    .rollouts(
        num_rollout_workers=3,
        num_envs_per_worker=1,
        rollout_fragment_length=1,
        recreate_failed_workers=True,
        num_consecutive_worker_failures_tolerance=10,
        restart_failed_sub_environments=True,
        # batch_mode="complete_episodes"
    )
    .resources(num_gpus=0)
    .evaluation(evaluation_interval=100) # Training iterations
    .reporting(
        min_sample_timesteps_per_iteration=1000,
        metrics_num_episodes_for_smoothing=5
    )
    .framework(framework="torch")
)

In [6]:
# TODO:
# change: run name
# change: notes
# change: tags
# change: wandb config

# Used as the Tune experiment name, the W&B run name, and the sub-directory
# from which an interrupted run is restored.
run_name = "test1_MF_RLlib_SAC (done_all)"

# Free-text changelog for this run; passed to the W&B callback as `notes`.
notes = """
- The environment was updated such that the target is within a range from the start point
- Velocity penalty was removed and only effort penalty was used
- The reward function was updated according to the reach task reward used in facebookresearch/myosuite [https://github.com/facebookresearch/myosuite/blob/main/myosuite/envs/myo/reach_v0.py]
- The done signal is trigerred only when the fingertip goes beyond a threshold. The episode continues to the maximum timestep otherwise.
- The friction and damping coefficient of the environment is updated. Values are inspired from Deepmind's Mujoco Menagerie [https://github.com/deepmind/mujoco_menagerie/blob/main/shadow_hand/right_hand.xml]
- The range of action from the model was changed to [-1, 1]. This action is mapped to the actual action sent to mujoco e.g [0, 2]]. This change is inspired from values used in OpenAI's Gym Mujoco environments.
- max_episode_steps was updated to 200.
- Velocity vector (size [3,]) was added to observation. Observation size is now (9,)
- Action range was increased to [0, 5]
- Observation warpper to scale observation from m and m/s to cm and cm/s was applied
- Max Tension for Digitorum Extensor Communis was increased to 10
- FIXED: Velocity Observation from (prev_pos - new_pos)/time to (new_pos - prev_pos)/time
- FIXED: Removed weight of 1 from 'sparse', 'solved', and 'done' in reward weighting
- Reduced max_target_th to 5*0.004, 20 mm
- Changed done signal to be trigerred only when all fingers have exceeded the max_threshold
- Updated the penalty reward weight to 1 (from 50) for the `done_all` behaviour

- Five-Fingers; No Wrist Environment
- This run was trained on vast_ai using RLlib's SAC algo.
"""

# W&B tags for this run. Every tag needs its own comma: Python concatenates
# adjacent string literals, which previously merged two tags into "done_allsac".
tags = ["five_fingers", "done_all", "sac", "rllib", "vast_ai"]



# Keyword arguments later unpacked into WandbLoggerCallback. The nested
# "config" entry records the key run settings and is also where the Tuner
# cell reads its stop criterion, results directory and checkpoint policy.
wandb_init = {
    "save_code": True,
    "resume": True,
    "config": {
        # Mirrored from the SAC config object
        "env": config.env,
        "num_rollout_workers": config.num_rollout_workers,
        "num_envs_per_worker": config.num_envs_per_worker,
        "recreate_failed_workers": config.recreate_failed_workers,
        "num_consecutive_worker_failures_tolerance": config.num_consecutive_worker_failures_tolerance,
        "restart_failed_sub_environments": config.restart_failed_sub_environments,
        "num_gpus": config.num_gpus,
        "framework": config.framework_str,

        # Stop criterion and output location
        "stop_episode_reward_mean": 1_300,
        "run_local_dir": f"{os.getenv('DARM_MUJOCO_PATH')}/darm_training/results/darm_mf_hand",

        # Checkpointing
        "checkpoint_at_end": True,
        "checkpoint_score_attribute": "episode_reward_mean",  # or leave to save last chkpts
        "checkpoint_score_order": "max",
        "checkpoint_frequency": 10,   # iterations
        "num_checkpoints_to_keep": 3,
        "save_checkpoints_to_wandb": True,
    },
    "tags": tags,
    "notes": notes,
    "name": run_name,
    # job_type=
    # monitor_gym=
}

In [7]:
# Print the current working directory.
!pwd

[Errno 2] No such file or directory: '/home/daniel/DARM/darm-mujoco/darm_training/'
/home/daniel/DARM/darm_mujoco/darm_training


## Run

In [8]:
# TODO:
# change: name
# change: checkpoint_freq

sync_config = tune.SyncConfig()

# The stop criterion, results directory and checkpoint policy are read back from
# wandb_init["config"], so the values recorded in W&B are the ones actually used.
tuner = tune.Tuner(
    "SAC",
    param_space=config,
    run_config=air.RunConfig(
        name=run_name,
        sync_config=sync_config,
        stop={"episode_reward_mean": wandb_init["config"]["stop_episode_reward_mean"]},

        local_dir=wandb_init["config"]["run_local_dir"],
        checkpoint_config=air.CheckpointConfig(
            checkpoint_at_end=wandb_init["config"]["checkpoint_at_end"],
            checkpoint_score_attribute=wandb_init["config"]["checkpoint_score_attribute"],  # or leave to save last chkpts
            checkpoint_score_order=wandb_init["config"]["checkpoint_score_order"],
            checkpoint_frequency=wandb_init["config"]["checkpoint_frequency"],
            num_to_keep=wandb_init["config"]["num_checkpoints_to_keep"],
        ),
        callbacks=[
            WandbLoggerCallback(
                project="DARM",
                # SECURITY: the W&B key must not live in the notebook. It is read
                # from the WANDB_API_KEY environment variable; when that is unset,
                # None is passed and an existing `wandb login` is expected to
                # provide the credentials (per the Ray callback docs).
                # The key that used to be hard-coded here should be revoked.
                api_key=os.environ.get("WANDB_API_KEY"),
                save_checkpoints=wandb_init["config"]["save_checkpoints_to_wandb"],
                **wandb_init,
            )
        ],
    ),
)

# Start training; blocks until the stop criterion is met or the run is interrupted.
results = tuner.fit()

2023-03-04 22:05:16,324	INFO worker.py:1538 -- Started a local Ray instance.


0,1
Current time:,2023-03-04 22:13:18
Running for:,00:08:00.60
Memory:,5.5/7.5 GiB

Trial name,status,loc,iter,total time (s),ts,reward,episode_reward_max,episode_reward_min,episode_len_mean
SAC_darm_DarmHand-v0_441d8_00000,RUNNING,192.168.93.36:8473,24,448.089,24048,-11.3509,-1.72362,-38.8535,2.39524


[2m[36m(SAC pid=8473)[0m 2023-03-04 22:05:22,519	INFO algorithm.py:501 -- Current log_level is WARN. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[34m[1mwandb[0m: Currently logged in as: [33mdanieladejumo[0m. Use [1m`wandb login --relogin`[0m to force relogin
[2m[33m(raylet)[0m [2023-03-04 22:05:25,218 E 8212 8264] (raylet) file_system_monitor.cc:105: /tmp/ray/session_2023-03-04_22-05-12_873660_8091 is over 95% full, available space: 309374976; capacity: 31845081088. Object creation will fail if spilling is required.


[2m[36m(RolloutWorker pid=8578)[0m Loaded XML file successfully
[2m[36m(RolloutWorker pid=8579)[0m Loaded XML file successfully
[2m[36m(RolloutWorker pid=8577)[0m Loaded XML file successfully


[2m[36m(RolloutWorker pid=8578)[0m   logger.warn(
[2m[36m(RolloutWorker pid=8578)[0m   return ufunc.reduce(obj, axis, dtype, out, **passkwargs)
[2m[36m(RolloutWorker pid=8579)[0m   logger.warn(
[2m[36m(RolloutWorker pid=8579)[0m   return ufunc.reduce(obj, axis, dtype, out, **passkwargs)
[2m[36m(RolloutWorker pid=8577)[0m   logger.warn(
[2m[36m(RolloutWorker pid=8577)[0m   return ufunc.reduce(obj, axis, dtype, out, **passkwargs)


[2m[36m(SAC pid=8473)[0m Loaded XML file successfully


[2m[36m(SAC pid=8473)[0m   logger.warn(
[2m[36m(SAC pid=8473)[0m   return ufunc.reduce(obj, axis, dtype, out, **passkwargs)
[2m[36m(SAC pid=8473)[0m 2023-03-04 22:05:33,954	INFO trainable.py:172 -- Trainable.setup took 11.436 seconds. If your trainable is slow to initialize, consider setting reuse_actors=True to reduce actor creation overheads.
[2m[36m(RolloutWorker pid=8578)[0m   return ufunc.reduce(obj, axis, dtype, out, **passkwargs)
[2m[36m(RolloutWorker pid=8579)[0m   return ufunc.reduce(obj, axis, dtype, out, **passkwargs)
[2m[36m(RolloutWorker pid=8577)[0m   return ufunc.reduce(obj, axis, dtype, out, **passkwargs)
[2m[33m(raylet)[0m [2023-03-04 22:05:35,226 E 8212 8264] (raylet) file_system_monitor.cc:105: /tmp/ray/session_2023-03-04_22-05-12_873660_8091 is over 95% full, available space: 309395456; capacity: 31845081088. Object creation will fail if spilling is required.


[2m[33m(raylet)[0m [2023-03-04 22:05:45,238 E 8212 8264] (raylet) file_system_monitor.cc:105: /tmp/ray/session_2023-03-04_22-05-12_873660_8091 is over 95% full, available space: 301801472; capacity: 31845081088. Object creation will fail if spilling is required.


Trial name,agent_timesteps_total,counters,custom_metrics,date,done,episode_len_mean,episode_media,episode_reward_max,episode_reward_mean,episode_reward_min,episodes_this_iter,episodes_total,experiment_id,hostname,info,iterations_since_restore,node_ip,num_agent_steps_sampled,num_agent_steps_trained,num_env_steps_sampled,num_env_steps_sampled_this_iter,num_env_steps_trained,num_env_steps_trained_this_iter,num_faulty_episodes,num_healthy_workers,num_in_flight_async_reqs,num_remote_worker_restarts,num_steps_trained_this_iter,perf,pid,policy_reward_max,policy_reward_mean,policy_reward_min,sampler_perf,sampler_results,time_since_restore,time_this_iter_s,time_total_s,timers,timestamp,timesteps_since_restore,timesteps_total,training_iteration,trial_id,warmup_time
SAC_darm_DarmHand-v0_441d8_00000,24048,"{'num_env_steps_sampled': 24048, 'num_env_steps_trained': 0, 'num_agent_steps_sampled': 24048, 'num_agent_steps_trained': 0}",{},2023-03-04_22-13-03,False,2.39524,{},-1.72362,-11.3509,-38.8535,420,9932,e3f595c5d2ba460d86c03634807ab0fd,Daniel,"{'learner': {}, 'num_env_steps_sampled': 24048, 'num_env_steps_trained': 0, 'num_agent_steps_sampled': 24048, 'num_agent_steps_trained': 0}",24,192.168.93.36,24048,0,24048,1002,0,0,0,3,0,0,0,"{'cpu_util_percent': 70.3, 'ram_util_percent': 73.824}",8473,{},{},{},"{'mean_raw_obs_processing_ms': 1.7310121185639078, 'mean_inference_ms': 2.7685341099785785, 'mean_action_processing_ms': 0.24416055035653292, 'mean_env_wait_ms': 38.429847638479295, 'mean_env_render_ms': 0.0}","{'episode_reward_max': -1.72362071596495, 'episode_reward_min': -38.85352224854191, 'episode_reward_mean': -11.350921100289094, 'episode_len_mean': 2.395238095238095, 'episode_media': {}, 'episodes_this_iter': 420, 'policy_reward_min': {}, 'policy_reward_max': {}, 'policy_reward_mean': {}, 'custom_metrics': {}, 'hist_stats': {'episode_reward': [-10.245991080144384, -8.547734768318819, -9.432476686886917, -30.193930365564547, -10.073309502371437, -8.56415075699751, -8.480237826561648, -8.566435377292052, -6.952581825903833, -8.478006493090598, -15.352389314576442, -9.276726401995333, -8.479707242619693, -6.878436014124647, -7.973921682483152, -9.496301983182564, -6.254664882306285, -9.434364837867987, -6.226498639613418, -19.373562580067446, -8.562920120434603, -8.567117424303692, -20.175399000547745, -14.714355428969931, -18.63369893661234, -10.170108074891656, -6.874345761464333, -7.094541284130978, -10.171469597000128, -9.449129726601873, -9.423905118030063, -6.14488959648396, -17.907114743045494, -20.172734057909043, -10.171784394134484, -20.17092758881772, -7.67445771446288, -8.559190325686503, -7.7399063561637576, -10.176623308810713, -13.834490289720431, -6.1491097823153105, -10.159657910813271, -6.9400469004994365, 
-13.037352761038782, -17.7688374053206, -18.578464577508196, -8.554334535883207, -8.552009024227123, -16.155354487640924, -8.47948558679048, -18.54666330725534, -5.337101622260864, -18.66223141889287, -8.475691910405383, -6.166989986260496, -5.355283063716729, -19.361340429778064, -8.64759129881985, -30.20164884700625, -18.562440780618324, -7.744460658730951, -15.431192111333328, -3.17349853904721, -7.826758418305063, -7.7572994073549175, -7.052135277116246, -6.127036395020221, -8.550346066997095, -8.64464344847958, -13.80614462048766, -3.2118033476655485, -7.11486921497155, -7.754984263548274, -6.87964463971832, -8.649534362290655, -6.31912995332605, -5.34569196436833, -19.363457287421696, -9.283828369230964, -17.051124359822065, -17.032569895194957, -17.756633779327174, -10.088552729728757, -8.564102494238906, -9.435613340682256, -6.962382215721004, -7.6728882170723605, -7.050245648274552, -27.762522400428995, -8.556480706034941, -17.91440243841104, -8.562233039939505, -10.256779755877231, -7.67980938455122, -10.073326932418608, -7.856093506537468, -9.36439470014452, -9.279281483792076, -18.57293556671934, -8.644786244925518, -6.311437677903491, -18.56390729928166, -9.360157760080288, -18.710760995967327, -17.829384838972803, -7.748965670324662, -8.479319930705234, -5.448978570794594, -10.170818177763064, -20.271203781056272, -7.764163366622569, -7.760337878705135, -8.554795805808197, -7.743536849990398, -8.56579234655459, -18.56930795458686, -9.368540609960974, -29.37571875277647, -7.831428226949152, -10.083579350432158, -10.240651620994141, -10.087734142148152, -20.17619623460324, -8.548642378524406, -18.576058119251908, -10.178564871175526, -19.38029422384145, -10.16950715457368, -9.283630771722763, -17.769268760099237, -18.63670052528408, -9.279458021354987, -8.483879229259058, -6.149987033605681, -9.3699970168375, -19.35765525181303, -17.122577416688497, -6.148340869686653, -8.479523728550824, -9.62525812206577, -10.169177805653447, -9.29540116864736, 
-8.562693370458087, -10.083950229186225, -20.240996161479394, -7.768934926719619, -8.572274151141293, -18.795013525714065, -17.77522696613029, -9.270354065055594, -5.3419789249309915, -5.4343965556097125, -6.136672195342161, -7.039044892359543, -10.085211040365873, -16.973963480843565, -8.628351022873161, -6.949972260499814, -19.466273599181584, -18.65162192827899, -16.231113744778412, -6.959218983570343, -8.052674545443265, -10.16868358513125, -8.655750747116201, -10.155990919627857, -8.555058217174121, -7.831950736036273, -9.287765328585092, -18.577744455716882, -6.957462143631568, -19.376174574934026, -8.47014833993822, -10.087524476169696, -9.441797063136256, -8.36027410681623, -19.37126602947628, -10.092547996596057, -19.374927528657572, -8.558183859554818, -10.080634972962821, -20.153380579471758, -13.189925144742421, -20.26407542986189, -9.3624731317662, -10.086737384053302, -8.479882755715895, -7.822588757227888, -10.149365379592238, -7.741280055693386, -5.576263098770758, -10.16546152989559, -9.34778795141966, -19.3576947626475, -8.484163241951322, -6.220885091522396, -8.479977717786708, -7.03887347319789, -28.71408614218094, -9.427969762998023, -16.955418309094785, -6.947928598908286, -9.357118301737252, -9.51102169610295, -8.566313921941472, -7.75682586387744, -7.026973450167676, -7.7509884912044384, -9.456978418174318, -8.555880351567943, -4.615067930853334, -11.762654311120947, -9.447941868394903, -6.2422913578424755, -2.3232066353040253, -7.910443466681077, -16.982695645105114, -16.312633883116458, -19.366442257529158, -8.57765016813692, -6.137433337139986, -16.967731903381342, -10.154293503010367, -20.160552246178092, -7.6840033166906405, -18.71970441338924, -17.852258679161388, -6.226403779374798, -18.56464840459407, -10.089519169295652, -7.036359861897987, -10.16748533967374, -7.976104257670995, -10.245953814085276, -20.155917448766125, -18.581617267966763, -8.564991640577514, -8.476578384873202, -18.646215255741794, -6.319931438717303, 
-30.187165237252653, -10.081121648630305, -5.507412975770798, -10.168541806451698, -6.219860587813267, -10.086115692633097, -10.1692754076098, -7.035261572009135, -18.56486301870453, -9.363309741324228, -6.232388849566779, -4.624578221814368, -10.182905696545241, -9.29289022599403, -10.159863054384173, -9.35846177129209, -9.38837941671737, -9.353594352673083, -7.120943826432337, -8.481666005837434, -27.05874654075968, -17.04482919226417, -3.840553343092667, -10.08224008539047, -20.177101831332266, -8.559986387393218, -18.576108752227245, -16.24931967836715, -19.451124322276108, -10.087088749138001, -19.53757722409213, -8.573213385690043, -10.07633806925036, -8.482489110825288, -10.178017100605329, -10.251183773471196, -8.559893647268574, -10.08705824879294, -3.990859723888488, -10.182678350736875, -7.754582025122642, -5.348051950075704, -10.159411932603163, -2.9386092699578654, -19.523483892947016, -10.08499792535398, -5.351098808314134, -7.756217704027609, -19.61644633254796, -19.295016512679464, -9.284244309933637, -6.971192775797413, -8.638126058271574, -9.430889311852814, -20.17113695926114, -17.844902407175837, -10.167188439695284, -9.280961565268708, -10.163932556912588, -20.162574666990718, -10.164185923656143, -7.270477874757538, -8.556248530225774, -9.383700953291761, -10.180605309179366, -9.377759059007738, -8.663220655847816, -18.58662003439965, -7.781585053937363, -8.63096430285411, -8.554618754390903, -7.009191583716851, -6.305413646397316, -2.2811456707174136, -10.16756696634759, -10.24626173746133, -16.96277366986527, -6.207131489299878, -8.725266119435997, -3.888433335708891, -18.565224515979395, -6.15529097287256, -10.081818952503792, -10.264617433835934, -7.765222727684681, -7.921879451886241, -10.093792464241638, -9.345391864638849, -19.366219254246943, -8.538970938977648, -6.958984717752032, -28.588749286941706, -16.156583841623437, -7.135109877258527, -5.434097875452048, -5.439681786231042, -9.366092158317091, -7.0279373876383975, 
-1.72362071596495, -18.6477856786284, -7.832471588310828, -19.45432969101024, -9.445832663332315, -9.427588512563826, -19.37283514130595, -3.2834545443267524, -9.348628967749244, -8.482077808813838, -10.16878388277411, -6.54606708864036, -7.047421030893487, -10.176281012234886, -10.072884240555778, -7.83712394398566, -9.2762438953078, -9.370888228473682, -10.506748976434247, -10.164119377978377, -10.166216837167156, -16.961069713160196, -10.1671587868539, -8.48354264610808, -9.284553713311672, -8.613821005551891, -29.46721210604557, -17.829672850105258, -8.472961803120178, -9.44221431258228, -15.426983265226003, -8.473936916560309, -38.85352224854191, -8.558516619863745, -28.663808723988208, -10.078278096294076, -8.558515486823831, -8.649436065436284, -8.567191956654792, -7.678148536868539, -14.629765059898428, -20.169635555785078, -20.183325355289014, -17.843501573035965, -37.77838060555768, -27.1530949458881, -8.498936957075887, -6.209097597934279, -18.55644734431131, -10.088328766825375, -7.764116593740217, -7.7599825158359605, -5.358761494650594, -10.152694103895485, -20.164190890332918, -18.564762999056992, -10.087736488850956, -30.19085154058968, -7.677535157636543, -10.091773496237, -10.083595397711642, -5.4241336209524045, -16.725854295915955, -13.196575090692464, -8.560910775210951, -7.7680922214836245, -3.174335733178159, -6.159953455186166, -8.483348585318149, -9.524391539056301, -7.7647691970079915, -6.240224222076087, -16.236664314965044, -18.57094387930164, -10.178202944689444, -6.882602187338316, -9.373633328884921, -8.47166530628913, -17.038089930371157, -9.447005731522037, -8.642792757721049], 'episode_lengths': [3, 2, 3, 2, 1, 2, 1, 2, 2, 1, 2, 1, 1, 1, 5, 4, 3, 3, 3, 2, 2, 2, 2, 4, 3, 2, 1, 4, 2, 3, 3, 2, 4, 2, 2, 2, 1, 2, 2, 2, 3, 2, 2, 2, 3, 2, 2, 2, 2, 2, 1, 2, 2, 3, 1, 2, 2, 2, 3, 2, 2, 2, 3, 5, 3, 2, 3, 2, 2, 3, 3, 5, 4, 2, 1, 3, 4, 2, 2, 1, 3, 3, 2, 1, 2, 3, 2, 1, 3, 2, 2, 4, 2, 3, 1, 1, 3, 2, 1, 2, 3, 4, 2, 2, 4, 3, 2, 1, 3, 2, 3, 2, 2, 2, 
2, 2, 2, 2, 2, 3, 1, 3, 1, 2, 2, 2, 2, 2, 2, 1, 2, 3, 1, 1, 2, 2, 2, 4, 2, 1, 5, 2, 1, 2, 1, 3, 2, 2, 5, 2, 1, 2, 3, 2, 3, 1, 2, 3, 2, 3, 3, 3, 2, 6, 2, 3, 2, 2, 3, 1, 2, 2, 2, 1, 1, 3, 5, 2, 1, 2, 2, 1, 2, 5, 3, 2, 1, 1, 3, 2, 2, 5, 2, 2, 2, 1, 3, 1, 3, 4, 3, 2, 2, 2, 4, 2, 2, 3, 2, 3, 2, 3, 7, 3, 3, 4, 4, 2, 4, 2, 2, 2, 2, 2, 2, 1, 4, 3, 3, 2, 1, 3, 2, 5, 3, 2, 2, 2, 1, 3, 4, 2, 1, 4, 2, 3, 1, 2, 3, 2, 2, 3, 3, 2, 1, 2, 2, 2, 2, 4, 1, 3, 3, 3, 1, 2, 2, 2, 3, 3, 1, 4, 2, 1, 1, 2, 3, 2, 1, 5, 2, 2, 2, 2, 2, 4, 1, 2, 2, 5, 1, 1, 2, 3, 3, 2, 3, 2, 1, 2, 2, 2, 6, 2, 2, 2, 2, 3, 2, 2, 3, 2, 3, 4, 4, 2, 3, 2, 3, 4, 4, 2, 2, 1, 3, 2, 4, 1, 2, 2, 2, 2, 2, 2, 4, 3, 3, 2, 3, 7, 3, 3, 3, 3, 3, 2, 6, 2, 1, 2, 7, 3, 2, 1, 3, 1, 2, 6, 2, 2, 2, 2, 1, 1, 3, 3, 3, 1, 3, 3, 1, 5, 2, 3, 1, 2, 3, 2, 1, 3, 2, 2, 3, 2, 4, 1, 3, 2, 1, 2, 2, 2, 2, 2, 2, 1, 2, 1, 1, 1, 3, 9, 5, 2, 2, 5, 2, 1, 4, 2, 3, 3, 2, 2, 1, 2, 1, 3, 3, 3]}, 'sampler_perf': {'mean_raw_obs_processing_ms': 1.7310121185639078, 'mean_inference_ms': 2.7685341099785785, 'mean_action_processing_ms': 0.24416055035653292, 'mean_env_wait_ms': 38.429847638479295, 'mean_env_render_ms': 0.0}, 'num_faulty_episodes': 0}",448.089,18.0154,448.089,{'training_iteration_time_ms': 51.044},1677964383,0,24048,24,441d8_00000,11.4449


[2m[33m(raylet)[0m [2023-03-04 22:05:55,244 E 8212 8264] (raylet) file_system_monitor.cc:105: /tmp/ray/session_2023-03-04_22-05-12_873660_8091 is over 95% full, available space: 301641728; capacity: 31845081088. Object creation will fail if spilling is required.
[2m[33m(raylet)[0m [2023-03-04 22:06:05,250 E 8212 8264] (raylet) file_system_monitor.cc:105: /tmp/ray/session_2023-03-04_22-05-12_873660_8091 is over 95% full, available space: 305246208; capacity: 31845081088. Object creation will fail if spilling is required.
[2m[33m(raylet)[0m [2023-03-04 22:06:15,256 E 8212 8264] (raylet) file_system_monitor.cc:105: /tmp/ray/session_2023-03-04_22-05-12_873660_8091 is over 95% full, available space: 305152000; capacity: 31845081088. Object creation will fail if spilling is required.
[2m[33m(raylet)[0m [2023-03-04 22:06:25,265 E 8212 8264] (raylet) file_system_monitor.cc:105: /tmp/ray/session_2023-03-04_22-05-12_873660_8091 is over 95% full, available space: 305037312; capacity: 

In [16]:
# Ensure wandb is syncing to the cloud.
# If it is not, cd to darm_training again.

In [10]:
# TODO:
# change: experiment name

# Rebuild the Tuner of an interrupted run from its experiment directory,
# <run_local_dir>/<run_name>, asking restore to resume errored trials as well.
tuner = tune.Tuner.restore(
    "/".join((wandb_init["config"]["run_local_dir"], run_name)),
    resume_errored=True,
)
tuner

2023-02-11 17:26:13,607	INFO experiment_analysis.py:795 -- No `self.trials`. Drawing logdirs from checkpoint file. This may result in some information that is out of sync, as checkpointing is periodic.


<ray.tune.tuner.Tuner at 0x7fede99d9a90>

[2m[33m(raylet)[0m [2023-02-11 17:26:16,601 E 14732 14777] (raylet) file_system_monitor.cc:105: /tmp/ray/session_2023-02-11_17-23-24_266872_14581 is over 95% full, available space: 1061720064; capacity: 31845081088. Object creation will fail if spilling is required.


In [15]:
# Collect the results known to the tuner (displayed as a ResultGrid).
results = tuner.get_results()
results

<ray.tune.result_grid.ResultGrid at 0x7fcd58384b80>

In [16]:
# Get the best result based on a particular metric:
# here, the result with the highest episode_reward_mean.
best_result = results.get_best_result(metric="episode_reward_mean", mode="max")
best_result

Result(metrics={'custom_metrics': {}, 'episode_media': {}, 'info': {'learner': {'default_policy': {'learner_stats': {'allreduce_latency': 0.0, 'grad_gnorm': 8.343955039978027, 'actor_loss': -5.076763153076172, 'critic_loss': 0.4612053632736206, 'alpha_loss': -0.850807249546051, 'alpha_value': 0.9030595, 'log_alpha_value': -0.101966895, 'target_entropy': -5.0, 'policy_t': -0.01997794397175312, 'mean_q': 2.0334110260009766, 'max_q': 2.8355112075805664, 'min_q': 1.038293480873108}, 'td_error': array([9.46030378e-01, 4.29627061e-01, 2.65497327e-01, 8.43869328e-01,
       1.09686172e+00, 7.66791701e-01, 7.26696014e-01, 5.70532084e-02,
       1.14584994e+00, 4.43507016e-01, 1.04901314e-01, 1.52089047e+00,
       6.52013183e-01, 8.16148460e-01, 1.08409297e+00, 2.61833251e-01,
       3.79876256e-01, 9.56449747e-01, 5.75677335e-01, 1.02149987e+00,
       1.76170349e-01, 9.50863540e-01, 7.04805613e-01, 3.25276971e-01,
       6.36387825e-01, 8.46629441e-01, 5.59558868e-02, 8.83865356e-03,
       

In [17]:
# Get the best checkpoint corresponding to the best result.
# It is displayed as a Checkpoint and is used below to rebuild the Algorithm.
best_checkpoint = best_result.checkpoint
best_checkpoint

Checkpoint(local_path=/home/daniel/DARM/darm_mujoco/darm_training/results/Test_DARMSF_DELTA_TARGET/SAC_darm_DarmSFHand-v0_a1dbe_00000_0_2023-02-11_16-49-13/results/Test_DARMSF_DELTA_TARGET/SAC_darm_DarmSFHand-v0_ad8de_00000_0_2023-02-11_16-56-43/checkpoint_000011)

[2m[33m(raylet)[0m [2023-02-11 17:00:32,579 E 9254 9299] (raylet) file_system_monitor.cc:105: /tmp/ray/session_2023-02-11_16-49-09_974082_9002 is over 95% full, available space: 1129005056; capacity: 31845081088. Object creation will fail if spilling is required.
[2m[33m(raylet)[0m [2023-02-11 17:00:42,596 E 9254 9299] (raylet) file_system_monitor.cc:105: /tmp/ray/session_2023-02-11_16-49-09_974082_9002 is over 95% full, available space: 1129254912; capacity: 31845081088. Object creation will fail if spilling is required.
[2m[33m(raylet)[0m [2023-02-11 17:00:52,615 E 9254 9299] (raylet) file_system_monitor.cc:105: /tmp/ray/session_2023-02-11_16-49-09_974082_9002 is over 95% full, available space: 1129238528; capacity: 31845081088. Object creation will fail if spilling is required.


In [11]:
# Get Algorithm from saved checkpoint
from ray.rllib.algorithms.algorithm import Algorithm

# Use the public Checkpoint.as_directory() context manager rather than the
# private `_local_path` attribute. Per the Ray docs it yields the existing
# directory for a directory-backed checkpoint and otherwise materialises a
# temporary one that is removed when the block exits.
with best_checkpoint.as_directory() as checkpoint_dir:
    algo = Algorithm.from_checkpoint(checkpoint_dir)
algo

2023-02-11 16:38:32,949	INFO algorithm.py:501 -- Current log_level is WARN. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[33m(raylet)[0m [2023-02-11 16:38:35,741 E 6815 6860] (raylet) file_system_monitor.cc:105: /tmp/ray/session_2023-02-11_16-34-33_438228_6699 is over 95% full, available space: 1174347776; capacity: 31845081088. Object creation will fail if spilling is required.


[2m[36m(RolloutWorker pid=7501)[0m Loaded XML file successfully


[2m[36m(RolloutWorker pid=7501)[0m   logger.warn(
[2m[36m(RolloutWorker pid=7500)[0m   logger.warn(


[2m[36m(RolloutWorker pid=7500)[0m Loaded XML file successfully


[2m[36m(RolloutWorker pid=7502)[0m   logger.warn(


[2m[36m(RolloutWorker pid=7502)[0m Loaded XML file successfully


  logger.warn(


Loaded XML file successfully


SAC

In [11]:
# Resume the interrupted run. `tuner` is defined outside this cell
# (NOTE(review): presumably a restored Tuner, e.g. from `Tuner.restore(...)` -- confirm).
# The object returned by `fit()` is not assigned to a name here, so it is only
# available as this cell's displayed output.
tuner.fit()

2023-02-11 17:26:26,421	INFO trial_runner.py:688 -- A local experiment checkpoint was found and will be used to restore the previous experiment state.
2023-02-11 17:26:26,422	INFO trial_runner.py:825 -- Using following checkpoint to resume: /home/daniel/DARM/darm_mujoco/darm_training/results/Test_DARMSF_DELTA_TARGET/experiment_state-2023-02-11_17-23-28.json
2023-02-11 17:26:26,440	INFO tune.py:653 -- TrialRunner resumed, ignoring new add_experiment but updating trial resources.


0,1
Current time:,2023-02-11 17:29:20
Running for:,00:02:54.01
Memory:,6.3/7.5 GiB

Trial name,status,loc,iter,total time (s),ts,reward,episode_reward_max,episode_reward_min,episode_len_mean
SAC_darm_DarmSFHand-v0_6a944_00000,RUNNING,192.168.152.36:15703,13,227.817,13026,-179.588,-166.097,-189.684,100


[2m[33m(raylet)[0m [2023-02-11 17:26:26,618 E 14732 14777] (raylet) file_system_monitor.cc:105: /tmp/ray/session_2023-02-11_17-23-24_266872_14581 is over 95% full, available space: 1061683200; capacity: 31845081088. Object creation will fail if spilling is required.
[34m[1mwandb[0m: Currently logged in as: [33mdanieladejumo[0m. Use [1m`wandb login --relogin`[0m to force relogin
[2m[36m(SAC pid=15703)[0m 2023-02-11 17:26:31,413	INFO algorithm.py:501 -- Current log_level is WARN. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.


[2m[33m(raylet)[0m [2023-02-11 17:26:36,627 E 14732 14777] (raylet) file_system_monitor.cc:105: /tmp/ray/session_2023-02-11_17-23-24_266872_14581 is over 95% full, available space: 1061359616; capacity: 31845081088. Object creation will fail if spilling is required.


[2m[36m(RolloutWorker pid=15846)[0m Loaded XML file successfully
[2m[36m(RolloutWorker pid=15844)[0m Loaded XML file successfully


[2m[36m(RolloutWorker pid=15846)[0m   logger.warn(
[2m[36m(RolloutWorker pid=15844)[0m   logger.warn(


[2m[36m(RolloutWorker pid=15845)[0m Loaded XML file successfully


[2m[36m(RolloutWorker pid=15845)[0m   logger.warn(
[2m[36m(SAC pid=15703)[0m   logger.warn(


[2m[36m(SAC pid=15703)[0m Loaded XML file successfully


[2m[36m(SAC pid=15703)[0m 2023-02-11 17:26:40,442	INFO trainable.py:790 -- Restored on 192.168.152.36 from checkpoint: /tmp/checkpoint_tmp_7f50b6e15e2c473dba807bf1d398566d
[2m[36m(SAC pid=15703)[0m 2023-02-11 17:26:40,442	INFO trainable.py:799 -- Current state after restoring: {'_iteration': 11, '_timesteps_total': None, '_time_total': 113.04964661598206, '_episodes_total': 114}
[2m[33m(raylet)[0m [2023-02-11 17:26:46,634 E 14732 14777] (raylet) file_system_monitor.cc:105: /tmp/ray/session_2023-02-11_17-23-24_266872_14581 is over 95% full, available space: 1061335040; capacity: 31845081088. Object creation will fail if spilling is required.
[2m[33m(raylet)[0m [2023-02-11 17:26:56,640 E 14732 14777] (raylet) file_system_monitor.cc:105: /tmp/ray/session_2023-02-11_17-23-24_266872_14581 is over 95% full, available space: 1061343232; capacity: 31845081088. Object creation will fail if spilling is required.
[2m[33m(raylet)[0m [2023-02-11 17:27:06,648 E 14732 14777] (raylet) f

Trial name,agent_timesteps_total,counters,custom_metrics,date,done,episode_len_mean,episode_media,episode_reward_max,episode_reward_mean,episode_reward_min,episodes_this_iter,episodes_total,experiment_id,hostname,info,iterations_since_restore,node_ip,num_agent_steps_sampled,num_agent_steps_trained,num_env_steps_sampled,num_env_steps_sampled_this_iter,num_env_steps_trained,num_env_steps_trained_this_iter,num_faulty_episodes,num_healthy_workers,num_in_flight_async_reqs,num_remote_worker_restarts,num_steps_trained_this_iter,perf,pid,policy_reward_max,policy_reward_mean,policy_reward_min,sampler_perf,sampler_results,time_since_restore,time_this_iter_s,time_total_s,timers,timestamp,timesteps_since_restore,timesteps_total,training_iteration,trial_id,warmup_time
SAC_darm_DarmSFHand-v0_6a944_00000,13026,"{'num_env_steps_sampled': 13026, 'num_env_steps_trained': 258304, 'num_agent_steps_sampled': 13026, 'num_agent_steps_trained': 258304, 'last_target_update_ts': 13026, 'num_target_updates': 1009}",{},2023-02-11_17-28-35,False,100,{},-166.097,-179.588,-189.684,9,132,2674246d3b814ef583cb37ca785123d2,Daniel,"{'learner': {'default_policy': {'learner_stats': {'allreduce_latency': 0.0, 'grad_gnorm': 8.40356159210205, 'actor_loss': -4.885239601135254, 'critic_loss': 0.3069121241569519, 'alpha_loss': -2.5390048027038574, 'alpha_value': 0.7392387, 'log_alpha_value': -0.30213442, 'target_entropy': -5.0, 'policy_t': -0.029988128691911697, 'mean_q': 2.379087448120117, 'max_q': 3.1470589637756348, 'min_q': 1.5433847904205322}, 'td_error': array([7.4213958e-01, 1.5848637e-01, 6.0251343e-01, 9.3348145e-01,  7.2470105e-01, 6.5075898e-01, 7.4386942e-01, 4.2802992e+00,  4.9475217e-01, 2.1274698e-01, 1.5443254e-01, 2.0181298e-01,  4.8542452e-01, 4.9696553e-01, 3.7915547e+00, 8.3584547e-02,  8.3843565e-01, 7.5096285e-01, 6.2452388e-01, 2.4125576e-01,  7.7261329e-01, 2.6608777e-01, 3.3530772e-01, 2.6860654e-01,  1.5399015e-01, 7.0978558e-01, 7.8079522e-01, 1.0731530e-01,  8.8066232e-01, 1.1126903e+00, 3.6070585e-02, 6.7874563e-01,  7.5406009e-01, 4.2981052e-01, 1.1391871e+00, 3.9740098e-01,  1.0762990e+00, 8.4136343e-01, 5.8252001e-01, 4.0861154e-01,  5.6281984e-01, 2.7024639e-01, 6.9000638e-01, 8.6244369e-01,  5.7595563e-01, 7.2603118e-01, 5.9470689e-01, 2.7473211e-01,  5.6826186e-01, 2.4650784e+02, 9.8598832e-01, 7.3479068e-01,  6.1449623e-01, 1.2699622e+00, 7.5296319e-01, 2.8090358e-02,  9.4109213e-01, 8.2771111e-01, 4.2838442e-01, 3.8090675e+00,  4.7546709e-01, 2.4742079e-01, 4.1203547e-01, 7.3801911e-01,  1.0025257e+00, 6.7763782e-01, 6.7099619e-01, 8.6762822e-01,  5.6190348e-01, 8.8954902e-01, 8.1222010e-01, 8.6386180e-01,  7.6953566e-01, 1.0633967e+00, 5.9996891e-01, 5.3750610e-01,  7.0670819e-01, 4.9724150e-01, 3.3370614e-02, 
6.8903613e-01,  9.4764221e-01, 5.0915122e-02, 5.0027347e-01, 9.6055913e-01,  5.5192137e-01, 7.9515433e-01, 7.2671640e-01, 3.9931262e-01,  1.8239129e-01, 9.9649012e-01, 8.4206927e-01, 4.1600978e-01,  4.0527940e-01, 7.6102638e-01, 2.3393106e-01, 4.7766042e-01,  2.2459340e-01, 8.5827851e-01, 1.4306033e-01, 2.4650784e+02,  7.1198571e-01, 3.9922416e+00, 1.2246186e+00, 7.4194229e-01,  2.7496171e-01, 4.5212805e-02, 7.4664807e-01, 1.3847947e-02,  8.7445688e-01, 6.6402781e-01, 1.0255686e+00, 4.5125723e-01,  4.8755097e-01, 2.4650784e+02, 4.4124365e-01, 1.0487792e+00,  5.8346188e-01, 2.6959336e-01, 3.5287654e-01, 5.9907603e-01,  4.8603582e-01, 6.1551094e-01, 6.9831514e-01, 5.1433253e-01,  1.8200487e-01, 9.6122825e-01, 7.8497732e-01, 2.2768998e-01,  9.6964097e-01, 1.4972503e+00, 8.0229974e-01, 1.0484257e+00,  5.5421102e-01, 8.3084774e-01, 4.7661805e-01, 3.9173824e-01,  3.1396019e-01, 4.2802992e+00, 2.7052438e-01, 2.6957560e-01,  7.5368738e-01, 4.4456518e-01, 3.1527257e-01, 8.5121763e-01,  9.0664178e-01, 9.4629610e-01, 5.6297445e-01, 5.9285718e-01,  6.3104606e-01, 5.2718985e-01, 6.5370166e-01, 7.0399725e-01,  4.5417070e-02, 2.4650784e+02, 7.2803473e-01, 1.1245636e+00,  3.7708211e-01, 3.7433398e-01, 4.3422055e-01, 3.2808065e-01,  6.2305951e-01, 1.7103601e-01, 7.9449832e-01, 1.3040452e+00,  7.1471536e-01, 4.5487504e+00, 4.1272748e-01, 6.5745860e-01,  6.6768157e-01, 8.8028562e-01, 7.0535421e-01, 5.2402341e-01,  5.6226981e-01, 5.4202604e-01, 2.7826047e-01, 2.6031137e-01,  6.0549617e-02, 3.6561573e-01, 2.4650784e+02, 8.0606019e-01,  8.4074116e-01, 4.9388194e-01, 7.1800745e-01, 2.9282093e-02,  1.9090211e-01, 3.8544512e-01, 1.4638956e+00, 1.4547678e+00,  1.0922147e+00, 2.6176953e-01, 1.3020796e-01, 5.6222248e-01,  5.6339896e-01, 7.6045167e-01, 7.8438163e-01, 7.5755298e-01,  8.2661462e-01, 3.5743856e-01, 1.3571662e-01, 5.3244066e-01,  8.8719201e-01, 8.2828355e-01, 3.8229942e-01, 6.0678411e-01,  4.7898412e-01, 8.2518208e-01, 5.2971601e-01, 6.7987609e-01,  7.6182199e-01, 1.0264168e+00, 
6.2066817e-01, 9.0486789e-01,  4.7908902e-01, 1.1681950e-01, 7.6850456e-01, 3.1422675e-01,  9.3148047e-01, 9.5507002e-01, 8.3421135e-01, 5.6414163e-01,  4.1598296e-01, 5.0719857e-02, 9.6793044e-01, 1.4145180e+00,  1.4200950e-01, 8.1434751e-01, 7.0387411e-01, 8.6176515e-01,  6.2346458e-01, 1.4636874e-01, 3.2455921e-01, 1.5807381e+00,  5.9650755e-01, 7.9351628e-01, 1.6089365e+00, 7.5115800e-01,  5.8976293e-01, 4.7450304e-02, 6.6682827e-01, 7.1542680e-01,  4.6520185e-01, 3.4638846e-01, 7.5957966e-01, 4.9341345e-01,  4.8143768e-01, 1.2025452e-01, 6.0646594e-01, 1.1619196e+00,  2.7393532e-01, 8.4904301e-01, 2.5427663e-01, 7.0259297e-01,  5.2577734e-01, 2.9342413e-01, 6.1365223e-01, 9.0736806e-01],  dtype=float32), 'mean_td_error': 5.492199897766113, 'model': {}, 'custom_metrics': {}, 'num_agent_steps_trained': 256.0, 'num_grad_updates_lifetime': 668.0, 'diff_num_grad_updates_vs_sampler_policy': 667.0}}, 'num_env_steps_sampled': 13026, 'num_env_steps_trained': 258304, 'num_agent_steps_sampled': 13026, 'num_agent_steps_trained': 258304, 'last_target_update_ts': 13026, 'num_target_updates': 1009}",2,192.168.152.36,13026,258304,13026,1002,258304,85504,0,3,0,0,85504,"{'cpu_util_percent': 54.76744186046512, 'ram_util_percent': 85.32209302325585}",15703,{},{},{},"{'mean_raw_obs_processing_ms': 1.3155451329359085, 'mean_inference_ms': 2.6820931912181267, 'mean_action_processing_ms': 0.25946855188663404, 'mean_env_wait_ms': 3.287473482817159, 'mean_env_render_ms': 0.0}","{'episode_reward_max': -166.09740307927132, 'episode_reward_min': -189.6840973868966, 'episode_reward_mean': -179.5880893824829, 'episode_len_mean': 100.0, 'episode_media': {}, 'episodes_this_iter': 9, 'policy_reward_min': {}, 'policy_reward_max': {}, 'policy_reward_mean': {}, 'custom_metrics': {}, 'hist_stats': {'episode_reward': [-187.3498569726944, -166.09740307927132, -172.9712873697281, -187.82146245241165, -176.65354753285646, -183.53197374939919, -176.7706963941455, -189.6840973868966, 
-175.4124795049429], 'episode_lengths': [100, 100, 100, 100, 100, 100, 100, 100, 100]}, 'sampler_perf': {'mean_raw_obs_processing_ms': 1.3155451329359085, 'mean_inference_ms': 2.6820931912181267, 'mean_action_processing_ms': 0.25946855188663404, 'mean_env_wait_ms': 3.287473482817159, 'mean_env_render_ms': 0.0}, 'num_faulty_episodes': 0}",114.767,62.318,227.817,"{'training_iteration_time_ms': 151.985, 'load_time_ms': 0.246, 'load_throughput': 1042265.409, 'learn_time_ms': 25.824, 'learn_throughput': 9913.287, 'synch_weights_time_ms': 6.049}",1676132915,0,13026,13,6a944_00000,9.03385


[34m[1mwandb[0m: Adding directory to artifact (/home/daniel/DARM/darm_mujoco/darm_training/results/Test_DARMSF_DELTA_TARGET/SAC_darm_DarmSFHand-v0_6a944_00000_0_2023-02-11_17-23-28/checkpoint_000012)... Done. 0.0s
[2m[33m(raylet)[0m [2023-02-11 17:27:36,665 E 14732 14777] (raylet) file_system_monitor.cc:105: /tmp/ray/session_2023-02-11_17-23-24_266872_14581 is over 95% full, available space: 1055997952; capacity: 31845081088. Object creation will fail if spilling is required.
[2m[33m(raylet)[0m [2023-02-11 17:27:46,672 E 14732 14777] (raylet) file_system_monitor.cc:105: /tmp/ray/session_2023-02-11_17-23-24_266872_14581 is over 95% full, available space: 1055973376; capacity: 31845081088. Object creation will fail if spilling is required.
[2m[33m(raylet)[0m [2023-02-11 17:27:56,678 E 14732 14777] (raylet) file_system_monitor.cc:105: /tmp/ray/session_2023-02-11_17-23-24_266872_14581 is over 95% full, available space: 1055977472; capacity: 31845081088. Object creation will fai

<ray.tune.result_grid.ResultGrid at 0x7fedc40a1d90>