# Setting up a Ray cluster with SmartSim

## 1. Start the cluster
We set up a SmartSim experiment, which will handle the launch of the Ray cluster.

First we set the SmartSim log level and import the relevant modules.

In [1]:
# Set SmartSim's log level to "developer" for this kernel; the cell outputs below include DEBUG messages.
%env SMARTSIM_LOG_LEVEL developer

env: SMARTSIM_LOG_LEVEL=developer


In [2]:
import numpy as np
import time
import argparse
import os

from ray.tune.progress_reporter import JupyterNotebookReporter
import ray
from ray import tune
import ray.util

from smartsim import Experiment
from smartsim.ray import RayCluster

from smartsim.launcher import slurm

# Number of Ray worker nodes to start in addition to the head node.
NUM_WORKERS = 3
launcher = 'slurm'

# Request one node (and one task) for the head plus one per worker.
num_nodes = 1 + NUM_WORKERS

# Obtain a Slurm allocation for the whole cluster. Further allocation options
# can be added to `options`, e.g. {"partition": "spider", "C": "V100"} to
# target a specific partition and node constraint.
alloc = slurm.get_allocation(
    nodes=num_nodes,
    time="12:00:00",
    options={"ntasks": str(num_nodes)},
)

13:59:56 nid00000 smartsim.launcher.slurm.slurm[48868] DEBUG Allocation settings: -N 4 -J SmartSim -t 12:00:00 --ntasks=4
13:59:56 nid00000 smartsim.launcher.util.shell[48868] DEBUG Executing Popen cmd: /opt/slurm/20.11.5/bin/salloc --no-shell -N 4 -J SmartSim -t 12:00:00 --ntasks=4
14:00:26 nid00000 smartsim.launcher.slurm.slurm[48868] INFO Allocation successful with Job ID: 1461743


In [3]:
# The experiment drives the launch; the RayCluster describes the head and workers.
exp = Experiment("ray-cluster", launcher=launcher)
cluster = RayCluster(
    name="ray-cluster",
    run_args={},
    path='',
    launcher=launcher,
    workers=NUM_WORKERS,
    alloc=alloc,
    batch=False,
)

# When the cluster is launched as batch jobs, prepend the shell lines that
# activate the conda environment to the head (and, if any, worker) batch settings.
if cluster.batch:
    env_setup = ("source ~/.bashrc", "conda activate smartsim")
    cluster.head_model.batch_settings.add_preamble(list(env_setup))
    if NUM_WORKERS:
        cluster.worker_model.batch_settings.add_preamble(list(env_setup))

# Generate the experiment files for the cluster, overwriting any previous run.
exp.generate(cluster, overwrite=True)

14:00:32 nid00000 smartsim.generation.generator[48868] INFO Working in previously created experiment


In [4]:
# Launch the Ray cluster through the experiment. block=False presumably returns
# without waiting for the cluster to finish and summary=False presumably skips the
# launch summary -- confirm against the SmartSim Experiment.start documentation.
exp.start(cluster, block=False, summary=False)

14:00:33 nid00000 smartsim.launcher.taskManager[48868] DEBUG Starting Task Manager
14:00:33 nid00000 smartsim.launcher.util.shell[48868] DEBUG Executing command: srun --output /lus/cls01029/arigazzi/smartsim-dev/SmartSim/tutorials/05_starting_ray/ray-cluster/head/head.out --error /lus/cls01029/arigazzi/smartsim-dev/SmartSim/tutorials/05_starting_ray/ray-cluster/head/head.err --job-name head-CCY76DP17ELD --jobid 1461743 --unbuffered --nodes=1 --time=01:00:00 --ntasks=1 --ntasks-per-node=1 python /lus/cls01029/arigazzi/smartsim-dev/SmartSim/smartsim/ray/raystarter.py --port=6780 --redis-password=80f909ec-a442-4493-9712-71d10bec7439
14:00:33 nid00000 smartsim.launcher.taskManager[48868] DEBUG Starting Task 49029
14:00:35 nid00000 smartsim.launcher.util.shell[48868] DEBUG Executing Popen cmd: /opt/slurm/20.11.5/bin/sacct --noheader -p --format=jobname,jobid
14:00:36 nid00000 smartsim.control.controller[48868] DEBUG Launching head
14:00:36 nid00000 smartsim.launcher.util.shell[48868] DEBUG 

## 2. Start the Ray driver script

In [5]:
# Connect this notebook to the cluster head as a Ray client. Port 10001 is assumed
# to be where the head's Ray client server listens -- confirm for your deployment.
ray.util.connect(cluster.head_model.address +":10001")

In [6]:
# Report how many nodes joined the cluster and how many CPUs Ray can schedule on.
summary_template = (
    "This cluster consists of\n"
    "    {} nodes in total\n"
    "    {} CPU resources in total\n"
)
node_count = len(ray.nodes())
cpu_total = ray.cluster_resources()['CPU']
print(summary_template.format(node_count, cpu_total))

This cluster consists of
    4 nodes in total
    152.0 CPU resources in total



In [7]:
# Small smoke-test sweep: PPO on CartPole with a grid search over two learning
# rates (the status output below reports two trials).
learning_rates = np.linspace(0.001, 0.01, 2).tolist()
ppo_config = {
    "framework": "torch",
    "env": "CartPole-v0",
    "num_gpus": 0,
    "lr": tune.grid_search(learning_rates),
    "log_level": "ERROR",
}

# Each trial stops once its maximum episode reward reaches 200.
tune.run(
    "PPO",
    stop={"episode_reward_max": 200},
    config=ppo_config,
    local_dir="/lus/scratch/arigazzi/ray_local/",
    verbose=1,
    fail_fast=True,
    log_to_file=True,
)

[2m[36m(pid=25010)[0m Instructions for updating:
[2m[36m(pid=25010)[0m non-resource variables are not supported in the long term


[2m[36m(pid=25010)[0m == Status ==
[2m[36m(pid=25010)[0m Memory usage on this node: 5.8/187.6 GiB
[2m[36m(pid=25010)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=25010)[0m Resources requested: 3.0/152 CPUs, 0/0 GPUs, 0.0/512.14 GiB heap, 0.0/223.48 GiB objects
[2m[36m(pid=25010)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=25010)[0m Number of trials: 2/2 (1 PENDING, 1 RUNNING)
[2m[36m(pid=25010)[0m 
[2m[36m(pid=25010)[0m 


[2m[36m(pid=25038)[0m Instructions for updating:
[2m[36m(pid=25038)[0m non-resource variables are not supported in the long term
[2m[36m(pid=25038)[0m 2021-07-20 11:37:15,728	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=25036)[0m Instructions for updating:
[2m[36m(pid=25036)[0m non-resource variables are not supported in the long term
[2m[36m(pid=25037)[0m Instructions for updating:
[2m[36m(pid=25037)[0m non-resource variables are not supported in the long term
[2m[36m(pid=95527)[0m Instructions for updating:
[2m[36m(pid=95527)[0m non-resource variables are not supported in the long term


[2m[36m(pid=25010)[0m == Status ==
[2m[36m(pid=25010)[0m Memory usage on this node: 6.3/187.6 GiB
[2m[36m(pid=25010)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=25010)[0m Resources requested: 6.0/152 CPUs, 0/0 GPUs, 0.0/512.14 GiB heap, 0.0/223.48 GiB objects
[2m[36m(pid=25010)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=25010)[0m Number of trials: 2/2 (2 RUNNING)
[2m[36m(pid=25010)[0m 
[2m[36m(pid=25010)[0m 


[2m[36m(pid=95527)[0m 2021-07-20 11:37:27,106	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=95526)[0m Instructions for updating:
[2m[36m(pid=95526)[0m non-resource variables are not supported in the long term
[2m[36m(pid=95528)[0m Instructions for updating:
[2m[36m(pid=95528)[0m non-resource variables are not supported in the long term


[2m[36m(pid=25010)[0m == Status ==
[2m[36m(pid=25010)[0m Memory usage on this node: 6.3/187.6 GiB
[2m[36m(pid=25010)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=25010)[0m Resources requested: 6.0/152 CPUs, 0/0 GPUs, 0.0/512.14 GiB heap, 0.0/223.48 GiB objects
[2m[36m(pid=25010)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=25010)[0m Number of trials: 2/2 (2 RUNNING)
[2m[36m(pid=25010)[0m 
[2m[36m(pid=25010)[0m 
[2m[36m(pid=25010)[0m == Status ==
[2m[36m(pid=25010)[0m Memory usage on this node: 6.3/187.6 GiB
[2m[36m(pid=25010)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=25010)[0m Resources requested: 3.0/152 CPUs, 0/0 GPUs, 0.0/512.14 GiB heap, 0.0/223.48 GiB objects
[2m[36m(pid=25010)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=25010)[0m Number of trials: 2/2 (1 RUNNING, 1 TERMINATED)
[2m[36m(pid=25010)[0m 
[2m[36m(pid=25010)[0m 
[2m[36m(pid=25010)[0m == Status ==
[2m[36m(pid=25010)[

[2m[36m(pid=25010)[0m 2021-07-20 11:37:49,901	INFO tune.py:549 -- Total run time: 114.79 seconds (37.26 seconds for the tuning loop).


Instructions for updating:
non-resource variables are not supported in the long term


<ray.tune.analysis.experiment_analysis.ExperimentAnalysis at 0x7fffd8dee130>

## 3. Stop cluster and release allocation

In [5]:
# Tear down in the order given by the section title: stop the Ray cluster first,
# while its allocation still exists, and only then hand the nodes back to Slurm.
exp.stop(cluster)

# `alloc` is only set when this notebook obtained the allocation itself.
if alloc:
    slurm.release_allocation(alloc)

In [8]:

# Larger sweep: PPO on CartPole with a grid search over 200 learning rates, so
# that the trials spread across the CPUs of the whole cluster.
# NOTE: this cell needs the Ray cluster to be running -- execute it before the
# cluster is stopped and the allocation released in section 3.
sweep_learning_rates = np.linspace(0.001, 0.01, 200).tolist()

# Each trial stops once its maximum episode reward reaches 200.
tune.run(
    "PPO",
    stop={"episode_reward_max": 200},
    config={
        "framework": "torch",
        "env": "CartPole-v0",
        "lr": tune.grid_search(sweep_learning_rates),
        "log_level": "ERROR",
    },
    local_dir="/lus/scratch/arigazzi/ray_local/",
    verbose=1,
)

[2m[36m(pid=25010)[0m == Status ==
[2m[36m(pid=25010)[0m Memory usage on this node: 6.0/187.6 GiB
[2m[36m(pid=25010)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=25010)[0m Resources requested: 3.0/152 CPUs, 0/0 GPUs, 0.0/512.14 GiB heap, 0.0/223.48 GiB objects
[2m[36m(pid=25010)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=25010)[0m Number of trials: 200/200 (199 PENDING, 1 RUNNING)
[2m[36m(pid=25010)[0m 
[2m[36m(pid=25010)[0m 


[2m[36m(pid=25031)[0m Instructions for updating:
[2m[36m(pid=25031)[0m non-resource variables are not supported in the long term
[2m[36m(pid=25030)[0m Instructions for updating:
[2m[36m(pid=25030)[0m non-resource variables are not supported in the long term
[2m[36m(pid=25032)[0m Instructions for updating:
[2m[36m(pid=25032)[0m non-resource variables are not supported in the long term
[2m[36m(pid=95507)[0m Instructions for updating:
[2m[36m(pid=95507)[0m non-resource variables are not supported in the long term
[2m[36m(pid=95515)[0m Instructions for updating:
[2m[36m(pid=95515)[0m non-resource variables are not supported in the long term
[2m[36m(pid=25024)[0m Instructions for updating:
[2m[36m(pid=25024)[0m non-resource variables are not supported in the long term
[2m[36m(pid=95514)[0m Instructions for updating:
[2m[36m(pid=95514)[0m non-resource variables are not supported in the long term
[2m[36m(pid=25025)[0m Instructions for updating:
[2

[2m[36m(pid=25010)[0m == Status ==
[2m[36m(pid=25010)[0m Memory usage on this node: 11.1/187.6 GiB
[2m[36m(pid=25010)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=25010)[0m Resources requested: 150.0/152 CPUs, 0/0 GPUs, 0.0/512.14 GiB heap, 0.0/223.48 GiB objects
[2m[36m(pid=25010)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=25010)[0m Number of trials: 200/200 (150 PENDING, 50 RUNNING)
[2m[36m(pid=25010)[0m 
[2m[36m(pid=25010)[0m 


[2m[36m(pid=96075)[0m 2021-07-20 11:40:30,620	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=96090)[0m Instructions for updating:
[2m[36m(pid=96090)[0m non-resource variables are not supported in the long term
[2m[36m(pid=96097)[0m Instructions for updating:
[2m[36m(pid=96097)[0m non-resource variables are not supported in the long term
[2m[36m(pid=96102)[0m Instructions for updating:
[2m[36m(pid=96102)[0m non-resource variables are not supported in the long term
[2m[36m(pid=96101)[0m Instructions for updating:
[2m[36m(pid=96101)[0m non-resource variables are not supported in the long term
[2m[36m(pid=96168)[0m Instructions for updating:
[2m[36m(pid=96168)[0m non-resource variables are not supported in the long term
[2m[36m(pid=96095)[0m Instructions for updating:
[2m[36m(pid=96095)[0m non-resource variables are not supported in the long term
[2m

[2m[36m(pid=25010)[0m == Status ==
[2m[36m(pid=25010)[0m Memory usage on this node: 14.0/187.6 GiB
[2m[36m(pid=25010)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=25010)[0m Resources requested: 150.0/152 CPUs, 0/0 GPUs, 0.0/512.14 GiB heap, 0.0/223.48 GiB objects
[2m[36m(pid=25010)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=25010)[0m Number of trials: 200/200 (150 PENDING, 50 RUNNING)
[2m[36m(pid=25010)[0m 
[2m[36m(pid=25010)[0m 
[2m[36m(pid=25010)[0m == Status ==
[2m[36m(pid=25010)[0m Memory usage on this node: 14.0/187.6 GiB
[2m[36m(pid=25010)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=25010)[0m Resources requested: 150.0/152 CPUs, 0/0 GPUs, 0.0/512.14 GiB heap, 0.0/223.48 GiB objects
[2m[36m(pid=25010)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=25010)[0m Number of trials: 200/200 (150 PENDING, 50 RUNNING)
[2m[36m(pid=25010)[0m 
[2m[36m(pid=25010)[0m 


[2m[36m(pid=96600)[0m Instructions for updating:
[2m[36m(pid=96600)[0m non-resource variables are not supported in the long term


[2m[36m(pid=25010)[0m == Status ==
[2m[36m(pid=25010)[0m Memory usage on this node: 14.6/187.6 GiB
[2m[36m(pid=25010)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=25010)[0m Resources requested: 150.0/152 CPUs, 0/0 GPUs, 0.0/512.14 GiB heap, 0.0/223.48 GiB objects
[2m[36m(pid=25010)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=25010)[0m Number of trials: 200/200 (143 PENDING, 50 RUNNING, 7 TERMINATED)
[2m[36m(pid=25010)[0m 
[2m[36m(pid=25010)[0m 


[2m[36m(pid=96600)[0m 2021-07-20 11:40:56,504	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=98327)[0m Instructions for updating:
[2m[36m(pid=98327)[0m non-resource variables are not supported in the long term
[2m[36m(pid=98329)[0m Instructions for updating:
[2m[36m(pid=98329)[0m non-resource variables are not supported in the long term
[2m[36m(pid=98325)[0m Instructions for updating:
[2m[36m(pid=98325)[0m non-resource variables are not supported in the long term
[2m[36m(pid=98328)[0m Instructions for updating:
[2m[36m(pid=98328)[0m non-resource variables are not supported in the long term
[2m[36m(pid=98327)[0m 2021-07-20 11:40:58,179	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=98329)[0m 2021-07-20 11:40:58,179	INFO trainer.py:694 -- Current log_level 

[2m[36m(pid=25010)[0m == Status ==
[2m[36m(pid=25010)[0m Memory usage on this node: 13.7/187.6 GiB
[2m[36m(pid=25010)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=25010)[0m Resources requested: 150.0/152 CPUs, 0/0 GPUs, 0.0/512.14 GiB heap, 0.0/223.48 GiB objects
[2m[36m(pid=25010)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=25010)[0m Number of trials: 200/200 (141 PENDING, 50 RUNNING, 9 TERMINATED)
[2m[36m(pid=25010)[0m 
[2m[36m(pid=25010)[0m 


[2m[36m(pid=28520)[0m Instructions for updating:
[2m[36m(pid=28520)[0m non-resource variables are not supported in the long term
[2m[36m(pid=28477)[0m Instructions for updating:
[2m[36m(pid=28477)[0m non-resource variables are not supported in the long term
[2m[36m(pid=28468)[0m Instructions for updating:
[2m[36m(pid=28468)[0m non-resource variables are not supported in the long term
[2m[36m(pid=28469)[0m Instructions for updating:
[2m[36m(pid=28469)[0m non-resource variables are not supported in the long term
[2m[36m(pid=98371)[0m Instructions for updating:
[2m[36m(pid=98371)[0m non-resource variables are not supported in the long term
[2m[36m(pid=104142)[0m Instructions for updating:
[2m[36m(pid=104142)[0m non-resource variables are not supported in the long term
[2m[36m(pid=98371)[0m 2021-07-20 11:41:03,835	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2

[2m[36m(pid=25010)[0m == Status ==
[2m[36m(pid=25010)[0m Memory usage on this node: 15.0/187.6 GiB
[2m[36m(pid=25010)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=25010)[0m Resources requested: 150.0/152 CPUs, 0/0 GPUs, 0.0/512.14 GiB heap, 0.0/223.48 GiB objects
[2m[36m(pid=25010)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=25010)[0m Number of trials: 200/200 (126 PENDING, 50 RUNNING, 24 TERMINATED)
[2m[36m(pid=25010)[0m 
[2m[36m(pid=25010)[0m 


[2m[36m(pid=101721)[0m 2021-07-20 11:41:06,543	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=99516)[0m Instructions for updating:
[2m[36m(pid=99516)[0m non-resource variables are not supported in the long term
[2m[36m(pid=99521)[0m Instructions for updating:
[2m[36m(pid=99521)[0m non-resource variables are not supported in the long term
[2m[36m(pid=99520)[0m Instructions for updating:
[2m[36m(pid=99520)[0m non-resource variables are not supported in the long term
[2m[36m(pid=99522)[0m Instructions for updating:
[2m[36m(pid=99522)[0m non-resource variables are not supported in the long term
[2m[36m(pid=104590)[0m Instructions for updating:
[2m[36m(pid=104590)[0m non-resource variables are not supported in the long term
[2m[36m(pid=99556)[0m Instructions for updating:
[2m[36m(pid=99556)[0m non-resource variables are not supported in the long term
[

[2m[36m(pid=25010)[0m == Status ==
[2m[36m(pid=25010)[0m Memory usage on this node: 12.4/187.6 GiB
[2m[36m(pid=25010)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=25010)[0m Resources requested: 147.0/152 CPUs, 0/0 GPUs, 0.0/512.14 GiB heap, 0.0/223.48 GiB objects
[2m[36m(pid=25010)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=25010)[0m Number of trials: 200/200 (118 PENDING, 49 RUNNING, 33 TERMINATED)
[2m[36m(pid=25010)[0m 
[2m[36m(pid=25010)[0m 


[2m[36m(pid=29763)[0m 2021-07-20 11:41:11,623	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=29748)[0m Instructions for updating:
[2m[36m(pid=29748)[0m non-resource variables are not supported in the long term
[2m[36m(pid=29753)[0m Instructions for updating:
[2m[36m(pid=29753)[0m non-resource variables are not supported in the long term
[2m[36m(pid=29751)[0m Instructions for updating:
[2m[36m(pid=29751)[0m non-resource variables are not supported in the long term
[2m[36m(pid=29754)[0m Instructions for updating:
[2m[36m(pid=29754)[0m non-resource variables are not supported in the long term
[2m[36m(pid=29746)[0m Instructions for updating:
[2m[36m(pid=29746)[0m non-resource variables are not supported in the long term
[2m[36m(pid=29742)[0m Instructions for updating:
[2m[36m(pid=29742)[0m non-resource variables are not supported in the long term
[2m

[2m[36m(pid=25010)[0m == Status ==
[2m[36m(pid=25010)[0m Memory usage on this node: 14.1/187.6 GiB
[2m[36m(pid=25010)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=25010)[0m Resources requested: 147.0/152 CPUs, 0/0 GPUs, 0.0/512.14 GiB heap, 0.0/223.48 GiB objects
[2m[36m(pid=25010)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=25010)[0m Number of trials: 200/200 (103 PENDING, 49 RUNNING, 48 TERMINATED)
[2m[36m(pid=25010)[0m 
[2m[36m(pid=25010)[0m 


[2m[36m(pid=105514)[0m Instructions for updating:
[2m[36m(pid=105514)[0m non-resource variables are not supported in the long term
[2m[36m(pid=105498)[0m 2021-07-20 11:41:16,788	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=105507)[0m 2021-07-20 11:41:16,851	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=105593)[0m 2021-07-20 11:41:17,009	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=100495)[0m Instructions for updating:
[2m[36m(pid=100495)[0m non-resource variables are not supported in the long term
[2m[36m(pid=102889)[0m Instructions for updating:
[2m[36m(pid=102889)[0m non-resource variables are not supported in the long term
[2m[36m(pid=102887)[0m Instr

[2m[36m(pid=25010)[0m == Status ==
[2m[36m(pid=25010)[0m Memory usage on this node: 13.9/187.6 GiB
[2m[36m(pid=25010)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=25010)[0m Resources requested: 150.0/152 CPUs, 0/0 GPUs, 0.0/512.14 GiB heap, 0.0/223.48 GiB objects
[2m[36m(pid=25010)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=25010)[0m Number of trials: 200/200 (102 PENDING, 50 RUNNING, 48 TERMINATED)
[2m[36m(pid=25010)[0m 
[2m[36m(pid=25010)[0m 


[2m[36m(pid=31639)[0m Instructions for updating:
[2m[36m(pid=31639)[0m non-resource variables are not supported in the long term
[2m[36m(pid=31637)[0m Instructions for updating:
[2m[36m(pid=31637)[0m non-resource variables are not supported in the long term
[2m[36m(pid=106690)[0m Instructions for updating:
[2m[36m(pid=106690)[0m non-resource variables are not supported in the long term
[2m[36m(pid=106689)[0m Instructions for updating:
[2m[36m(pid=106689)[0m non-resource variables are not supported in the long term


[2m[36m(pid=25010)[0m == Status ==
[2m[36m(pid=25010)[0m Memory usage on this node: 14.1/187.6 GiB
[2m[36m(pid=25010)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=25010)[0m Resources requested: 150.0/152 CPUs, 0/0 GPUs, 0.0/512.14 GiB heap, 0.0/223.48 GiB objects
[2m[36m(pid=25010)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=25010)[0m Number of trials: 200/200 (100 PENDING, 50 RUNNING, 50 TERMINATED)
[2m[36m(pid=25010)[0m 
[2m[36m(pid=25010)[0m 


[2m[36m(pid=106689)[0m 2021-07-20 11:41:27,417	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=106690)[0m 2021-07-20 11:41:27,446	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=106719)[0m Instructions for updating:
[2m[36m(pid=106719)[0m non-resource variables are not supported in the long term
[2m[36m(pid=106737)[0m Instructions for updating:
[2m[36m(pid=106737)[0m non-resource variables are not supported in the long term
[2m[36m(pid=106739)[0m Instructions for updating:
[2m[36m(pid=106739)[0m non-resource variables are not supported in the long term
[2m[36m(pid=106740)[0m Instructions for updating:
[2m[36m(pid=106740)[0m non-resource variables are not supported in the long term


[2m[36m(pid=25010)[0m == Status ==
[2m[36m(pid=25010)[0m Memory usage on this node: 14.1/187.6 GiB
[2m[36m(pid=25010)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=25010)[0m Resources requested: 150.0/152 CPUs, 0/0 GPUs, 0.0/512.14 GiB heap, 0.0/223.48 GiB objects
[2m[36m(pid=25010)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=25010)[0m Number of trials: 200/200 (94 PENDING, 50 RUNNING, 56 TERMINATED)
[2m[36m(pid=25010)[0m 
[2m[36m(pid=25010)[0m 


[2m[36m(pid=100486)[0m Instructions for updating:
[2m[36m(pid=100486)[0m non-resource variables are not supported in the long term
[2m[36m(pid=107349)[0m Instructions for updating:
[2m[36m(pid=107349)[0m non-resource variables are not supported in the long term
[2m[36m(pid=100486)[0m 2021-07-20 11:41:33,688	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=107444)[0m Instructions for updating:
[2m[36m(pid=107444)[0m non-resource variables are not supported in the long term
[2m[36m(pid=107349)[0m 2021-07-20 11:41:34,515	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=101883)[0m Instructions for updating:
[2m[36m(pid=101883)[0m non-resource variables are not supported in the long term
[2m[36m(pid=101881)[0m Instructions for updating:
[2m[36m(pid=101881)[0m n

[2m[36m(pid=25010)[0m == Status ==
[2m[36m(pid=25010)[0m Memory usage on this node: 12.7/187.6 GiB
[2m[36m(pid=25010)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=25010)[0m Resources requested: 147.0/152 CPUs, 0/0 GPUs, 0.0/512.14 GiB heap, 0.0/223.48 GiB objects
[2m[36m(pid=25010)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=25010)[0m Number of trials: 200/200 (86 PENDING, 49 RUNNING, 65 TERMINATED)
[2m[36m(pid=25010)[0m 
[2m[36m(pid=25010)[0m 


[2m[36m(pid=32680)[0m 2021-07-20 11:41:38,365	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=102008)[0m Instructions for updating:
[2m[36m(pid=102008)[0m non-resource variables are not supported in the long term
[2m[36m(pid=101944)[0m Instructions for updating:
[2m[36m(pid=101944)[0m non-resource variables are not supported in the long term
[2m[36m(pid=101953)[0m Instructions for updating:
[2m[36m(pid=101953)[0m non-resource variables are not supported in the long term
[2m[36m(pid=101953)[0m 2021-07-20 11:41:39,544	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=32681)[0m Instructions for updating:
[2m[36m(pid=32681)[0m non-resource variables are not supported in the long term
[2m[36m(pid=32671)[0m Instructions for updating:
[2m[36m(pid=32671)[0m non-re

[2m[36m(pid=25010)[0m == Status ==
[2m[36m(pid=25010)[0m Memory usage on this node: 15.5/187.6 GiB
[2m[36m(pid=25010)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=25010)[0m Resources requested: 147.0/152 CPUs, 0/0 GPUs, 0.0/512.14 GiB heap, 0.0/223.48 GiB objects
[2m[36m(pid=25010)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=25010)[0m Number of trials: 200/200 (73 PENDING, 49 RUNNING, 78 TERMINATED)
[2m[36m(pid=25010)[0m 
[2m[36m(pid=25010)[0m 


[2m[36m(pid=104707)[0m 2021-07-20 11:41:44,257	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=103240)[0m Instructions for updating:
[2m[36m(pid=103240)[0m non-resource variables are not supported in the long term
[2m[36m(pid=103178)[0m 2021-07-20 11:41:44,391	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=108256)[0m Instructions for updating:
[2m[36m(pid=108256)[0m non-resource variables are not supported in the long term
[2m[36m(pid=103280)[0m 2021-07-20 11:41:44,945	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=104709)[0m Instructions for updating:
[2m[36m(pid=104709)[0m non-resource variables are not supported in the long term
[2m[36m(pid=108254)[0m Instr

[2m[36m(pid=25010)[0m == Status ==
[2m[36m(pid=25010)[0m Memory usage on this node: 14.5/187.6 GiB
[2m[36m(pid=25010)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=25010)[0m Resources requested: 147.0/152 CPUs, 0/0 GPUs, 0.0/512.14 GiB heap, 0.0/223.48 GiB objects
[2m[36m(pid=25010)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=25010)[0m Number of trials: 200/200 (67 PENDING, 49 RUNNING, 84 TERMINATED)
[2m[36m(pid=25010)[0m 
[2m[36m(pid=25010)[0m 


[2m[36m(pid=33646)[0m Instructions for updating:
[2m[36m(pid=33646)[0m non-resource variables are not supported in the long term
[2m[36m(pid=33653)[0m Instructions for updating:
[2m[36m(pid=33653)[0m non-resource variables are not supported in the long term
[2m[36m(pid=33655)[0m Instructions for updating:
[2m[36m(pid=33655)[0m non-resource variables are not supported in the long term
[2m[36m(pid=33641)[0m Instructions for updating:
[2m[36m(pid=33641)[0m non-resource variables are not supported in the long term
[2m[36m(pid=33643)[0m Instructions for updating:
[2m[36m(pid=33643)[0m non-resource variables are not supported in the long term
[2m[36m(pid=33654)[0m 2021-07-20 11:41:50,619	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=34348)[0m Instructions for updating:
[2m[36m(pid=34348)[0m non-resource variables are not supported in the long term
[2m

[2m[36m(pid=25010)[0m == Status ==
[2m[36m(pid=25010)[0m Memory usage on this node: 14.2/187.6 GiB
[2m[36m(pid=25010)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=25010)[0m Resources requested: 147.0/152 CPUs, 0/0 GPUs, 0.0/512.14 GiB heap, 0.0/223.48 GiB objects
[2m[36m(pid=25010)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=25010)[0m Number of trials: 200/200 (56 PENDING, 49 RUNNING, 95 TERMINATED)
[2m[36m(pid=25010)[0m 
[2m[36m(pid=25010)[0m 


[2m[36m(pid=105965)[0m 2021-07-20 11:41:55,088	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=109505)[0m 2021-07-20 11:41:55,228	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=109519)[0m 2021-07-20 11:41:55,347	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=109564)[0m Instructions for updating:
[2m[36m(pid=109564)[0m non-resource variables are not supported in the long term
[2m[36m(pid=105957)[0m Instructions for updating:
[2m[36m(pid=105957)[0m non-resource variables are not supported in the long term
[2m[36m(pid=105953)[0m Instructions for updating:
[2m[36m(pid=105953)[0m non-resource variables are not supported in the long term
[2m[36m(pid=109521)[0m 2021-

[2m[36m(pid=25010)[0m == Status ==
[2m[36m(pid=25010)[0m Memory usage on this node: 13.6/187.6 GiB
[2m[36m(pid=25010)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=25010)[0m Resources requested: 150.0/152 CPUs, 0/0 GPUs, 0.0/512.14 GiB heap, 0.0/223.48 GiB objects
[2m[36m(pid=25010)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=25010)[0m Number of trials: 200/200 (50 PENDING, 50 RUNNING, 100 TERMINATED)
[2m[36m(pid=25010)[0m 
[2m[36m(pid=25010)[0m 


[2m[36m(pid=104275)[0m 2021-07-20 11:42:01,136	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=35363)[0m Instructions for updating:
[2m[36m(pid=35363)[0m non-resource variables are not supported in the long term
[2m[36m(pid=35373)[0m Instructions for updating:
[2m[36m(pid=35373)[0m non-resource variables are not supported in the long term
[2m[36m(pid=35476)[0m Instructions for updating:
[2m[36m(pid=35476)[0m non-resource variables are not supported in the long term
[2m[36m(pid=35347)[0m Instructions for updating:
[2m[36m(pid=35347)[0m non-resource variables are not supported in the long term
[2m[36m(pid=35369)[0m Instructions for updating:
[2m[36m(pid=35369)[0m non-resource variables are not supported in the long term
[2m[36m(pid=35398)[0m Instructions for updating:
[2m[36m(pid=35398)[0m non-resource variables are not supported in the long term
[2m

[2m[36m(pid=25010)[0m == Status ==
[2m[36m(pid=25010)[0m Memory usage on this node: 14.3/187.6 GiB
[2m[36m(pid=25010)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=25010)[0m Resources requested: 150.0/152 CPUs, 0/0 GPUs, 0.0/512.14 GiB heap, 0.0/223.48 GiB objects
[2m[36m(pid=25010)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=25010)[0m Number of trials: 200/200 (47 PENDING, 50 RUNNING, 103 TERMINATED)
[2m[36m(pid=25010)[0m 
[2m[36m(pid=25010)[0m 


[2m[36m(pid=105285)[0m Instructions for updating:
[2m[36m(pid=105285)[0m non-resource variables are not supported in the long term
[2m[36m(pid=105284)[0m Instructions for updating:
[2m[36m(pid=105284)[0m non-resource variables are not supported in the long term
[2m[36m(pid=111020)[0m Instructions for updating:
[2m[36m(pid=111020)[0m non-resource variables are not supported in the long term
[2m[36m(pid=111899)[0m Instructions for updating:
[2m[36m(pid=111899)[0m non-resource variables are not supported in the long term
[2m[36m(pid=105283)[0m Instructions for updating:
[2m[36m(pid=105283)[0m non-resource variables are not supported in the long term
[2m[36m(pid=107572)[0m Instructions for updating:
[2m[36m(pid=107572)[0m non-resource variables are not supported in the long term
[2m[36m(pid=107570)[0m Instructions for updating:
[2m[36m(pid=107570)[0m non-resource variables are not supported in the long term
[2m[36m(pid=107571)[0m Instructions fo

[2m[36m(pid=25010)[0m == Status ==
[2m[36m(pid=25010)[0m Memory usage on this node: 14.2/187.6 GiB
[2m[36m(pid=25010)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=25010)[0m Resources requested: 150.0/152 CPUs, 0/0 GPUs, 0.0/512.14 GiB heap, 0.0/223.48 GiB objects
[2m[36m(pid=25010)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=25010)[0m Number of trials: 200/200 (41 PENDING, 50 RUNNING, 109 TERMINATED)
[2m[36m(pid=25010)[0m 
[2m[36m(pid=25010)[0m 


[2m[36m(pid=112615)[0m 2021-07-20 11:42:12,016	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=105277)[0m 2021-07-20 11:42:12,401	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=105942)[0m Instructions for updating:
[2m[36m(pid=105942)[0m non-resource variables are not supported in the long term
[2m[36m(pid=105944)[0m Instructions for updating:
[2m[36m(pid=105944)[0m non-resource variables are not supported in the long term
[2m[36m(pid=105967)[0m Instructions for updating:
[2m[36m(pid=105967)[0m non-resource variables are not supported in the long term
[2m[36m(pid=112665)[0m Instructions for updating:
[2m[36m(pid=112665)[0m non-resource variables are not supported in the long term
[2m[36m(pid=112687)[0m Instructions for updating:
[2m[36m(pid=112687)[0m n

[2m[36m(pid=25010)[0m == Status ==
[2m[36m(pid=25010)[0m Memory usage on this node: 11.8/187.6 GiB
[2m[36m(pid=25010)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=25010)[0m Resources requested: 147.0/152 CPUs, 0/0 GPUs, 0.0/512.14 GiB heap, 0.0/223.48 GiB objects
[2m[36m(pid=25010)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=25010)[0m Number of trials: 200/200 (33 PENDING, 49 RUNNING, 118 TERMINATED)
[2m[36m(pid=25010)[0m 
[2m[36m(pid=25010)[0m 


[2m[36m(pid=36813)[0m 2021-07-20 11:42:16,609	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=106059)[0m Instructions for updating:
[2m[36m(pid=106059)[0m non-resource variables are not supported in the long term
[2m[36m(pid=36815)[0m 2021-07-20 11:42:16,772	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=36804)[0m 2021-07-20 11:42:16,736	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=105997)[0m Instructions for updating:
[2m[36m(pid=105997)[0m non-resource variables are not supported in the long term
[2m[36m(pid=106045)[0m Instructions for updating:
[2m[36m(pid=106045)[0m non-resource variables are not supported in the long term
[2m[36m(pid=105999)[0m Instruct

[2m[36m(pid=25010)[0m == Status ==
[2m[36m(pid=25010)[0m Memory usage on this node: 14.1/187.6 GiB
[2m[36m(pid=25010)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=25010)[0m Resources requested: 150.0/152 CPUs, 0/0 GPUs, 0.0/512.14 GiB heap, 0.0/223.48 GiB objects
[2m[36m(pid=25010)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=25010)[0m Number of trials: 200/200 (23 PENDING, 50 RUNNING, 127 TERMINATED)
[2m[36m(pid=25010)[0m 
[2m[36m(pid=25010)[0m 


[2m[36m(pid=113525)[0m Instructions for updating:
[2m[36m(pid=113525)[0m non-resource variables are not supported in the long term
[2m[36m(pid=106718)[0m 2021-07-20 11:42:21,683	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=106721)[0m Instructions for updating:
[2m[36m(pid=106721)[0m non-resource variables are not supported in the long term
[2m[36m(pid=106707)[0m Instructions for updating:
[2m[36m(pid=106707)[0m non-resource variables are not supported in the long term
[2m[36m(pid=109080)[0m Instructions for updating:
[2m[36m(pid=109080)[0m non-resource variables are not supported in the long term
[2m[36m(pid=109082)[0m Instructions for updating:
[2m[36m(pid=109082)[0m non-resource variables are not supported in the long term
[2m[36m(pid=106706)[0m Instructions for updating:
[2m[36m(pid=106706)[0m non-resource variables are not supported in the lo

[2m[36m(pid=25010)[0m == Status ==
[2m[36m(pid=25010)[0m Memory usage on this node: 12.7/187.6 GiB
[2m[36m(pid=25010)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=25010)[0m Resources requested: 147.0/152 CPUs, 0/0 GPUs, 0.0/512.14 GiB heap, 0.0/223.48 GiB objects
[2m[36m(pid=25010)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=25010)[0m Number of trials: 200/200 (18 PENDING, 49 RUNNING, 133 TERMINATED)
[2m[36m(pid=25010)[0m 
[2m[36m(pid=25010)[0m 


[2m[36m(pid=38583)[0m 2021-07-20 11:42:26,531	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=38681)[0m 2021-07-20 11:42:26,922	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=38683)[0m Instructions for updating:
[2m[36m(pid=38683)[0m non-resource variables are not supported in the long term
[2m[36m(pid=38682)[0m 2021-07-20 11:42:27,355	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=109878)[0m Instructions for updating:
[2m[36m(pid=109878)[0m non-resource variables are not supported in the long term
[2m[36m(pid=38683)[0m 2021-07-20 11:42:28,232	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and

[2m[36m(pid=25010)[0m == Status ==
[2m[36m(pid=25010)[0m Memory usage on this node: 14.3/187.6 GiB
[2m[36m(pid=25010)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=25010)[0m Resources requested: 147.0/152 CPUs, 0/0 GPUs, 0.0/512.14 GiB heap, 0.0/223.48 GiB objects
[2m[36m(pid=25010)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=25010)[0m Number of trials: 200/200 (8 PENDING, 49 RUNNING, 143 TERMINATED)
[2m[36m(pid=25010)[0m 
[2m[36m(pid=25010)[0m 


[2m[36m(pid=110483)[0m Instructions for updating:
[2m[36m(pid=110483)[0m non-resource variables are not supported in the long term
[2m[36m(pid=110490)[0m 2021-07-20 11:42:31,950	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=110484)[0m Instructions for updating:
[2m[36m(pid=110484)[0m non-resource variables are not supported in the long term
[2m[36m(pid=952)[0m Instructions for updating:
[2m[36m(pid=952)[0m non-resource variables are not supported in the long term
[2m[36m(pid=110468)[0m Instructions for updating:
[2m[36m(pid=110468)[0m non-resource variables are not supported in the long term
[2m[36m(pid=110474)[0m Instructions for updating:
[2m[36m(pid=110474)[0m non-resource variables are not supported in the long term
[2m[36m(pid=956)[0m Instructions for updating:
[2m[36m(pid=956)[0m non-resource variables are not supported in the long term
[2m

[2m[36m(pid=25010)[0m == Status ==
[2m[36m(pid=25010)[0m Memory usage on this node: 13.6/187.6 GiB
[2m[36m(pid=25010)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=25010)[0m Resources requested: 150.0/152 CPUs, 0/0 GPUs, 0.0/512.14 GiB heap, 0.0/223.48 GiB objects
[2m[36m(pid=25010)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=25010)[0m Number of trials: 200/200 (1 PENDING, 50 RUNNING, 149 TERMINATED)
[2m[36m(pid=25010)[0m 
[2m[36m(pid=25010)[0m 


[2m[36m(pid=1704)[0m Instructions for updating:
[2m[36m(pid=1704)[0m non-resource variables are not supported in the long term
[2m[36m(pid=1707)[0m Instructions for updating:
[2m[36m(pid=1707)[0m non-resource variables are not supported in the long term
[2m[36m(pid=108282)[0m Instructions for updating:
[2m[36m(pid=108282)[0m non-resource variables are not supported in the long term
[2m[36m(pid=1746)[0m Instructions for updating:
[2m[36m(pid=1746)[0m non-resource variables are not supported in the long term
[2m[36m(pid=1821)[0m Instructions for updating:
[2m[36m(pid=1821)[0m non-resource variables are not supported in the long term
[2m[36m(pid=40250)[0m 2021-07-20 11:42:37,972	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=40279)[0m 2021-07-20 11:42:37,966	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' 

[2m[36m(pid=25010)[0m == Status ==
[2m[36m(pid=25010)[0m Memory usage on this node: 14.3/187.6 GiB
[2m[36m(pid=25010)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=25010)[0m Resources requested: 135.0/152 CPUs, 0/0 GPUs, 0.0/512.14 GiB heap, 0.0/223.48 GiB objects
[2m[36m(pid=25010)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=25010)[0m Number of trials: 200/200 (45 RUNNING, 155 TERMINATED)
[2m[36m(pid=25010)[0m 
[2m[36m(pid=25010)[0m 


[2m[36m(pid=2230)[0m Instructions for updating:
[2m[36m(pid=2230)[0m non-resource variables are not supported in the long term
[2m[36m(pid=2231)[0m Instructions for updating:
[2m[36m(pid=2231)[0m non-resource variables are not supported in the long term
[2m[36m(pid=108924)[0m Instructions for updating:
[2m[36m(pid=108924)[0m non-resource variables are not supported in the long term
[2m[36m(pid=108923)[0m Instructions for updating:
[2m[36m(pid=108923)[0m non-resource variables are not supported in the long term
[2m[36m(pid=111747)[0m 2021-07-20 11:42:43,011	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=111788)[0m Instructions for updating:
[2m[36m(pid=111788)[0m non-resource variables are not supported in the long term
[2m[36m(pid=111787)[0m Instructions for updating:
[2m[36m(pid=111787)[0m non-resource variables are not supported in the long term


[2m[36m(pid=25010)[0m == Status ==
[2m[36m(pid=25010)[0m Memory usage on this node: 14.3/187.6 GiB
[2m[36m(pid=25010)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=25010)[0m Resources requested: 123.0/152 CPUs, 0/0 GPUs, 0.0/512.14 GiB heap, 0.0/223.48 GiB objects
[2m[36m(pid=25010)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=25010)[0m Number of trials: 200/200 (41 RUNNING, 159 TERMINATED)
[2m[36m(pid=25010)[0m 
[2m[36m(pid=25010)[0m 
[2m[36m(pid=25010)[0m == Status ==
[2m[36m(pid=25010)[0m Memory usage on this node: 12.5/187.6 GiB
[2m[36m(pid=25010)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=25010)[0m Resources requested: 93.0/152 CPUs, 0/0 GPUs, 0.0/512.14 GiB heap, 0.0/223.48 GiB objects
[2m[36m(pid=25010)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=25010)[0m Number of trials: 200/200 (31 RUNNING, 169 TERMINATED)
[2m[36m(pid=25010)[0m 
[2m[36m(pid=25010)[0m 
[2m[36m(pid=25010)[0m ==

[2m[36m(pid=25010)[0m 2021-07-20 11:43:19,814	INFO tune.py:549 -- Total run time: 174.98 seconds (174.73 seconds for the tuning loop).


<ray.tune.analysis.experiment_analysis.ExperimentAnalysis at 0x7ffdb2b48850>

In [10]:
# Hyperparameter sweep: run PPO on CartPole-v0 with the torch framework,
# handing Tune a grid_search over five candidate learning rates.
ppo_config = {
    "framework": "torch",
    "env": "CartPole-v0",
    "lr": tune.grid_search([0.001, 0.002, 0.003, 0.004, 0.005]),
}

# Stop criterion passed to Tune, keyed on the episode_reward_max metric.
stop_criteria = {"episode_reward_max": 200}

# Progress reporter for notebook display; the flag is the reporter's first
# argument (overwrite), given here by keyword instead of position.
notebook_reporter = JupyterNotebookReporter(overwrite=True)

analysis = tune.run(
    "PPO",
    stop=stop_criteria,
    config=ppo_config,
    progress_reporter=notebook_reporter,
)

<IPython.core.display.HTML object>


[2m[36m(pid=110180)[0m Instructions for updating:
[2m[36m(pid=110180)[0m non-resource variables are not supported in the long term
[2m[36m(pid=40586)[0m Instructions for updating:
[2m[36m(pid=40586)[0m non-resource variables are not supported in the long term
[2m[36m(pid=110180)[0m 2021-05-25 10:04:22,637	INFO trainer.py:694 -- Current log_level is WARN. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=42854)[0m Instructions for updating:
[2m[36m(pid=42854)[0m non-resource variables are not supported in the long term
[2m[36m(pid=40586)[0m 2021-05-25 10:04:22,978	INFO trainer.py:694 -- Current log_level is WARN. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=34269)[0m Instructions for updating:
[2m[36m(pid=34269)[0m non-resource variables are not supported in the long term
[2m[36m(pid=2297)[0m Instructions for updating:
[2m[36m(pid=2297)[0m non-resource v

[2K[36m(pid=27027)[0m [2K
[2m[36m(pid=27027)[0m <IPython.core.display.HTML object>
<IPython.core.display.HTML object>
<IPython.core.display.HTML object>
<IPython.core.display.HTML object>
<IPython.core.display.HTML object>


[2m[36m(pid=27027)[0m 2021-05-25 10:04:54,258	INFO tune.py:549 -- Total run time: 34.48 seconds (34.15 seconds for the tuning loop).
[2m[36m(pid=42854)[0m 2021-05-25 10:04:54,221	ERROR worker.py:382 -- SystemExit was raised from the worker
[2m[36m(pid=42854)[0m Traceback (most recent call last):
[2m[36m(pid=42854)[0m   File "python/ray/_raylet.pyx", line 495, in ray._raylet.execute_task
[2m[36m(pid=42854)[0m   File "python/ray/_raylet.pyx", line 505, in ray._raylet.execute_task
[2m[36m(pid=42854)[0m   File "python/ray/_raylet.pyx", line 449, in ray._raylet.execute_task.function_executor
[2m[36m(pid=42854)[0m   File "/lus/scratch/arigazzi/anaconda3/envs/smartsim/lib/python3.8/site-packages/ray/_private/function_manager.py", line 556, in actor_method_executor
[2m[36m(pid=42854)[0m     return method(__ray_actor, *args, **kwargs)
[2m[36m(pid=42854)[0m   File "/lus/scratch/arigazzi/anaconda3/envs/smartsim/lib/python3.8/site-packages/ray/actor.py", line 1001, in __