# Setting up a Ray cluster with SmartSim

## 1. Start the cluster
We set up a SmartSim experiment, which will handle the launch of the Ray cluster.

First we import the relevant modules.

In [1]:
import argparse
import os
import time

import numpy as np
import ray
import ray.util
from ray import tune
from ray.tune.progress_reporter import JupyterNotebookReporter

# `slurm` is needed by the allocation helpers (get_allocation / release_allocation).
from smartsim import Experiment, slurm
from smartsim.ray import RayCluster

# Number of Ray worker nodes requested in addition to the head node.
NUM_WORKERS = 3

# Allocation handle passed to RayCluster; None means no pre-obtained
# allocation is used. To run inside an explicit Slurm allocation instead,
# replace the assignment below with the commented-out call:
# alloc = slurm.get_allocation(
#     nodes=1 + NUM_WORKERS,
#     time="12:00:00",
#     options={"ntasks": str(1 + NUM_WORKERS), "partition": "spider", "C": "V100"},
# )
alloc = None

In [2]:
# Lines handed to `add_preamble` on the batch settings of the head and
# worker models (presumably emitted at the top of the generated batch
# scripts so the jobs run in the "smartsim" conda env — confirm).
conda_preamble = ["source ~/.bashrc", "conda activate smartsim"]

exp = Experiment("ray-cluster", launcher='slurm')
cluster = RayCluster(
    name="ray-cluster",
    run_args={},
    path='',
    launcher='slurm',
    workers=NUM_WORKERS,
    alloc=alloc,
    batch=True,
    ray_num_cpus=38,
)

if cluster.batch:
    # The worker model is only touched when workers were requested.
    model_attrs = ("head_model", "worker_model") if NUM_WORKERS else ("head_model",)
    for attr in model_attrs:
        # Pass a fresh list each time so the two models never share one object.
        getattr(cluster, attr).batch_settings.add_preamble(list(conda_preamble))

exp.generate(cluster, overwrite=True)

10:01:37 horizon SmartSim[11054] INFO Working in previously created experiment


In [3]:
# Launch the Ray cluster through the experiment; `block` and `summary`
# are both switched off for this call.
exp.start(
    cluster,
    block=False,
    summary=False,
)

10:01:49 horizon SmartSim[11054] INFO Ray cluster launched on nodes: ['nid00000', 'nid00002', 'nid00003', 'nid00001']


## 2. Start the Ray driver script

In [6]:
# Attach this notebook to the cluster's Ray Client server so that the
# `tune.run` call below schedules its trials on the SmartSim-launched
# cluster. Without this, a fresh kernel never connects to the cluster.
# `ray.util.connect` raises if a client connection already exists, so we
# only connect when needed; this keeps the cell safe to re-run.
# Port 10001 is taken from the original connect call (presumably the Ray
# Client server port configured by RayCluster — confirm).
if not ray.util.client.ray.is_connected():
    ray.util.connect(cluster.head_model.address + ":10001")

# Grid-search 100 learning rates for PPO on CartPole; each trial stops as
# soon as its maximum episode reward reaches 200.
tune.run(
    "PPO",
    stop={"episode_reward_max": 200},
    config={
        "framework": "torch",
        "env": "CartPole-v0",
        "num_gpus": 0,
        "lr": tune.grid_search(np.linspace(0.001, 0.01, 100).tolist()),
        "log_level": "ERROR",
    },
    # NOTE(review): user-specific absolute path; adjust for your system.
    local_dir="/lus/scratch/arigazzi/ray_local/",
    verbose=1,
    fail_fast=True,
    log_to_file=True,
)

[2m[36m(pid=89496)[0m == Status ==
[2m[36m(pid=89496)[0m Memory usage on this node: 5.6/187.6 GiB
[2m[36m(pid=89496)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=89496)[0m Resources requested: 0/152 CPUs, 0/0 GPUs, 0.0/512.37 GiB heap, 0.0/223.58 GiB objects
[2m[36m(pid=89496)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=89496)[0m Number of trials: 100/100 (100 PENDING)
[2m[36m(pid=89496)[0m 
[2m[36m(pid=89496)[0m 


[2m[36m(pid=77627)[0m Instructions for updating:
[2m[36m(pid=77627)[0m non-resource variables are not supported in the long term
[2m[36m(pid=78171)[0m Instructions for updating:
[2m[36m(pid=78171)[0m non-resource variables are not supported in the long term
[2m[36m(pid=5756)[0m Instructions for updating:
[2m[36m(pid=5756)[0m non-resource variables are not supported in the long term
[2m[36m(pid=78172)[0m Instructions for updating:
[2m[36m(pid=78172)[0m non-resource variables are not supported in the long term
[2m[36m(pid=5763)[0m Instructions for updating:
[2m[36m(pid=5763)[0m non-resource variables are not supported in the long term
[2m[36m(pid=79309)[0m Instructions for updating:
[2m[36m(pid=79309)[0m non-resource variables are not supported in the long term
[2m[36m(pid=79326)[0m Instructions for updating:
[2m[36m(pid=79326)[0m non-resource variables are not supported in the long term
[2m[36m(pid=98116)[0m Instructions for updating:
[2m[3

[2m[36m(pid=89496)[0m == Status ==
[2m[36m(pid=89496)[0m Memory usage on this node: 9.9/187.6 GiB
[2m[36m(pid=89496)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=89496)[0m Resources requested: 150.0/152 CPUs, 0/0 GPUs, 0.0/512.37 GiB heap, 0.0/223.58 GiB objects
[2m[36m(pid=89496)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=89496)[0m Number of trials: 100/100 (50 PENDING, 50 RUNNING)
[2m[36m(pid=89496)[0m 
[2m[36m(pid=89496)[0m 


[2m[36m(pid=78458)[0m 2021-05-26 08:59:40,054	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=78460)[0m 2021-05-26 08:59:40,064	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=78357)[0m 2021-05-26 08:59:40,076	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=78287)[0m 2021-05-26 08:59:40,073	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=78473)[0m 2021-05-26 08:59:40,079	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=5849)[0m 2021-05-26 08:59:40,126	INFO trainer.py:694 -- Curr

[2m[36m(pid=89496)[0m == Status ==
[2m[36m(pid=89496)[0m Memory usage on this node: 14.2/187.6 GiB
[2m[36m(pid=89496)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=89496)[0m Resources requested: 150.0/152 CPUs, 0/0 GPUs, 0.0/512.37 GiB heap, 0.0/223.58 GiB objects
[2m[36m(pid=89496)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=89496)[0m Number of trials: 100/100 (50 PENDING, 50 RUNNING)
[2m[36m(pid=89496)[0m 
[2m[36m(pid=89496)[0m 
[2m[36m(pid=89496)[0m == Status ==
[2m[36m(pid=89496)[0m Memory usage on this node: 14.2/187.6 GiB
[2m[36m(pid=89496)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=89496)[0m Resources requested: 150.0/152 CPUs, 0/0 GPUs, 0.0/512.37 GiB heap, 0.0/223.58 GiB objects
[2m[36m(pid=89496)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=89496)[0m Number of trials: 100/100 (50 PENDING, 50 RUNNING)
[2m[36m(pid=89496)[0m 
[2m[36m(pid=89496)[0m 
[2m[36m(pid=89496)[0m == Status

[2m[36m(pid=78200)[0m Instructions for updating:
[2m[36m(pid=78200)[0m non-resource variables are not supported in the long term
[2m[36m(pid=78200)[0m 2021-05-26 09:00:05,127	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=5776)[0m Instructions for updating:
[2m[36m(pid=5776)[0m non-resource variables are not supported in the long term
[2m[36m(pid=80178)[0m Instructions for updating:
[2m[36m(pid=80178)[0m non-resource variables are not supported in the long term
[2m[36m(pid=80175)[0m Instructions for updating:
[2m[36m(pid=80175)[0m non-resource variables are not supported in the long term
[2m[36m(pid=80195)[0m Instructions for updating:
[2m[36m(pid=80195)[0m non-resource variables are not supported in the long term
[2m[36m(pid=80213)[0m Instructions for updating:
[2m[36m(pid=80213)[0m non-resource variables are not supported in the long term
[2m[3

[2m[36m(pid=89496)[0m == Status ==
[2m[36m(pid=89496)[0m Memory usage on this node: 15.4/187.6 GiB
[2m[36m(pid=89496)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=89496)[0m Resources requested: 150.0/152 CPUs, 0/0 GPUs, 0.0/512.37 GiB heap, 0.0/223.58 GiB objects
[2m[36m(pid=89496)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=89496)[0m Number of trials: 100/100 (42 PENDING, 50 RUNNING, 8 TERMINATED)
[2m[36m(pid=89496)[0m 
[2m[36m(pid=89496)[0m 


[2m[36m(pid=7797)[0m 2021-05-26 09:00:08,885	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=81579)[0m 2021-05-26 09:00:09,163	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=7836)[0m Instructions for updating:
[2m[36m(pid=7836)[0m non-resource variables are not supported in the long term
[2m[36m(pid=7835)[0m Instructions for updating:
[2m[36m(pid=7835)[0m non-resource variables are not supported in the long term
[2m[36m(pid=101402)[0m Instructions for updating:
[2m[36m(pid=101402)[0m non-resource variables are not supported in the long term
[2m[36m(pid=80196)[0m Instructions for updating:
[2m[36m(pid=80196)[0m non-resource variables are not supported in the long term
[2m[36m(pid=80203)[0m Instructions for updating:
[2m[36m(pid=80203)[0m non-resource var

[2m[36m(pid=89496)[0m == Status ==
[2m[36m(pid=89496)[0m Memory usage on this node: 14.3/187.6 GiB
[2m[36m(pid=89496)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=89496)[0m Resources requested: 147.0/152 CPUs, 0/0 GPUs, 0.0/512.37 GiB heap, 0.0/223.58 GiB objects
[2m[36m(pid=89496)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=89496)[0m Number of trials: 100/100 (33 PENDING, 49 RUNNING, 18 TERMINATED)
[2m[36m(pid=89496)[0m 
[2m[36m(pid=89496)[0m 


[2m[36m(pid=7826)[0m Instructions for updating:
[2m[36m(pid=7826)[0m non-resource variables are not supported in the long term
[2m[36m(pid=102227)[0m Instructions for updating:
[2m[36m(pid=102227)[0m non-resource variables are not supported in the long term
[2m[36m(pid=80189)[0m 2021-05-26 09:00:14,296	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=82053)[0m 2021-05-26 09:00:14,575	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=8417)[0m Instructions for updating:
[2m[36m(pid=8417)[0m non-resource variables are not supported in the long term
[2m[36m(pid=7826)[0m 2021-05-26 09:00:14,986	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=82094)[0m Instructions for u

[2m[36m(pid=89496)[0m == Status ==
[2m[36m(pid=89496)[0m Memory usage on this node: 10.5/187.6 GiB
[2m[36m(pid=89496)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=89496)[0m Resources requested: 150.0/152 CPUs, 0/0 GPUs, 0.0/512.37 GiB heap, 0.0/223.58 GiB objects
[2m[36m(pid=89496)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=89496)[0m Number of trials: 100/100 (6 PENDING, 50 RUNNING, 44 TERMINATED)
[2m[36m(pid=89496)[0m 
[2m[36m(pid=89496)[0m 


[2m[36m(pid=82782)[0m Instructions for updating:
[2m[36m(pid=82782)[0m non-resource variables are not supported in the long term
[2m[36m(pid=82719)[0m Instructions for updating:
[2m[36m(pid=82719)[0m non-resource variables are not supported in the long term
[2m[36m(pid=80936)[0m Instructions for updating:
[2m[36m(pid=80936)[0m non-resource variables are not supported in the long term
[2m[36m(pid=80970)[0m Instructions for updating:
[2m[36m(pid=80970)[0m non-resource variables are not supported in the long term
[2m[36m(pid=80972)[0m Instructions for updating:
[2m[36m(pid=80972)[0m non-resource variables are not supported in the long term
[2m[36m(pid=8861)[0m 2021-05-26 09:00:19,224	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=80941)[0m Instructions for updating:
[2m[36m(pid=80941)[0m non-resource variables are not supported in the long term
[2m[

[2m[36m(pid=89496)[0m == Status ==
[2m[36m(pid=89496)[0m Memory usage on this node: 14.0/187.6 GiB
[2m[36m(pid=89496)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=89496)[0m Resources requested: 147.0/152 CPUs, 0/0 GPUs, 0.0/512.37 GiB heap, 0.0/223.58 GiB objects
[2m[36m(pid=89496)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=89496)[0m Number of trials: 100/100 (6 PENDING, 49 RUNNING, 45 TERMINATED)
[2m[36m(pid=89496)[0m 
[2m[36m(pid=89496)[0m 


[2m[36m(pid=104113)[0m Instructions for updating:
[2m[36m(pid=104113)[0m non-resource variables are not supported in the long term
[2m[36m(pid=8881)[0m Instructions for updating:
[2m[36m(pid=8881)[0m non-resource variables are not supported in the long term
[2m[36m(pid=81671)[0m Instructions for updating:
[2m[36m(pid=81671)[0m non-resource variables are not supported in the long term
[2m[36m(pid=83983)[0m Instructions for updating:
[2m[36m(pid=83983)[0m non-resource variables are not supported in the long term
[2m[36m(pid=83982)[0m Instructions for updating:
[2m[36m(pid=83982)[0m non-resource variables are not supported in the long term
[2m[36m(pid=9899)[0m Instructions for updating:
[2m[36m(pid=9899)[0m non-resource variables are not supported in the long term
[2m[36m(pid=8881)[0m 2021-05-26 09:00:28,448	INFO trainer.py:694 -- Current log_level is ERROR. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36

[2m[36m(pid=89496)[0m == Status ==
[2m[36m(pid=89496)[0m Memory usage on this node: 14.3/187.6 GiB
[2m[36m(pid=89496)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=89496)[0m Resources requested: 150.0/152 CPUs, 0/0 GPUs, 0.0/512.37 GiB heap, 0.0/223.58 GiB objects
[2m[36m(pid=89496)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=89496)[0m Number of trials: 100/100 (50 RUNNING, 50 TERMINATED)
[2m[36m(pid=89496)[0m 
[2m[36m(pid=89496)[0m 


[2m[36m(pid=9944)[0m Instructions for updating:
[2m[36m(pid=9944)[0m non-resource variables are not supported in the long term
[2m[36m(pid=9942)[0m Instructions for updating:
[2m[36m(pid=9942)[0m non-resource variables are not supported in the long term
[2m[36m(pid=84099)[0m Instructions for updating:
[2m[36m(pid=84099)[0m non-resource variables are not supported in the long term
[2m[36m(pid=84119)[0m Instructions for updating:
[2m[36m(pid=84119)[0m non-resource variables are not supported in the long term
[2m[36m(pid=84081)[0m Instructions for updating:
[2m[36m(pid=84081)[0m non-resource variables are not supported in the long term
[2m[36m(pid=84112)[0m Instructions for updating:
[2m[36m(pid=84112)[0m non-resource variables are not supported in the long term
[2m[36m(pid=9933)[0m Instructions for updating:
[2m[36m(pid=9933)[0m non-resource variables are not supported in the long term
[2m[36m(pid=9945)[0m Instructions for updating:
[2m[36m(

[2m[36m(pid=89496)[0m == Status ==
[2m[36m(pid=89496)[0m Memory usage on this node: 15.1/187.6 GiB
[2m[36m(pid=89496)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=89496)[0m Resources requested: 147.0/152 CPUs, 0/0 GPUs, 0.0/512.37 GiB heap, 0.0/223.58 GiB objects
[2m[36m(pid=89496)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=89496)[0m Number of trials: 100/100 (49 RUNNING, 51 TERMINATED)
[2m[36m(pid=89496)[0m 
[2m[36m(pid=89496)[0m 


[2m[36m(pid=105364)[0m Instructions for updating:
[2m[36m(pid=105364)[0m non-resource variables are not supported in the long term
[2m[36m(pid=105958)[0m Instructions for updating:
[2m[36m(pid=105958)[0m non-resource variables are not supported in the long term


[2m[36m(pid=89496)[0m == Status ==
[2m[36m(pid=89496)[0m Memory usage on this node: 14.3/187.6 GiB
[2m[36m(pid=89496)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=89496)[0m Resources requested: 135.0/152 CPUs, 0/0 GPUs, 0.0/512.37 GiB heap, 0.0/223.58 GiB objects
[2m[36m(pid=89496)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=89496)[0m Number of trials: 100/100 (45 RUNNING, 55 TERMINATED)
[2m[36m(pid=89496)[0m 
[2m[36m(pid=89496)[0m 
[2m[36m(pid=89496)[0m == Status ==
[2m[36m(pid=89496)[0m Memory usage on this node: 13.6/187.6 GiB
[2m[36m(pid=89496)[0m Using FIFO scheduling algorithm.
[2m[36m(pid=89496)[0m Resources requested: 105.0/152 CPUs, 0/0 GPUs, 0.0/512.37 GiB heap, 0.0/223.58 GiB objects
[2m[36m(pid=89496)[0m Result logdir: /lus/scratch/arigazzi/ray_local/PPO
[2m[36m(pid=89496)[0m Number of trials: 100/100 (35 RUNNING, 65 TERMINATED)
[2m[36m(pid=89496)[0m 
[2m[36m(pid=89496)[0m 
[2m[36m(pid=89496)[0m == 

[2m[36m(pid=105315)[0m 2021-05-26 09:01:11,317	ERROR worker.py:382 -- SystemExit was raised from the worker
[2m[36m(pid=105315)[0m Traceback (most recent call last):
[2m[36m(pid=105315)[0m   File "python/ray/_raylet.pyx", line 488, in ray._raylet.execute_task
[2m[36m(pid=105315)[0m   File "python/ray/_raylet.pyx", line 495, in ray._raylet.execute_task
[2m[36m(pid=105315)[0m   File "python/ray/_raylet.pyx", line 505, in ray._raylet.execute_task
[2m[36m(pid=105315)[0m   File "python/ray/_raylet.pyx", line 449, in ray._raylet.execute_task.function_executor
[2m[36m(pid=105315)[0m   File "/lus/scratch/arigazzi/anaconda3/envs/smartsim/lib/python3.8/site-packages/ray/_private/function_manager.py", line 556, in actor_method_executor
[2m[36m(pid=105315)[0m     return method(__ray_actor, *args, **kwargs)
[2m[36m(pid=105315)[0m   File "/lus/scratch/arigazzi/anaconda3/envs/smartsim/lib/python3.8/site-packages/ray/actor.py", line 1001, in __ray_terminate__
[2m[36m(pid=1

<ray.tune.analysis.experiment_analysis.ExperimentAnalysis at 0x7f1cdc43e370>

## 3. Stop cluster and release allocation

In [5]:
# Release the Slurm allocation only if one was explicitly obtained; with
# the default `alloc = None` there is nothing to release.
if alloc:
    slurm.release_allocation(alloc)
    # Forget the released handle so that re-running this cell cannot try
    # to release the same allocation a second time.
    alloc = None

In [7]:
# Stop the jobs that the experiment launched for the Ray cluster
# (the log output below shows the worker and head models being stopped).
exp.stop(cluster)

09:04:54 horizon SmartSim[34190] INFO Stopping model workers with job name workers-CBN834UC8A6R
09:04:54 horizon SmartSim[34190] INFO Stopping model head with job name head-CBN831L2EAET


The autoscaler failed with the following error:
Terminated with signal 15
  File "/lus/scratch/arigazzi/anaconda3/envs/smartsim/lib/python3.8/site-packages/ray/_private/monitor.py", line 376, in <module>
    monitor.run()
  File "/lus/scratch/arigazzi/anaconda3/envs/smartsim/lib/python3.8/site-packages/ray/_private/monitor.py", line 284, in run
    self._run()
  File "/lus/scratch/arigazzi/anaconda3/envs/smartsim/lib/python3.8/site-packages/ray/_private/monitor.py", line 202, in _run
    time.sleep(AUTOSCALER_UPDATE_INTERVAL_S)
  File "/lus/scratch/arigazzi/anaconda3/envs/smartsim/lib/python3.8/site-packages/ray/_private/monitor.py", line 273, in _signal_handler
    "".join(traceback.format_stack(frame)))
  File "/lus/scratch/arigazzi/anaconda3/envs/smartsim/lib/python3.8/traceback.py", line 197, in format_stack
    return format_list(extract_stack(f, limit=limit))
  File "/lus/scratch/arigazzi/anaconda3/envs/smartsim/lib/python3.8/traceback.py", line 211, in extract_stack
    stack = 

In [9]:

# NOTE(review): in document order this cell comes after `exp.stop(cluster)`,
# so on a top-to-bottom run the SmartSim cluster is no longer available here.
# Confirm whether this cell should be moved before the stop step.

# 50 evenly spaced learning rates between 0.001 and 0.01 (inclusive).
learning_rates = np.linspace(0.001, 0.01, 50).tolist()

ppo_config = {
    "framework": "torch",
    "env": "CartPole-v0",
    "lr": tune.grid_search(learning_rates),
    "log_level": "ERROR",
}

# Same PPO/CartPole sweep as before, but reporting progress through the
# notebook-aware reporter instead of plain log lines.
tune.run(
    "PPO",
    stop={"episode_reward_max": 200},
    config=ppo_config,
    local_dir="/lus/scratch/arigazzi/ray_local/",
    verbose=1,
    progress_reporter=JupyterNotebookReporter(True),
)

<IPython.core.display.HTML object>


[2m[36m(pid=39779)[0m Instructions for updating:
[2m[36m(pid=39779)[0m non-resource variables are not supported in the long term
[2m[36m(pid=39781)[0m Instructions for updating:
[2m[36m(pid=39781)[0m non-resource variables are not supported in the long term
[2m[36m(pid=113189)[0m Instructions for updating:
[2m[36m(pid=113189)[0m non-resource variables are not supported in the long term
[2m[36m(pid=113188)[0m Instructions for updating:
[2m[36m(pid=113188)[0m non-resource variables are not supported in the long term
[2m[36m(pid=39780)[0m Instructions for updating:
[2m[36m(pid=39780)[0m non-resource variables are not supported in the long term
[2m[36m(pid=39774)[0m Instructions for updating:
[2m[36m(pid=39774)[0m non-resource variables are not supported in the long term
[2m[36m(pid=39770)[0m Instructions for updating:
[2m[36m(pid=39770)[0m non-resource variables are not supported in the long term
[2m[36m(pid=113191)[0m Instructions for updating

<IPython.core.display.HTML object>
<IPython.core.display.HTML object>
<IPython.core.display.HTML object>
<IPython.core.display.HTML object>
[2K[36m(pid=27027)[0m [2K
[2m[36m(pid=27027)[0m <IPython.core.display.HTML object>
<IPython.core.display.HTML object>
<IPython.core.display.HTML object>


[2m[36m(pid=27027)[0m 2021-05-25 10:02:22,533	INFO tune.py:549 -- Total run time: 55.35 seconds (55.19 seconds for the tuning loop).


<ray.tune.analysis.experiment_analysis.ExperimentAnalysis at 0x7fd356fd07c0>

In [10]:
# Small sweep over five explicit learning rates; the result object is kept
# in `analysis` for later inspection.
lr_candidates = [0.001, 0.002, 0.003, 0.004, 0.005]

analysis = tune.run(
    "PPO",
    stop=dict(episode_reward_max=200),
    config=dict(
        framework="torch",
        env="CartPole-v0",
        lr=tune.grid_search(lr_candidates),
    ),
    progress_reporter=JupyterNotebookReporter(True),
)

<IPython.core.display.HTML object>


[2m[36m(pid=110180)[0m Instructions for updating:
[2m[36m(pid=110180)[0m non-resource variables are not supported in the long term
[2m[36m(pid=40586)[0m Instructions for updating:
[2m[36m(pid=40586)[0m non-resource variables are not supported in the long term
[2m[36m(pid=110180)[0m 2021-05-25 10:04:22,637	INFO trainer.py:694 -- Current log_level is WARN. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=42854)[0m Instructions for updating:
[2m[36m(pid=42854)[0m non-resource variables are not supported in the long term
[2m[36m(pid=40586)[0m 2021-05-25 10:04:22,978	INFO trainer.py:694 -- Current log_level is WARN. For more information, set 'log_level': 'INFO' / 'DEBUG' or use the -v and -vv flags.
[2m[36m(pid=34269)[0m Instructions for updating:
[2m[36m(pid=34269)[0m non-resource variables are not supported in the long term
[2m[36m(pid=2297)[0m Instructions for updating:
[2m[36m(pid=2297)[0m non-resource v

[2K[36m(pid=27027)[0m [2K
[2m[36m(pid=27027)[0m <IPython.core.display.HTML object>
<IPython.core.display.HTML object>
<IPython.core.display.HTML object>
<IPython.core.display.HTML object>
<IPython.core.display.HTML object>


[2m[36m(pid=27027)[0m 2021-05-25 10:04:54,258	INFO tune.py:549 -- Total run time: 34.48 seconds (34.15 seconds for the tuning loop).
[2m[36m(pid=42854)[0m 2021-05-25 10:04:54,221	ERROR worker.py:382 -- SystemExit was raised from the worker
[2m[36m(pid=42854)[0m Traceback (most recent call last):
[2m[36m(pid=42854)[0m   File "python/ray/_raylet.pyx", line 495, in ray._raylet.execute_task
[2m[36m(pid=42854)[0m   File "python/ray/_raylet.pyx", line 505, in ray._raylet.execute_task
[2m[36m(pid=42854)[0m   File "python/ray/_raylet.pyx", line 449, in ray._raylet.execute_task.function_executor
[2m[36m(pid=42854)[0m   File "/lus/scratch/arigazzi/anaconda3/envs/smartsim/lib/python3.8/site-packages/ray/_private/function_manager.py", line 556, in actor_method_executor
[2m[36m(pid=42854)[0m     return method(__ray_actor, *args, **kwargs)
[2m[36m(pid=42854)[0m   File "/lus/scratch/arigazzi/anaconda3/envs/smartsim/lib/python3.8/site-packages/ray/actor.py", line 1001, in __