In [1]:
import torch.optim as optim
from ray import tune
from ray.tune import track
from ray.tune.schedulers import ASHAScheduler
from ray.tune.examples.mnist_pytorch import get_data_loaders, ConvNet, train, test

from dpdqn_v2 import DPDQN2
import os
import gym
import numpy as np
import matplotlib.pyplot as plt

from shutil import copyfile
from utils import *
import pickle
import pandas as pd

import datetime

In [2]:
# test 1 on server

In [3]:
%%time
exp_name="server_tune_" + datetime.datetime.now().strftime("%Y_%B_%d_%I_%M%p")

def train_DPDQN(config):
    time_steps = 1e6 #testrun
    envname = "BipedalWalker-v2"
    env = gym.make(envname)
    model = DPDQN2(env, verbose=0, ray_tune=True, 
                  batch_size=config["batch_size"], num_action_samples_final=config["num_action_samples_final"],
                   hidden_size2=config["hidden_size2"]
                  )
    model.learn(total_timesteps=int(time_steps))
    

search_space={
    "batch_size": tune.grid_search([16, 32]),
    "num_action_samples_final": tune.grid_search([11, 13, 16]),
    "hidden_size2": tune.grid_search([16, 32]),
}

analysis = tune.run(
    train_DPDQN,
    name=exp_name,
    config=search_space,
    resources_per_trial={"cpu": 1, "gpu": 0}
)

print("Best config: ", analysis.get_best_config(metric="mean_reward"))

dfs = analysis.trial_dataframes
pickle.dump(dfs, open("tune_results.p", "wb"), pickle.HIGHEST_PROTOCOL)


#tensorboard --logdir ~/ray_results

2019-11-17 18:26:23,758	INFO resource_spec.py:205 -- Starting Ray with 3.52 GiB memory available for workers and up to 1.76 GiB for objects. You can adjust these settings with ray.init(memory=<bytes>, object_store_memory=<bytes>).
2019-11-17 18:26:24,542	INFO function_runner.py:254 -- tune.track signature detected.


== Status ==
Using FIFO scheduling algorithm.
Resources requested: 0/12 CPUs, 0/0 GPUs, 0.0/3.52 GiB heap, 0.0/1.17 GiB objects
Memory usage on this node: 10.4/16.0 GiB

== Status ==
Using FIFO scheduling algorithm.
Resources requested: 1/12 CPUs, 0/0 GPUs, 0.0/3.52 GiB heap, 0.0/1.17 GiB objects
Memory usage on this node: 10.8/16.0 GiB
Result logdir: /Users/aydarakhmetzyanov/ray_results/server_tune_2019_November_17_06_26PM
Number of trials: 6 ({'RUNNING': 1, 'PENDING': 5})
PENDING trials:
 - train_DPDQN_1_batch_size=32,num_action_samples_final=11:	PENDING
 - train_DPDQN_2_batch_size=16,num_action_samples_final=13:	PENDING
 - train_DPDQN_3_batch_size=32,num_action_samples_final=13:	PENDING
 - train_DPDQN_4_batch_size=16,num_action_samples_final=16:	PENDING
 - train_DPDQN_5_batch_size=32,num_action_samples_final=16:	PENDING
RUNNING trials:
 - train_DPDQN_0_batch_size=16,num_action_samples_final=11:	RUNNING

Result for train_DPDQN_1_batch_size=32,num_action_samples_final=11:
  date: 2019

Result for train_DPDQN_0_batch_size=16,num_action_samples_final=11:
  date: 2019-11-17_18-33-31
  done: false
  experiment_id: 37b314b1c99048628be50f56fe9079f5
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 2
  mean_reward: -115.16971490711597
  node_ip: 192.168.0.11
  pid: 53574
  time_since_restore: 421.5475399494171
  time_this_iter_s: 406.9761862754822
  time_total_s: 421.5475399494171
  timestamp: 1574004811
  timesteps_since_restore: 0
  training_iteration: 1
  trial_id: 9daba08c
  
== Status ==
Using FIFO scheduling algorithm.
Resources requested: 6/12 CPUs, 0/0 GPUs, 0.0/3.52 GiB heap, 0.0/1.17 GiB objects
Memory usage on this node: 10.7/16.0 GiB
Result logdir: /Users/aydarakhmetzyanov/ray_results/server_tune_2019_November_17_06_26PM
Number of trials: 6 ({'RUNNING': 6})
RUNNING trials:
 - train_DPDQN_0_batch_size=16,num_action_samples_final=11:	RUNNING, [1 CPUs, 0 GPUs], [pid=53574], 421 s, 1 iter
 - train_DPDQN_1_batch_size=32,num_action_samples_final=11:	RUN

Result for train_DPDQN_2_batch_size=16,num_action_samples_final=13:
  date: 2019-11-17_18-40-09
  done: false
  experiment_id: c3527cba03e249f8a560644386cc4f12
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 3
  mean_reward: -108.75512040178563
  node_ip: 192.168.0.11
  pid: 53575
  time_since_restore: 819.4494960308075
  time_this_iter_s: 387.382287979126
  time_total_s: 819.4494960308075
  timestamp: 1574005209
  timesteps_since_restore: 0
  training_iteration: 2
  trial_id: 9dae5818
  
== Status ==
Using FIFO scheduling algorithm.
Resources requested: 6/12 CPUs, 0/0 GPUs, 0.0/3.52 GiB heap, 0.0/1.17 GiB objects
Memory usage on this node: 10.7/16.0 GiB
Result logdir: /Users/aydarakhmetzyanov/ray_results/server_tune_2019_November_17_06_26PM
Number of trials: 6 ({'RUNNING': 6})
RUNNING trials:
 - train_DPDQN_0_batch_size=16,num_action_samples_final=11:	RUNNING, [1 CPUs, 0 GPUs], [pid=53574], 808 s, 2 iter
 - train_DPDQN_1_batch_size=32,num_action_samples_final=11:	RUNN

Result for train_DPDQN_3_batch_size=32,num_action_samples_final=13:
  date: 2019-11-17_18-53-17
  done: false
  experiment_id: 81be98b074f94c8ba21d466ff110ffc7
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 3
  mean_reward: -112.68989252508511
  node_ip: 192.168.0.11
  pid: 53578
  time_since_restore: 1607.5648639202118
  time_this_iter_s: 845.2954161167145
  time_total_s: 1607.5648639202118
  timestamp: 1574005997
  timesteps_since_restore: 0
  training_iteration: 2
  trial_id: 9dae8676
  
== Status ==
Using FIFO scheduling algorithm.
Resources requested: 6/12 CPUs, 0/0 GPUs, 0.0/3.52 GiB heap, 0.0/1.17 GiB objects
Memory usage on this node: 10.8/16.0 GiB
Result logdir: /Users/aydarakhmetzyanov/ray_results/server_tune_2019_November_17_06_26PM
Number of trials: 6 ({'RUNNING': 6})
RUNNING trials:
 - train_DPDQN_0_batch_size=16,num_action_samples_final=11:	RUNNING, [1 CPUs, 0 GPUs], [pid=53574], 1232 s, 3 iter
 - train_DPDQN_1_batch_size=32,num_action_samples_final=11:	

Result for train_DPDQN_4_batch_size=16,num_action_samples_final=16:
  date: 2019-11-17_19-03-10
  done: false
  experiment_id: 69ea6546e9db453c92ac8344ebf895c5
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 6
  mean_reward: -127.07428840831012
  node_ip: 192.168.0.11
  pid: 53572
  time_since_restore: 2200.706253051758
  time_this_iter_s: 429.17781615257263
  time_total_s: 2200.706253051758
  timestamp: 1574006590
  timesteps_since_restore: 0
  training_iteration: 5
  trial_id: 9daeb2b8
  
== Status ==
Using FIFO scheduling algorithm.
Resources requested: 6/12 CPUs, 0/0 GPUs, 0.0/3.52 GiB heap, 0.0/1.17 GiB objects
Memory usage on this node: 10.5/16.0 GiB
Result logdir: /Users/aydarakhmetzyanov/ray_results/server_tune_2019_November_17_06_26PM
Number of trials: 6 ({'RUNNING': 6})
RUNNING trials:
 - train_DPDQN_0_batch_size=16,num_action_samples_final=11:	RUNNING, [1 CPUs, 0 GPUs], [pid=53574], 2106 s, 5 iter
 - train_DPDQN_1_batch_size=32,num_action_samples_final=11:	R

Result for train_DPDQN_4_batch_size=16,num_action_samples_final=16:
  date: 2019-11-17_19-11-04
  done: false
  experiment_id: 69ea6546e9db453c92ac8344ebf895c5
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 7
  mean_reward: -47.39453606233561
  node_ip: 192.168.0.11
  pid: 53572
  time_since_restore: 2674.985541820526
  time_this_iter_s: 474.2792887687683
  time_total_s: 2674.985541820526
  timestamp: 1574007064
  timesteps_since_restore: 0
  training_iteration: 6
  trial_id: 9daeb2b8
  
== Status ==
Using FIFO scheduling algorithm.
Resources requested: 6/12 CPUs, 0/0 GPUs, 0.0/3.52 GiB heap, 0.0/1.17 GiB objects
Memory usage on this node: 10.5/16.0 GiB
Result logdir: /Users/aydarakhmetzyanov/ray_results/server_tune_2019_November_17_06_26PM
Number of trials: 6 ({'RUNNING': 6})
RUNNING trials:
 - train_DPDQN_0_batch_size=16,num_action_samples_final=11:	RUNNING, [1 CPUs, 0 GPUs], [pid=53574], 2583 s, 6 iter
 - train_DPDQN_1_batch_size=32,num_action_samples_final=11:	RUN

Result for train_DPDQN_0_batch_size=16,num_action_samples_final=11:
  date: 2019-11-17_19-22-37
  done: false
  experiment_id: 37b314b1c99048628be50f56fe9079f5
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 9
  mean_reward: -103.88810161990625
  node_ip: 192.168.0.11
  pid: 53574
  time_since_restore: 3367.686164855957
  time_this_iter_s: 389.58097410202026
  time_total_s: 3367.686164855957
  timestamp: 1574007757
  timesteps_since_restore: 0
  training_iteration: 8
  trial_id: 9daba08c
  
== Status ==
Using FIFO scheduling algorithm.
Resources requested: 6/12 CPUs, 0/0 GPUs, 0.0/3.52 GiB heap, 0.0/1.17 GiB objects
Memory usage on this node: 10.6/16.0 GiB
Result logdir: /Users/aydarakhmetzyanov/ray_results/server_tune_2019_November_17_06_26PM
Number of trials: 6 ({'RUNNING': 6})
RUNNING trials:
 - train_DPDQN_0_batch_size=16,num_action_samples_final=11:	RUNNING, [1 CPUs, 0 GPUs], [pid=53574], 3367 s, 8 iter
 - train_DPDQN_1_batch_size=32,num_action_samples_final=11:	R

Result for train_DPDQN_5_batch_size=32,num_action_samples_final=16:
  date: 2019-11-17_19-30-42
  done: false
  experiment_id: 4ea8c7a406a34f1aacfa0aad3980162e
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 6
  mean_reward: -119.0998070924805
  node_ip: 192.168.0.11
  pid: 53571
  time_since_restore: 3852.9713249206543
  time_this_iter_s: 724.3520228862762
  time_total_s: 3852.9713249206543
  timestamp: 1574008242
  timesteps_since_restore: 0
  training_iteration: 5
  trial_id: 9daee11e
  
== Status ==
Using FIFO scheduling algorithm.
Resources requested: 6/12 CPUs, 0/0 GPUs, 0.0/3.52 GiB heap, 0.0/1.17 GiB objects
Memory usage on this node: 10.5/16.0 GiB
Result logdir: /Users/aydarakhmetzyanov/ray_results/server_tune_2019_November_17_06_26PM
Number of trials: 6 ({'RUNNING': 6})
RUNNING trials:
 - train_DPDQN_0_batch_size=16,num_action_samples_final=11:	RUNNING, [1 CPUs, 0 GPUs], [pid=53574], 3745 s, 9 iter
 - train_DPDQN_1_batch_size=32,num_action_samples_final=11:	R

Result for train_DPDQN_2_batch_size=16,num_action_samples_final=13:
  date: 2019-11-17_19-41-44
  done: false
  experiment_id: c3527cba03e249f8a560644386cc4f12
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 12
  mean_reward: -92.35569570293235
  node_ip: 192.168.0.11
  pid: 53575
  time_since_restore: 4514.646391153336
  time_this_iter_s: 378.09564900398254
  time_total_s: 4514.646391153336
  timestamp: 1574008904
  timesteps_since_restore: 0
  training_iteration: 11
  trial_id: 9dae5818
  
== Status ==
Using FIFO scheduling algorithm.
Resources requested: 6/12 CPUs, 0/0 GPUs, 0.0/3.52 GiB heap, 0.0/1.17 GiB objects
Memory usage on this node: 10.5/16.0 GiB
Result logdir: /Users/aydarakhmetzyanov/ray_results/server_tune_2019_November_17_06_26PM
Number of trials: 6 ({'RUNNING': 6})
RUNNING trials:
 - train_DPDQN_0_batch_size=16,num_action_samples_final=11:	RUNNING, [1 CPUs, 0 GPUs], [pid=53574], 4123 s, 10 iter
 - train_DPDQN_1_batch_size=32,num_action_samples_final=11:

Result for train_DPDQN_4_batch_size=16,num_action_samples_final=16:
  date: 2019-11-17_19-50-27
  done: false
  experiment_id: 69ea6546e9db453c92ac8344ebf895c5
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 13
  mean_reward: -100.72204651194227
  node_ip: 192.168.0.11
  pid: 53572
  time_since_restore: 5037.786816835403
  time_this_iter_s: 390.2484829425812
  time_total_s: 5037.786816835403
  timestamp: 1574009427
  timesteps_since_restore: 0
  training_iteration: 12
  trial_id: 9daeb2b8
  
== Status ==
Using FIFO scheduling algorithm.
Resources requested: 6/12 CPUs, 0/0 GPUs, 0.0/3.52 GiB heap, 0.0/1.17 GiB objects
Memory usage on this node: 10.7/16.0 GiB
Result logdir: /Users/aydarakhmetzyanov/ray_results/server_tune_2019_November_17_06_26PM
Number of trials: 6 ({'RUNNING': 6})
RUNNING trials:
 - train_DPDQN_0_batch_size=16,num_action_samples_final=11:	RUNNING, [1 CPUs, 0 GPUs], [pid=53574], 4938 s, 12 iter
 - train_DPDQN_1_batch_size=32,num_action_samples_final=11:

Result for train_DPDQN_2_batch_size=16,num_action_samples_final=13:
  date: 2019-11-17_20-00-45
  done: false
  experiment_id: c3527cba03e249f8a560644386cc4f12
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 15
  mean_reward: -114.51578811619471
  node_ip: 192.168.0.11
  pid: 53575
  time_since_restore: 5655.542188167572
  time_this_iter_s: 378.464231967926
  time_total_s: 5655.542188167572
  timestamp: 1574010045
  timesteps_since_restore: 0
  training_iteration: 14
  trial_id: 9dae5818
  
== Status ==
Using FIFO scheduling algorithm.
Resources requested: 6/12 CPUs, 0/0 GPUs, 0.0/3.52 GiB heap, 0.0/1.17 GiB objects
Memory usage on this node: 10.7/16.0 GiB
Result logdir: /Users/aydarakhmetzyanov/ray_results/server_tune_2019_November_17_06_26PM
Number of trials: 6 ({'RUNNING': 6})
RUNNING trials:
 - train_DPDQN_0_batch_size=16,num_action_samples_final=11:	RUNNING, [1 CPUs, 0 GPUs], [pid=53574], 5315 s, 13 iter
 - train_DPDQN_1_batch_size=32,num_action_samples_final=11:	

Result for train_DPDQN_2_batch_size=16,num_action_samples_final=13:
  date: 2019-11-17_20-07-50
  done: false
  experiment_id: c3527cba03e249f8a560644386cc4f12
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 16
  mean_reward: -66.63863877775073
  node_ip: 192.168.0.11
  pid: 53575
  time_since_restore: 6080.788197278976
  time_this_iter_s: 425.2460091114044
  time_total_s: 6080.788197278976
  timestamp: 1574010470
  timesteps_since_restore: 0
  training_iteration: 15
  trial_id: 9dae5818
  
== Status ==
Using FIFO scheduling algorithm.
Resources requested: 6/12 CPUs, 0/0 GPUs, 0.0/3.52 GiB heap, 0.0/1.17 GiB objects
Memory usage on this node: 10.7/16.0 GiB
Result logdir: /Users/aydarakhmetzyanov/ray_results/server_tune_2019_November_17_06_26PM
Number of trials: 6 ({'RUNNING': 6})
RUNNING trials:
 - train_DPDQN_0_batch_size=16,num_action_samples_final=11:	RUNNING, [1 CPUs, 0 GPUs], [pid=53574], 5688 s, 14 iter
 - train_DPDQN_1_batch_size=32,num_action_samples_final=11:	

Result for train_DPDQN_1_batch_size=32,num_action_samples_final=11:
  date: 2019-11-17_20-17-40
  done: false
  experiment_id: dfc68ade8222420897740de41e41206d
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 10
  mean_reward: -82.20203273552879
  node_ip: 192.168.0.11
  pid: 53570
  time_since_restore: 6670.59841299057
  time_this_iter_s: 741.7851419448853
  time_total_s: 6670.59841299057
  timestamp: 1574011060
  timesteps_since_restore: 0
  training_iteration: 9
  trial_id: 9dae1952
  
== Status ==
Using FIFO scheduling algorithm.
Resources requested: 6/12 CPUs, 0/0 GPUs, 0.0/3.52 GiB heap, 0.0/1.17 GiB objects
Memory usage on this node: 10.7/16.0 GiB
Result logdir: /Users/aydarakhmetzyanov/ray_results/server_tune_2019_November_17_06_26PM
Number of trials: 6 ({'RUNNING': 6})
RUNNING trials:
 - train_DPDQN_0_batch_size=16,num_action_samples_final=11:	RUNNING, [1 CPUs, 0 GPUs], [pid=53574], 6486 s, 16 iter
 - train_DPDQN_1_batch_size=32,num_action_samples_final=11:	RUN

Result for train_DPDQN_2_batch_size=16,num_action_samples_final=13:
  date: 2019-11-17_20-27-25
  done: false
  experiment_id: c3527cba03e249f8a560644386cc4f12
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 19
  mean_reward: -107.93125556787977
  node_ip: 192.168.0.11
  pid: 53575
  time_since_restore: 7255.793787956238
  time_this_iter_s: 382.1369700431824
  time_total_s: 7255.793787956238
  timestamp: 1574011645
  timesteps_since_restore: 0
  training_iteration: 18
  trial_id: 9dae5818
  
Result for train_DPDQN_1_batch_size=32,num_action_samples_final=11:
  date: 2019-11-17_20-29-10
  done: false
  experiment_id: dfc68ade8222420897740de41e41206d
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 11
  mean_reward: -118.77482131623243
  node_ip: 192.168.0.11
  pid: 53570
  time_since_restore: 7360.8201541900635
  time_this_iter_s: 690.2217411994934
  time_total_s: 7360.8201541900635
  timestamp: 1574011750
  timesteps_since_restore: 0
  training_iteratio

Result for train_DPDQN_4_batch_size=16,num_action_samples_final=16:
  date: 2019-11-17_20-36-58
  done: false
  experiment_id: 69ea6546e9db453c92ac8344ebf895c5
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 20
  mean_reward: -110.05142778696377
  node_ip: 192.168.0.11
  pid: 53572
  time_since_restore: 7829.0018627643585
  time_this_iter_s: 429.49467277526855
  time_total_s: 7829.0018627643585
  timestamp: 1574012218
  timesteps_since_restore: 0
  training_iteration: 19
  trial_id: 9daeb2b8
  
== Status ==
Using FIFO scheduling algorithm.
Resources requested: 6/12 CPUs, 0/0 GPUs, 0.0/3.52 GiB heap, 0.0/1.17 GiB objects
Memory usage on this node: 10.7/16.0 GiB
Result logdir: /Users/aydarakhmetzyanov/ray_results/server_tune_2019_November_17_06_26PM
Number of trials: 6 ({'RUNNING': 6})
RUNNING trials:
 - train_DPDQN_0_batch_size=16,num_action_samples_final=11:	RUNNING, [1 CPUs, 0 GPUs], [pid=53574], 7641 s, 19 iter
 - train_DPDQN_1_batch_size=32,num_action_samples_final=

Result for train_DPDQN_3_batch_size=32,num_action_samples_final=13:
  date: 2019-11-17_20-44-28
  done: false
  experiment_id: 81be98b074f94c8ba21d466ff110ffc7
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 12
  mean_reward: -118.3814042859343
  node_ip: 192.168.0.11
  pid: 53578
  time_since_restore: 8278.87091088295
  time_this_iter_s: 778.5927879810333
  time_total_s: 8278.87091088295
  timestamp: 1574012668
  timesteps_since_restore: 0
  training_iteration: 11
  trial_id: 9dae8676
  
== Status ==
Using FIFO scheduling algorithm.
Resources requested: 6/12 CPUs, 0/0 GPUs, 0.0/3.52 GiB heap, 0.0/1.17 GiB objects
Memory usage on this node: 10.7/16.0 GiB
Result logdir: /Users/aydarakhmetzyanov/ray_results/server_tune_2019_November_17_06_26PM
Number of trials: 6 ({'RUNNING': 6})
RUNNING trials:
 - train_DPDQN_0_batch_size=16,num_action_samples_final=11:	RUNNING, [1 CPUs, 0 GPUs], [pid=53574], 8050 s, 20 iter
 - train_DPDQN_1_batch_size=32,num_action_samples_final=11:	RU

Result for train_DPDQN_5_batch_size=32,num_action_samples_final=16:
  date: 2019-11-17_20-54-58
  done: false
  experiment_id: 4ea8c7a406a34f1aacfa0aad3980162e
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 13
  mean_reward: -112.2699987081166
  node_ip: 192.168.0.11
  pid: 53571
  time_since_restore: 8909.018280982971
  time_this_iter_s: 732.8160181045532
  time_total_s: 8909.018280982971
  timestamp: 1574013298
  timesteps_since_restore: 0
  training_iteration: 12
  trial_id: 9daee11e
  
== Status ==
Using FIFO scheduling algorithm.
Resources requested: 6/12 CPUs, 0/0 GPUs, 0.0/3.52 GiB heap, 0.0/1.17 GiB objects
Memory usage on this node: 10.7/16.0 GiB
Result logdir: /Users/aydarakhmetzyanov/ray_results/server_tune_2019_November_17_06_26PM
Number of trials: 6 ({'RUNNING': 6})
RUNNING trials:
 - train_DPDQN_0_batch_size=16,num_action_samples_final=11:	RUNNING, [1 CPUs, 0 GPUs], [pid=53574], 8857 s, 22 iter
 - train_DPDQN_1_batch_size=32,num_action_samples_final=11:	

Result for train_DPDQN_4_batch_size=16,num_action_samples_final=16:
  date: 2019-11-17_21-02-53
  done: false
  experiment_id: 69ea6546e9db453c92ac8344ebf895c5
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 24
  mean_reward: -111.5090377778365
  node_ip: 192.168.0.11
  pid: 53572
  time_since_restore: 9384.058041095734
  time_this_iter_s: 391.48955821990967
  time_total_s: 9384.058041095734
  timestamp: 1574013773
  timesteps_since_restore: 0
  training_iteration: 23
  trial_id: 9daeb2b8
  
== Status ==
Using FIFO scheduling algorithm.
Resources requested: 6/12 CPUs, 0/0 GPUs, 0.0/3.52 GiB heap, 0.0/1.17 GiB objects
Memory usage on this node: 10.7/16.0 GiB
Result logdir: /Users/aydarakhmetzyanov/ray_results/server_tune_2019_November_17_06_26PM
Number of trials: 6 ({'RUNNING': 6})
RUNNING trials:
 - train_DPDQN_0_batch_size=16,num_action_samples_final=11:	RUNNING, [1 CPUs, 0 GPUs], [pid=53574], 9294 s, 23 iter
 - train_DPDQN_1_batch_size=32,num_action_samples_final=11:

Result for train_DPDQN_3_batch_size=32,num_action_samples_final=13:
  date: 2019-11-17_21-09-56
  done: false
  experiment_id: 81be98b074f94c8ba21d466ff110ffc7
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 14
  mean_reward: -105.49563287712856
  node_ip: 192.168.0.11
  pid: 53578
  time_since_restore: 9806.898713111877
  time_this_iter_s: 784.4405109882355
  time_total_s: 9806.898713111877
  timestamp: 1574014196
  timesteps_since_restore: 0
  training_iteration: 13
  trial_id: 9dae8676
  
Result for train_DPDQN_0_batch_size=16,num_action_samples_final=11:
  date: 2019-11-17_21-14-30
  done: false
  experiment_id: 37b314b1c99048628be50f56fe9079f5
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 26
  mean_reward: -122.04306381962179
  node_ip: 192.168.0.11
  pid: 53574
  time_since_restore: 10080.737330913544
  time_this_iter_s: 396.34431529045105
  time_total_s: 10080.737330913544
  timestamp: 1574014470
  timesteps_since_restore: 0
  training_iterati

Result for train_DPDQN_3_batch_size=32,num_action_samples_final=13:
  date: 2019-11-17_21-22-28
  done: false
  experiment_id: 81be98b074f94c8ba21d466ff110ffc7
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 15
  mean_reward: -120.21566672576235
  node_ip: 192.168.0.11
  pid: 53578
  time_since_restore: 10558.79209804535
  time_this_iter_s: 751.8933849334717
  time_total_s: 10558.79209804535
  timestamp: 1574014948
  timesteps_since_restore: 0
  training_iteration: 14
  trial_id: 9dae8676
  
== Status ==
Using FIFO scheduling algorithm.
Resources requested: 6/12 CPUs, 0/0 GPUs, 0.0/3.52 GiB heap, 0.0/1.17 GiB objects
Memory usage on this node: 10.5/16.0 GiB
Result logdir: /Users/aydarakhmetzyanov/ray_results/server_tune_2019_November_17_06_26PM
Number of trials: 6 ({'RUNNING': 6})
RUNNING trials:
 - train_DPDQN_0_batch_size=16,num_action_samples_final=11:	RUNNING, [1 CPUs, 0 GPUs], [pid=53574], 10487 s, 26 iter
 - train_DPDQN_1_batch_size=32,num_action_samples_final=11

Result for train_DPDQN_2_batch_size=16,num_action_samples_final=13:
  date: 2019-11-17_21-31-27
  done: false
  experiment_id: c3527cba03e249f8a560644386cc4f12
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 28
  mean_reward: 189.8968415144087
  node_ip: 192.168.0.11
  pid: 53575
  time_since_restore: 11097.577762126923
  time_this_iter_s: 433.9646170139313
  time_total_s: 11097.577762126923
  timestamp: 1574015487
  timesteps_since_restore: 0
  training_iteration: 27
  trial_id: 9dae5818
  
== Status ==
Using FIFO scheduling algorithm.
Resources requested: 6/12 CPUs, 0/0 GPUs, 0.0/3.52 GiB heap, 0.0/1.17 GiB objects
Memory usage on this node: 10.5/16.0 GiB
Result logdir: /Users/aydarakhmetzyanov/ray_results/server_tune_2019_November_17_06_26PM
Number of trials: 6 ({'RUNNING': 6})
RUNNING trials:
 - train_DPDQN_0_batch_size=16,num_action_samples_final=11:	RUNNING, [1 CPUs, 0 GPUs], [pid=53574], 10908 s, 27 iter
 - train_DPDQN_1_batch_size=32,num_action_samples_final=11

Result for train_DPDQN_0_batch_size=16,num_action_samples_final=11:
  date: 2019-11-17_21-42-56
  done: false
  experiment_id: 37b314b1c99048628be50f56fe9079f5
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 30
  mean_reward: -53.309128873751625
  node_ip: 192.168.0.11
  pid: 53574
  time_since_restore: 11786.822028636932
  time_this_iter_s: 442.9969148635864
  time_total_s: 11786.822028636932
  timestamp: 1574016176
  timesteps_since_restore: 0
  training_iteration: 29
  trial_id: 9daba08c
  
== Status ==
Using FIFO scheduling algorithm.
Resources requested: 6/12 CPUs, 0/0 GPUs, 0.0/3.52 GiB heap, 0.0/1.17 GiB objects
Memory usage on this node: 10.6/16.0 GiB
Result logdir: /Users/aydarakhmetzyanov/ray_results/server_tune_2019_November_17_06_26PM
Number of trials: 6 ({'RUNNING': 6})
RUNNING trials:
 - train_DPDQN_0_batch_size=16,num_action_samples_final=11:	RUNNING, [1 CPUs, 0 GPUs], [pid=53574], 11786 s, 29 iter
 - train_DPDQN_1_batch_size=32,num_action_samples_final=

Result for train_DPDQN_4_batch_size=16,num_action_samples_final=16:
  date: 2019-11-17_21-50-38
  done: false
  experiment_id: 69ea6546e9db453c92ac8344ebf895c5
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 31
  mean_reward: -109.44706076151029
  node_ip: 192.168.0.11
  pid: 53572
  time_since_restore: 12248.713082075119
  time_this_iter_s: 401.94311809539795
  time_total_s: 12248.713082075119
  timestamp: 1574016638
  timesteps_since_restore: 0
  training_iteration: 30
  trial_id: 9daeb2b8
  
== Status ==
Using FIFO scheduling algorithm.
Resources requested: 6/12 CPUs, 0/0 GPUs, 0.0/3.52 GiB heap, 0.0/1.17 GiB objects
Memory usage on this node: 10.5/16.0 GiB
Result logdir: /Users/aydarakhmetzyanov/ray_results/server_tune_2019_November_17_06_26PM
Number of trials: 6 ({'RUNNING': 6})
RUNNING trials:
 - train_DPDQN_0_batch_size=16,num_action_samples_final=11:	RUNNING, [1 CPUs, 0 GPUs], [pid=53574], 12235 s, 30 iter
 - train_DPDQN_1_batch_size=32,num_action_samples_final

Result for train_DPDQN_2_batch_size=16,num_action_samples_final=13:
  date: 2019-11-17_22-00-30
  done: false
  experiment_id: c3527cba03e249f8a560644386cc4f12
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 32
  mean_reward: 2.971373935942514
  node_ip: 192.168.0.11
  pid: 53575
  time_since_restore: 12840.547900915146
  time_this_iter_s: 420.8556978702545
  time_total_s: 12840.547900915146
  timestamp: 1574017230
  timesteps_since_restore: 0
  training_iteration: 31
  trial_id: 9dae5818
  
== Status ==
Using FIFO scheduling algorithm.
Resources requested: 6/12 CPUs, 0/0 GPUs, 0.0/3.52 GiB heap, 0.0/1.17 GiB objects
Memory usage on this node: 10.5/16.0 GiB
Result logdir: /Users/aydarakhmetzyanov/ray_results/server_tune_2019_November_17_06_26PM
Number of trials: 6 ({'RUNNING': 6})
RUNNING trials:
 - train_DPDQN_0_batch_size=16,num_action_samples_final=11:	RUNNING, [1 CPUs, 0 GPUs], [pid=53574], 12680 s, 31 iter
 - train_DPDQN_1_batch_size=32,num_action_samples_final=11

Result for train_DPDQN_4_batch_size=16,num_action_samples_final=16:
  date: 2019-11-17_22-10-52
  done: false
  experiment_id: 69ea6546e9db453c92ac8344ebf895c5
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 34
  mean_reward: -116.29758926103223
  node_ip: 192.168.0.11
  pid: 53572
  time_since_restore: 13462.666501760483
  time_this_iter_s: 406.5158808231354
  time_total_s: 13462.666501760483
  timestamp: 1574017852
  timesteps_since_restore: 0
  training_iteration: 33
  trial_id: 9daeb2b8
  
== Status ==
Using FIFO scheduling algorithm.
Resources requested: 6/12 CPUs, 0/0 GPUs, 0.0/3.52 GiB heap, 0.0/1.17 GiB objects
Memory usage on this node: 10.3/16.0 GiB
Result logdir: /Users/aydarakhmetzyanov/ray_results/server_tune_2019_November_17_06_26PM
Number of trials: 6 ({'RUNNING': 6})
RUNNING trials:
 - train_DPDQN_0_batch_size=16,num_action_samples_final=11:	RUNNING, [1 CPUs, 0 GPUs], [pid=53574], 13124 s, 32 iter
 - train_DPDQN_1_batch_size=32,num_action_samples_final=

Result for train_DPDQN_1_batch_size=32,num_action_samples_final=11:
  date: 2019-11-17_22-18-57
  done: false
  experiment_id: dfc68ade8222420897740de41e41206d
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 20
  mean_reward: -111.68853227417854
  node_ip: 192.168.0.11
  pid: 53570
  time_since_restore: 13948.26812696457
  time_this_iter_s: 728.0900919437408
  time_total_s: 13948.26812696457
  timestamp: 1574018337
  timesteps_since_restore: 0
  training_iteration: 19
  trial_id: 9dae1952
  
== Status ==
Using FIFO scheduling algorithm.
Resources requested: 6/12 CPUs, 0/0 GPUs, 0.0/3.52 GiB heap, 0.0/1.17 GiB objects
Memory usage on this node: 10.4/16.0 GiB
Result logdir: /Users/aydarakhmetzyanov/ray_results/server_tune_2019_November_17_06_26PM
Number of trials: 6 ({'RUNNING': 6})
RUNNING trials:
 - train_DPDQN_0_batch_size=16,num_action_samples_final=11:	RUNNING, [1 CPUs, 0 GPUs], [pid=53574], 13568 s, 33 iter
 - train_DPDQN_1_batch_size=32,num_action_samples_final=11

Result for train_DPDQN_2_batch_size=16,num_action_samples_final=13:
  date: 2019-11-17_22-28-17
  done: false
  experiment_id: c3527cba03e249f8a560644386cc4f12
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 36
  mean_reward: -11.957715365628417
  node_ip: 192.168.0.11
  pid: 53575
  time_since_restore: 14507.781413078308
  time_this_iter_s: 418.2619240283966
  time_total_s: 14507.781413078308
  timestamp: 1574018897
  timesteps_since_restore: 0
  training_iteration: 35
  trial_id: 9dae5818
  
== Status ==
Using FIFO scheduling algorithm.
Resources requested: 6/12 CPUs, 0/0 GPUs, 0.0/3.52 GiB heap, 0.0/1.17 GiB objects
Memory usage on this node: 10.4/16.0 GiB
Result logdir: /Users/aydarakhmetzyanov/ray_results/server_tune_2019_November_17_06_26PM
Number of trials: 6 ({'RUNNING': 6})
RUNNING trials:
 - train_DPDQN_0_batch_size=16,num_action_samples_final=11:	RUNNING, [1 CPUs, 0 GPUs], [pid=53574], 14393 s, 35 iter
 - train_DPDQN_1_batch_size=32,num_action_samples_final=

Result for train_DPDQN_4_batch_size=16,num_action_samples_final=16:
  date: 2019-11-17_22-38-24
  done: false
  experiment_id: 69ea6546e9db453c92ac8344ebf895c5
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 38
  mean_reward: -191.04137955516788
  node_ip: 192.168.0.11
  pid: 53572
  time_since_restore: 15114.986478090286
  time_this_iter_s: 428.4502902030945
  time_total_s: 15114.986478090286
  timestamp: 1574019504
  timesteps_since_restore: 0
  training_iteration: 37
  trial_id: 9daeb2b8
  
== Status ==
Using FIFO scheduling algorithm.
Resources requested: 6/12 CPUs, 0/0 GPUs, 0.0/3.52 GiB heap, 0.0/1.17 GiB objects
Memory usage on this node: 10.4/16.0 GiB
Result logdir: /Users/aydarakhmetzyanov/ray_results/server_tune_2019_November_17_06_26PM
Number of trials: 6 ({'RUNNING': 6})
RUNNING trials:
 - train_DPDQN_0_batch_size=16,num_action_samples_final=11:	RUNNING, [1 CPUs, 0 GPUs], [pid=53574], 14804 s, 36 iter
 - train_DPDQN_1_batch_size=32,num_action_samples_final=

Result for train_DPDQN_0_batch_size=16,num_action_samples_final=11:
  date: 2019-11-17_22-46-36
  done: false
  experiment_id: 37b314b1c99048628be50f56fe9079f5
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 39
  mean_reward: -100.08045874648546
  node_ip: 192.168.0.11
  pid: 53574
  time_since_restore: 15606.52949500084
  time_this_iter_s: 399.42820501327515
  time_total_s: 15606.52949500084
  timestamp: 1574019996
  timesteps_since_restore: 0
  training_iteration: 38
  trial_id: 9daba08c
  
== Status ==
Using FIFO scheduling algorithm.
Resources requested: 6/12 CPUs, 0/0 GPUs, 0.0/3.52 GiB heap, 0.0/1.17 GiB objects
Memory usage on this node: 10.4/16.0 GiB
Result logdir: /Users/aydarakhmetzyanov/ray_results/server_tune_2019_November_17_06_26PM
Number of trials: 6 ({'RUNNING': 6})
RUNNING trials:
 - train_DPDQN_0_batch_size=16,num_action_samples_final=11:	RUNNING, [1 CPUs, 0 GPUs], [pid=53574], 15606 s, 38 iter
 - train_DPDQN_1_batch_size=32,num_action_samples_final=1

Result for train_DPDQN_1_batch_size=32,num_action_samples_final=11:
  date: 2019-11-17_22-55-05
  done: false
  experiment_id: dfc68ade8222420897740de41e41206d
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 23
  mean_reward: -97.7077242124211
  node_ip: 192.168.0.11
  pid: 53570
  time_since_restore: 16115.600855112076
  time_this_iter_s: 714.146420955658
  time_total_s: 16115.600855112076
  timestamp: 1574020505
  timesteps_since_restore: 0
  training_iteration: 22
  trial_id: 9dae1952
  
== Status ==
Using FIFO scheduling algorithm.
Resources requested: 6/12 CPUs, 0/0 GPUs, 0.0/3.52 GiB heap, 0.0/1.17 GiB objects
Memory usage on this node: 10.5/16.0 GiB
Result logdir: /Users/aydarakhmetzyanov/ray_results/server_tune_2019_November_17_06_26PM
Number of trials: 6 ({'RUNNING': 6})
RUNNING trials:
 - train_DPDQN_0_batch_size=16,num_action_samples_final=11:	RUNNING, [1 CPUs, 0 GPUs], [pid=53574], 16017 s, 39 iter
 - train_DPDQN_1_batch_size=32,num_action_samples_final=11:

Result for train_DPDQN_2_batch_size=16,num_action_samples_final=13:
  date: 2019-11-17_23-04-35
  done: false
  experiment_id: c3527cba03e249f8a560644386cc4f12
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 41
  mean_reward: -109.68424556692385
  node_ip: 192.168.0.11
  pid: 53575
  time_since_restore: 16686.11230325699
  time_this_iter_s: 431.6360421180725
  time_total_s: 16686.11230325699
  timestamp: 1574021075
  timesteps_since_restore: 0
  training_iteration: 40
  trial_id: 9dae5818
  
Result for train_DPDQN_4_batch_size=16,num_action_samples_final=16:
  date: 2019-11-17_23-05-12
  done: false
  experiment_id: 69ea6546e9db453c92ac8344ebf895c5
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 42
  mean_reward: -89.88369104042802
  node_ip: 192.168.0.11
  pid: 53572
  time_since_restore: 16722.892093896866
  time_this_iter_s: 398.71823287010193
  time_total_s: 16722.892093896866
  timestamp: 1574021112
  timesteps_since_restore: 0
  training_iteratio

Result for train_DPDQN_5_batch_size=32,num_action_samples_final=16:
  date: 2019-11-17_23-14-08
  done: false
  experiment_id: 4ea8c7a406a34f1aacfa0aad3980162e
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 24
  mean_reward: -70.86530035987157
  node_ip: 192.168.0.11
  pid: 53571
  time_since_restore: 17258.402416944504
  time_this_iter_s: 778.1533370018005
  time_total_s: 17258.402416944504
  timestamp: 1574021648
  timesteps_since_restore: 0
  training_iteration: 23
  trial_id: 9daee11e
  
== Status ==
Using FIFO scheduling algorithm.
Resources requested: 6/12 CPUs, 0/0 GPUs, 0.0/3.52 GiB heap, 0.0/1.17 GiB objects
Memory usage on this node: 10.5/16.0 GiB
Result logdir: /Users/aydarakhmetzyanov/ray_results/server_tune_2019_November_17_06_26PM
Number of trials: 6 ({'RUNNING': 6})
RUNNING trials:
 - train_DPDQN_0_batch_size=16,num_action_samples_final=11:	RUNNING, [1 CPUs, 0 GPUs], [pid=53574], 17189 s, 42 iter
 - train_DPDQN_1_batch_size=32,num_action_samples_final=1

Result for train_DPDQN_4_batch_size=16,num_action_samples_final=16:
  date: 2019-11-17_23-25-26
  done: false
  experiment_id: 69ea6546e9db453c92ac8344ebf895c5
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 45
  mean_reward: -123.90959526199119
  node_ip: 192.168.0.11
  pid: 53572
  time_since_restore: 17937.13147687912
  time_this_iter_s: 386.9623649120331
  time_total_s: 17937.13147687912
  timestamp: 1574022326
  timesteps_since_restore: 0
  training_iteration: 44
  trial_id: 9daeb2b8
  
== Status ==
Using FIFO scheduling algorithm.
Resources requested: 6/12 CPUs, 0/0 GPUs, 0.0/3.52 GiB heap, 0.0/1.17 GiB objects
Memory usage on this node: 10.4/16.0 GiB
Result logdir: /Users/aydarakhmetzyanov/ray_results/server_tune_2019_November_17_06_26PM
Number of trials: 6 ({'RUNNING': 6})
RUNNING trials:
 - train_DPDQN_0_batch_size=16,num_action_samples_final=11:	RUNNING, [1 CPUs, 0 GPUs], [pid=53574], 17595 s, 43 iter
 - train_DPDQN_1_batch_size=32,num_action_samples_final=11

Result for train_DPDQN_2_batch_size=16,num_action_samples_final=13:
  date: 2019-11-17_23-32-17
  done: false
  experiment_id: c3527cba03e249f8a560644386cc4f12
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 45
  mean_reward: -101.4098300809142
  node_ip: 192.168.0.11
  pid: 53575
  time_since_restore: 18347.734462976456
  time_this_iter_s: 409.7825527191162
  time_total_s: 18347.734462976456
  timestamp: 1574022737
  timesteps_since_restore: 0
  training_iteration: 44
  trial_id: 9dae5818
  
== Status ==
Using FIFO scheduling algorithm.
Resources requested: 6/12 CPUs, 0/0 GPUs, 0.0/3.52 GiB heap, 0.0/1.17 GiB objects
Memory usage on this node: 10.5/16.0 GiB
Result logdir: /Users/aydarakhmetzyanov/ray_results/server_tune_2019_November_17_06_26PM
Number of trials: 6 ({'RUNNING': 6})
RUNNING trials:
 - train_DPDQN_0_batch_size=16,num_action_samples_final=11:	RUNNING, [1 CPUs, 0 GPUs], [pid=53574], 17987 s, 44 iter
 - train_DPDQN_1_batch_size=32,num_action_samples_final=1

Result for train_DPDQN_3_batch_size=32,num_action_samples_final=13:
  date: 2019-11-17_23-42-55
  done: false
  experiment_id: 81be98b074f94c8ba21d466ff110ffc7
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 26
  mean_reward: -101.00369844635271
  node_ip: 192.168.0.11
  pid: 53578
  time_since_restore: 18985.728666067123
  time_this_iter_s: 783.7503552436829
  time_total_s: 18985.728666067123
  timestamp: 1574023375
  timesteps_since_restore: 0
  training_iteration: 25
  trial_id: 9dae8676
  
== Status ==
Using FIFO scheduling algorithm.
Resources requested: 6/12 CPUs, 0/0 GPUs, 0.0/3.52 GiB heap, 0.0/1.17 GiB objects
Memory usage on this node: 10.5/16.0 GiB
Result logdir: /Users/aydarakhmetzyanov/ray_results/server_tune_2019_November_17_06_26PM
Number of trials: 6 ({'RUNNING': 6})
RUNNING trials:
 - train_DPDQN_0_batch_size=16,num_action_samples_final=11:	RUNNING, [1 CPUs, 0 GPUs], [pid=53574], 18797 s, 46 iter
 - train_DPDQN_1_batch_size=32,num_action_samples_final=

Result for train_DPDQN_4_batch_size=16,num_action_samples_final=16:
  date: 2019-11-17_23-53-15
  done: false
  experiment_id: 69ea6546e9db453c92ac8344ebf895c5
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 49
  mean_reward: -102.58969692315246
  node_ip: 192.168.0.11
  pid: 53572
  time_since_restore: 19606.22441482544
  time_this_iter_s: 446.89792490005493
  time_total_s: 19606.22441482544
  timestamp: 1574023995
  timesteps_since_restore: 0
  training_iteration: 48
  trial_id: 9daeb2b8
  
== Status ==
Using FIFO scheduling algorithm.
Resources requested: 6/12 CPUs, 0/0 GPUs, 0.0/3.52 GiB heap, 0.0/1.17 GiB objects
Memory usage on this node: 10.4/16.0 GiB
Result logdir: /Users/aydarakhmetzyanov/ray_results/server_tune_2019_November_17_06_26PM
Number of trials: 6 ({'RUNNING': 6})
RUNNING trials:
 - train_DPDQN_0_batch_size=16,num_action_samples_final=11:	RUNNING, [1 CPUs, 0 GPUs], [pid=53574], 19217 s, 47 iter
 - train_DPDQN_1_batch_size=32,num_action_samples_final=1

Result for train_DPDQN_0_batch_size=16,num_action_samples_final=11:
  date: 2019-11-18_00-02-59
  done: false
  experiment_id: 37b314b1c99048628be50f56fe9079f5
  hostname: Aydars-MacBook-Pro.local
  iterations_since_restore: 50
  mean_reward: -98.34136560330653
  node_ip: 192.168.0.11
  pid: 53574
  time_since_restore: 20189.586211681366
  time_this_iter_s: 532.9112749099731
  time_total_s: 20189.586211681366
  timestamp: 1574024579
  timesteps_since_restore: 0
  training_iteration: 49
  trial_id: 9daba08c
  
== Status ==
Using FIFO scheduling algorithm.
Resources requested: 6/12 CPUs, 0/0 GPUs, 0.0/3.52 GiB heap, 0.0/1.17 GiB objects
Memory usage on this node: 9.8/16.0 GiB
Result logdir: /Users/aydarakhmetzyanov/ray_results/server_tune_2019_November_17_06_26PM
Number of trials: 6 ({'RUNNING': 6})
RUNNING trials:
 - train_DPDQN_0_batch_size=16,num_action_samples_final=11:	RUNNING, [1 CPUs, 0 GPUs], [pid=53574], 20189 s, 49 iter
 - train_DPDQN_1_batch_size=32,num_action_samples_final=11

RayletError: The Raylet died with this message: [RayletClient] Raylet connection closed.

In [4]:
#dfs=pickle.load(open("tune_results.p", "rb"))
ax = None  # This plots everything on the same plot
for d in dfs.values():
    ax = d.mean_accuracy.plot(ax=ax, legend=False)
    
#tensorboard --logdir ~/ray_results

NameError: name 'dfs' is not defined

In [None]:
#tensorboard  --host 0.0.0.0 —port 6006 --logdir ~/ray_results/server_tune_2019_November_14_10_10PM