#TODO: 

- Introduction
- Explain ray config

# RayTune Dashboard: 

When Ray is running on a (not portforwarded, dutch) server, accessing the Ray dashboard is done as follows. Given this example warning of Ray: 


`2020-11-04 17:00:40,912	INFO services.py:1166 -- View the Ray dashboard at http://127.0.0.1:8265`


The dashboard is accessed by opening a ssh tunnel to this port. This is done by running `ssh -NL 8265:localhost:8265 username@gpuserver.hhs.nl` in a terminal (e.g. powershell in Windows) on your computer. Once logged in you can acces the Dashboard in your webbrowser by going to `localhost:8265`.

In [1]:
from functools import partial
import numpy as np
import os
import torch
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as optim
from torch.utils.data import random_split
import torchvision
import torchvision.transforms as transforms
import ray
from ray import tune
from ray.tune import CLIReporter
from ray.tune.schedulers import ASHAScheduler


"""
Ray config explanation.
"""


# ray config
total_num_cpus = 40 # total number of cpus to use
total_num_gpus = 4 # total numbers of gpus to use

num_gpus = 0.25 # number of gpus per trial
num_workers = 2 # number workers & number of processes for dataloaders
num_cpus_for_driver = 1 # number of cpus for driver
num_cpus_per_worker = 1 # number of cpus per worker

# Each trial uses num_cpus_per_worker * num_workers + num_cpus_for_driver CPU's

ray.shutdown()
ray.init(num_cpus=total_num_cpus, num_gpus=total_num_gpus, dashboard_port=8265) # set to your preferred (non occupied) port to have a fixed port

2020-11-13 14:48:12,805	INFO services.py:1166 -- View the Ray dashboard at [1m[32mhttp://127.0.0.1:8266[39m[22m


{'node_ip_address': '145.52.252.20',
 'raylet_ip_address': '145.52.252.20',
 'redis_address': '145.52.252.20:6379',
 'object_store_address': '/tmp/ray/session_2020-11-13_14-48-12_253320_5246/sockets/plasma_store',
 'raylet_socket_name': '/tmp/ray/session_2020-11-13_14-48-12_253320_5246/sockets/raylet',
 'webui_url': '127.0.0.1:8266',
 'session_dir': '/tmp/ray/session_2020-11-13_14-48-12_253320_5246',
 'metrics_export_port': 51745}

In [2]:
n_cpus_per_trial = num_cpus_per_worker*num_workers + num_cpus_for_driver

print("Using %s CPUs per trial." % (n_cpus_per_trial))
print("We are able to run %s trials in parallel (disregarding gpu limitations)." % (total_num_cpus // n_cpus_per_trial))

Using 3 CPUs per trial.
We are able to run 13 trials in parallel (disregarding gpu limitations).


# Shared definitions between trials

In [3]:
def load_data(data_dir="./data"):
    """
    Loads and normalises CIFAR10 data.
    """
    transform = transforms.Compose([
        transforms.ToTensor(),
        transforms.Normalize((0.5, 0.5, 0.5), (0.5, 0.5, 0.5))
    ])
    
    trainset = torchvision.datasets.CIFAR10(
        root=data_dir, train=True, download=True, transform=transform)

    testset = torchvision.datasets.CIFAR10(
        root=data_dir, train=False, download=True, transform=transform)

    return trainset, testset


def test_accuracy(net, device="cpu"):
    """
    A function to compute the test accuracy
    """
    trainset, testset = load_data()

    testloader = torch.utils.data.DataLoader(
        testset, batch_size=4, shuffle=False, num_workers=num_workers)

    correct = 0
    total = 0
    with torch.no_grad():
        for data in testloader:
            images, labels = data
            images, labels = images.to(device), labels.to(device)
            outputs = net(images)
            _, predicted = torch.max(outputs.data, 1)
            total += labels.size(0)
            correct += (predicted == labels).sum().item()

    return correct / total

In [4]:
class Net(nn.Module):
    def __init__(self, l1=120, l2=84):
        super(Net, self).__init__()
        self.conv1 = nn.Conv2d(3, 6, 5)
        self.pool = nn.MaxPool2d(2, 2)
        self.conv2 = nn.Conv2d(6, 16, 5)
        self.fc1 = nn.Linear(16 * 5 * 5, l1)
        self.fc2 = nn.Linear(l1, l2)
        self.fc3 = nn.Linear(l2, 10)

    def forward(self, x):
        x = self.pool(F.relu(self.conv1(x)))
        x = self.pool(F.relu(self.conv2(x)))
        x = x.view(-1, 16 * 5 * 5)
        x = F.relu(self.fc1(x))
        x = F.relu(self.fc2(x))
        x = self.fc3(x)
        return x

In [5]:
def train_cifar(config, checkpoint_dir=None, data_dir=None):
    net = Net(config["l1"], config["l2"])

    device = "cpu"
    if torch.cuda.is_available():
        device = "cuda:0"
        if torch.cuda.device_count() > 1:
            net = nn.DataParallel(net)
    net.to(device)

    criterion = nn.CrossEntropyLoss()
    optimizer = optim.SGD(net.parameters(), lr=config["lr"], momentum=0.9)

    if checkpoint_dir:
        model_state, optimizer_state = torch.load(
            os.path.join(checkpoint_dir, "checkpoint"))
        net.load_state_dict(model_state)
        optimizer.load_state_dict(optimizer_state)

    trainset, testset = load_data(data_dir)

    test_abs = int(len(trainset) * 0.8)
    train_subset, val_subset = random_split(
        trainset, [test_abs, len(trainset) - test_abs])

    trainloader = torch.utils.data.DataLoader(
        train_subset,
        batch_size=int(config["batch_size"]),
        shuffle=True,
        num_workers=num_workers)
    valloader = torch.utils.data.DataLoader(
        val_subset,
        batch_size=int(config["batch_size"]),
        shuffle=True,
        num_workers=num_workers)

    for epoch in range(10):  # loop over the dataset multiple times
        running_loss = 0.0
        epoch_steps = 0
        for i, data in enumerate(trainloader, 0):
            # get the inputs; data is a list of [inputs, labels]
            inputs, labels = data
            inputs, labels = inputs.to(device), labels.to(device)

            # zero the parameter gradients
            optimizer.zero_grad()

            # forward + backward + optimize
            outputs = net(inputs)
            loss = criterion(outputs, labels)
            loss.backward()
            optimizer.step()

            # print statistics
            running_loss += loss.item()
            epoch_steps += 1
            if i % 2000 == 1999:  # print every 2000 mini-batches
                print("[%d, %5d] loss: %.3f" % (epoch + 1, i + 1,
                                                running_loss / epoch_steps))
                running_loss = 0.0

        # Validation loss
        val_loss = 0.0
        val_steps = 0
        total = 0
        correct = 0
        for i, data in enumerate(valloader, 0):
            with torch.no_grad():
                inputs, labels = data
                inputs, labels = inputs.to(device), labels.to(device)

                outputs = net(inputs)
                _, predicted = torch.max(outputs.data, 1)
                total += labels.size(0)
                correct += (predicted == labels).sum().item()

                loss = criterion(outputs, labels)
                val_loss += loss.cpu().numpy()
                val_steps += 1

        with tune.checkpoint_dir(epoch) as checkpoint_dir:
            path = os.path.join(checkpoint_dir, "checkpoint")
            torch.save((net.state_dict(), optimizer.state_dict()), path)

        tune.report(loss=(val_loss / val_steps), accuracy=correct / total)
    print("Finished Training")

In [6]:
# Main

In [7]:
def main(num_samples=10, max_num_epochs=10, gpus_per_trial=2):
    data_dir = os.path.abspath("./data")
    load_data(data_dir)
    
    config = {
        "num_gpus": num_gpus,
        "num_cpus_for_driver": num_cpus_for_driver,
        "num_cpus_per_worker": num_cpus_per_worker,
        "num_workers": num_workers,
        "l1": tune.sample_from(lambda _: 2 ** np.random.randint(2, 9)),
        "l2": tune.sample_from(lambda _: 2 ** np.random.randint(2, 9)),
        "lr": tune.loguniform(1e-4, 1e-1),
        "batch_size": tune.choice([2, 4, 8, 16]),
        
    }
    
    scheduler = ASHAScheduler(
        metric="loss",
        mode="min",
        max_t=max_num_epochs,
        grace_period=1,
        reduction_factor=2)
    
    reporter = CLIReporter(
        # parameter_columns=["l1", "l2", "lr", "batch_size"],
        metric_columns=["loss", "accuracy", "training_iteration"])
    
    result = tune.run(
        partial(train_cifar, data_dir=data_dir),
        resources_per_trial={"cpu": num_workers, "gpu": gpus_per_trial},
        config=config,
        num_samples=num_samples,
        scheduler=scheduler,
        progress_reporter=reporter)

    best_trial = result.get_best_trial("loss", "min", "last")
    print("Best trial config: {}".format(best_trial.config))
    print("Best trial final validation loss: {}".format(
        best_trial.last_result["loss"]))
    print("Best trial final validation accuracy: {}".format(
        best_trial.last_result["accuracy"]))

    best_trained_model = Net(best_trial.config["l1"], best_trial.config["l2"])
    device = "cpu"
    if torch.cuda.is_available():
        device = "cuda:0"
        if gpus_per_trial > 1:
            best_trained_model = nn.DataParallel(best_trained_model)
    best_trained_model.to(device)

    best_checkpoint_dir = best_trial.checkpoint.value
    model_state, optimizer_state = torch.load(os.path.join(
        best_checkpoint_dir, "checkpoint"))
    
    best_trained_model.load_state_dict(model_state)

    test_acc = test_accuracy(best_trained_model, device)
    print("Best trial test set accuracy: {}".format(test_acc))


if __name__ == "__main__":
    # manually determine gpus per trial to see what's efficient
    # num samples = total number of experiments to run
    main(num_samples=10, max_num_epochs=25, gpus_per_trial=0.25) 

Files already downloaded and verified
Files already downloaded and verified


2020-11-13 14:48:16,344	INFO registry.py:65 -- Detected unknown callable for trainable. Converting to class.


== Status ==
Memory usage on this node: 7.4/94.3 GiB
Using AsyncHyperBand: num_stopped=0
Bracket: Iter 16.000: None | Iter 8.000: None | Iter 4.000: None | Iter 2.000: None | Iter 1.000: None
Resources requested: 2/40 CPUs, 0.25/4 GPUs, 0.0/53.52 GiB heap, 0.0/18.46 GiB objects (0/1.0 accelerator_type:RTX)
Result logdir: /home/brian/ray_results/DEFAULT
Number of trials: 100 (99 PENDING, 1 RUNNING)
+---------------------+----------+-------+--------------+------+------+-------------+
| Trial name          | status   | loc   |   batch_size |   l1 |   l2 |          lr |
|---------------------+----------+-------+--------------+------+------+-------------|
| DEFAULT_e1931_00001 | PENDING  |       |           16 |   64 |  256 | 0.00120355  |
| DEFAULT_e1931_00002 | PENDING  |       |            2 |    4 |   32 | 0.000811232 |
| DEFAULT_e1931_00003 | PENDING  |       |           16 |  128 |    4 | 0.000676203 |
| DEFAULT_e1931_00004 | PENDING  |       |            8 |  256 |   64 | 0.00126235 

Result for DEFAULT_e1931_00010:
  accuracy: 0.2928
  date: 2020-11-13_14-48-52
  done: true
  experiment_id: 4d112dadcaae4b879669fa4e2ffb603e
  experiment_tag: 10_batch_size=16,l1=8,l2=64,lr=0.00085198
  hostname: gpuserver
  iterations_since_restore: 1
  loss: 1.8478457763671876
  node_ip: 145.52.252.20
  pid: 5390
  should_checkpoint: true
  time_since_restore: 34.40496563911438
  time_this_iter_s: 34.40496563911438
  time_total_s: 34.40496563911438
  timestamp: 1605275332
  timesteps_since_restore: 0
  training_iteration: 1
  trial_id: e1931_00010
  
Result for DEFAULT_e1931_00013:
  accuracy: 0.3499
  date: 2020-11-13_14-48-52
  done: true
  experiment_id: 9d559e7839174804afaeddf7a021b981
  experiment_tag: 13_batch_size=16,l1=128,l2=16,lr=0.0012665
  hostname: gpuserver
  iterations_since_restore: 1
  loss: 1.7425559041976928
  node_ip: 145.52.252.20
  pid: 5393
  should_checkpoint: true
  time_since_restore: 34.64450263977051
  time_this_iter_s: 34.64450263977051
  time_total_s: 3

Result for DEFAULT_e1931_00007:
  accuracy: 0.2667
  date: 2020-11-13_14-49-08
  done: true
  experiment_id: 338b12b3d7914e73b44793d77684f2e7
  experiment_tag: 7_batch_size=8,l1=8,l2=64,lr=0.014218
  hostname: gpuserver
  iterations_since_restore: 1
  loss: 1.9422798272132873
  node_ip: 145.52.252.20
  pid: 5373
  should_checkpoint: true
  time_since_restore: 50.50981545448303
  time_this_iter_s: 50.50981545448303
  time_total_s: 50.50981545448303
  timestamp: 1605275348
  timesteps_since_restore: 0
  training_iteration: 1
  trial_id: e1931_00007
  
Result for DEFAULT_e1931_00005:
  accuracy: 0.1311
  date: 2020-11-13_14-49-08
  done: true
  experiment_id: 24857da790144ee0b4c4876b8ce0bf7c
  experiment_tag: 5_batch_size=8,l1=16,l2=4,lr=0.018445
  hostname: gpuserver
  iterations_since_restore: 1
  loss: 2.2229816040992736
  node_ip: 145.52.252.20
  pid: 5466
  should_checkpoint: true
  time_since_restore: 50.71414804458618
  time_this_iter_s: 50.71414804458618
  time_total_s: 50.7141480

[2m[36m(pid=5384)[0m [1,  2000] loss: 2.343
[2m[36m(pid=5383)[0m [1,  2000] loss: 2.274
[2m[36m(pid=5461)[0m [1,  2000] loss: 2.301
[2m[36m(pid=5397)[0m [2,  4000] loss: 0.702
[2m[36m(pid=5401)[0m [1,  2000] loss: 2.197
[2m[36m(pid=5377)[0m [2,  4000] loss: 0.841
[2m[36m(pid=5386)[0m [1, 10000] loss: 0.468
[2m[36m(pid=5379)[0m [1, 10000] loss: 0.383
[2m[36m(pid=5460)[0m [1, 10000] loss: 0.465
Result for DEFAULT_e1931_00021:
  accuracy: 0.4655
  date: 2020-11-13_14-49-35
  done: false
  experiment_id: 871d1ed32e754ae28829db7dd67f82e0
  experiment_tag: 21_batch_size=16,l1=128,l2=128,lr=0.011074
  hostname: gpuserver
  iterations_since_restore: 1
  loss: 1.4852743953704834
  node_ip: 145.52.252.20
  pid: 5405
  should_checkpoint: true
  time_since_restore: 26.63757610321045
  time_this_iter_s: 26.63757610321045
  time_total_s: 26.63757610321045
  timestamp: 1605275375
  timesteps_since_restore: 0
  training_iteration: 1
  trial_id: e1931_00021
  
== Status ==
Me

[2m[36m(pid=5383)[0m [1,  4000] loss: 1.014
[2m[36m(pid=5384)[0m [1,  4000] loss: 1.167
[2m[36m(pid=5376)[0m [4,  2000] loss: 1.415
[2m[36m(pid=5395)[0m Files already downloaded and verified
Result for DEFAULT_e1931_00009:
  accuracy: 0.3787
  date: 2020-11-13_14-49-44
  done: true
  experiment_id: 3a9ce3d5022e45afac9a3460d6830e6d
  experiment_tag: 9_batch_size=8,l1=16,l2=8,lr=0.00098041
  hostname: gpuserver
  iterations_since_restore: 2
  loss: 1.6308152586460114
  node_ip: 145.52.252.20
  pid: 5377
  should_checkpoint: true
  time_since_restore: 86.75754928588867
  time_this_iter_s: 34.736759424209595
  time_total_s: 86.75754928588867
  timestamp: 1605275384
  timesteps_since_restore: 0
  training_iteration: 2
  trial_id: e1931_00009
  
[2m[36m(pid=5395)[0m Files already downloaded and verified
Result for DEFAULT_e1931_00014:
  accuracy: 0.0988
  date: 2020-11-13_14-49-45
  done: true
  experiment_id: 396d48e802214c9ea32800128ef0955d
  experiment_tag: 14_batch_size=4,

[2m[36m(pid=5386)[0m [1, 14000] loss: 0.334
[2m[36m(pid=5395)[0m [1,  2000] loss: 1.973
[2m[36m(pid=5379)[0m [1, 14000] loss: 0.258
[2m[36m(pid=5376)[0m [5,  2000] loss: 1.387
[2m[36m(pid=5451)[0m [1, 14000] loss: 0.239
[2m[36m(pid=5404)[0m Files already downloaded and verified
[2m[36m(pid=5388)[0m [1, 10000] loss: 0.461
[2m[36m(pid=5405)[0m [3,  2000] loss: 1.337
[2m[36m(pid=5372)[0m [1, 10000] loss: 0.468
[2m[36m(pid=5397)[0m [3,  4000] loss: 0.629
[2m[36m(pid=5404)[0m Files already downloaded and verified
[2m[36m(pid=5446)[0m [1,  2000] loss: 1.888
[2m[36m(pid=5382)[0m [1, 10000] loss: 0.304
[2m[36m(pid=5383)[0m [1,  8000] loss: 0.425
[2m[36m(pid=5464)[0m [1, 10000] loss: 0.455
[2m[36m(pid=5384)[0m [1,  8000] loss: 0.584
Result for DEFAULT_e1931_00000:
  accuracy: 0.4877
  date: 2020-11-13_14-50-07
  done: false
  experiment_id: 90eeb897d8a14f088e22e469ccd4fe05
  experiment_tag: 0_batch_size=16,l1=4,l2=32,lr=0.0048131
  hostname: gpuse

Result for DEFAULT_e1931_00019:
  accuracy: 0.0967
  date: 2020-11-13_14-50-15
  done: true
  experiment_id: 4c4f518cd38548f4acb930f08b9b7422
  experiment_tag: 19_batch_size=4,l1=256,l2=256,lr=0.06622
  hostname: gpuserver
  iterations_since_restore: 1
  loss: 2.3418810456752777
  node_ip: 145.52.252.20
  pid: 5372
  should_checkpoint: true
  time_since_restore: 80.62135577201843
  time_this_iter_s: 80.62135577201843
  time_total_s: 80.62135577201843
  timestamp: 1605275415
  timesteps_since_restore: 0
  training_iteration: 1
  trial_id: e1931_00019
  
Result for DEFAULT_e1931_00018:
  accuracy: 0.4382
  date: 2020-11-13_14-50-16
  done: false
  experiment_id: 81a285978dc843a69ab554bfbe1112f0
  experiment_tag: 18_batch_size=4,l1=128,l2=128,lr=0.0014119
  hostname: gpuserver
  iterations_since_restore: 1
  loss: 1.5314319157719611
  node_ip: 145.52.252.20
  pid: 5382
  should_checkpoint: true
  time_since_restore: 82.36318397521973
  time_this_iter_s: 82.36318397521973
  time_total_s: 8

[2m[36m(pid=5382)[0m [2,  2000] loss: 1.457
Result for DEFAULT_e1931_00026:
  accuracy: 0.4864
  date: 2020-11-13_14-50-29
  done: true
  experiment_id: f19a3d6ba1cf469da09d3d4963014c9c
  experiment_tag: 26_batch_size=16,l1=8,l2=16,lr=0.0040928
  hostname: gpuserver
  iterations_since_restore: 2
  loss: 1.4614098024368287
  node_ip: 145.52.252.20
  pid: 5446
  should_checkpoint: true
  time_since_restore: 43.880881786346436
  time_this_iter_s: 17.59655213356018
  time_total_s: 43.880881786346436
  timestamp: 1605275429
  timesteps_since_restore: 0
  training_iteration: 2
  trial_id: e1931_00026
  
[2m[36m(pid=5383)[0m [1, 12000] loss: 0.264
[2m[36m(pid=5384)[0m [1, 12000] loss: 0.389
[2m[36m(pid=5385)[0m [1,  6000] loss: 0.655
[2m[36m(pid=5464)[0m [1, 14000] loss: 0.307
[2m[36m(pid=5404)[0m [1,  4000] loss: 0.846
[2m[36m(pid=5386)[0m [1, 20000] loss: 0.234
[2m[36m(pid=5395)[0m [2,  2000] loss: 1.522
[2m[36m(pid=5375)[0m [1,  2000] loss: 2.100
[2m[36m(pid=53

[2m[36m(pid=5378)[0m [1,  2000] loss: 2.303
Result for DEFAULT_e1931_00012:
  accuracy: 0.1004
  date: 2020-11-13_14-50-51
  done: true
  experiment_id: 93d0da1d6b934f3ea40e8fbcd1308e5c
  experiment_tag: 12_batch_size=2,l1=64,l2=16,lr=0.033274
  hostname: gpuserver
  iterations_since_restore: 1
  loss: 2.344740637588501
  node_ip: 145.52.252.20
  pid: 5386
  should_checkpoint: true
  time_since_restore: 153.50937366485596
  time_this_iter_s: 153.50937366485596
  time_total_s: 153.50937366485596
  timestamp: 1605275451
  timesteps_since_restore: 0
  training_iteration: 1
  trial_id: e1931_00012
  
[2m[36m(pid=5381)[0m [1,  2000] loss: 2.337
[2m[36m(pid=5382)[0m [2,  6000] loss: 0.469
[2m[36m(pid=5383)[0m [1, 16000] loss: 0.196
Result for DEFAULT_e1931_00011:
  accuracy: 0.4069
  date: 2020-11-13_14-50-55
  done: false
  experiment_id: a202681bb5104d24b0e06fd228b5343e
  experiment_tag: 11_batch_size=2,l1=16,l2=64,lr=0.00023134
  hostname: gpuserver
  iterations_since_restore:

[2m[36m(pid=5397)[0m [5,  2000] loss: 1.066
[2m[36m(pid=5378)[0m [1,  4000] loss: 1.148
[2m[36m(pid=5398)[0m Files already downloaded and verified
[2m[36m(pid=5381)[0m [1,  4000] loss: 1.170
Result for DEFAULT_e1931_00027:
  accuracy: 0.2763
  date: 2020-11-13_14-51-04
  done: true
  experiment_id: 64ec20e5a1d044fea910e8a311fee2e0
  experiment_tag: 27_batch_size=4,l1=256,l2=4,lr=0.0076377
  hostname: gpuserver
  iterations_since_restore: 1
  loss: 1.8761511580228805
  node_ip: 145.52.252.20
  pid: 5385
  should_checkpoint: true
  time_since_restore: 77.366525888443
  time_this_iter_s: 77.366525888443
  time_total_s: 77.366525888443
  timestamp: 1605275464
  timesteps_since_restore: 0
  training_iteration: 1
  trial_id: e1931_00027
  
== Status ==
Memory usage on this node: 47.1/94.3 GiB
Using AsyncHyperBand: num_stopped=22
Bracket: Iter 16.000: None | Iter 8.000: -1.3700209853172303 | Iter 4.000: -1.3866280179023742 | Iter 2.000: -1.4646864913463593 | Iter 1.000: -1.8619984

Result for DEFAULT_e1931_00000:
  accuracy: 0.5058
  date: 2020-11-13_14-51-21
  done: false
  experiment_id: 90eeb897d8a14f088e22e469ccd4fe05
  experiment_tag: 0_batch_size=16,l1=4,l2=32,lr=0.0048131
  hostname: gpuserver
  iterations_since_restore: 9
  loss: 1.3642376733779906
  node_ip: 145.52.252.20
  pid: 5376
  should_checkpoint: true
  time_since_restore: 183.37632131576538
  time_this_iter_s: 19.02251625061035
  time_total_s: 183.37632131576538
  timestamp: 1605275481
  timesteps_since_restore: 0
  training_iteration: 9
  trial_id: e1931_00000
  
[2m[36m(pid=5392)[0m [1,  2000] loss: 2.014
[2m[36m(pid=5455)[0m [1,  2000] loss: 2.025
Result for DEFAULT_e1931_00004:
  accuracy: 0.5927
  date: 2020-11-13_14-51-24
  done: false
  experiment_id: d40c806e9bd146c7ab6985bbb3b9e8f2
  experiment_tag: 4_batch_size=8,l1=256,l2=64,lr=0.0012624
  hostname: gpuserver
  iterations_since_restore: 5
  loss: 1.158305498099327
  node_ip: 145.52.252.20
  pid: 5397
  should_checkpoint: true
  

[2m[36m(pid=5455)[0m [1,  4000] loss: 0.854
Result for DEFAULT_e1931_00022:
  accuracy: 0.4748
  date: 2020-11-13_14-51-35
  done: false
  experiment_id: 404de1e772c348bbbb13fbf8b98542c2
  experiment_tag: 22_batch_size=2,l1=256,l2=32,lr=0.00073597
  hostname: gpuserver
  iterations_since_restore: 1
  loss: 1.4393111108645797
  node_ip: 145.52.252.20
  pid: 5383
  should_checkpoint: true
  time_since_restore: 146.19572138786316
  time_this_iter_s: 146.19572138786316
  time_total_s: 146.19572138786316
  timestamp: 1605275495
  timesteps_since_restore: 0
  training_iteration: 1
  trial_id: e1931_00022
  
[2m[36m(pid=5397)[0m [6,  2000] loss: 0.987
[2m[36m(pid=5374)[0m Files already downloaded and verified
Result for DEFAULT_e1931_00020:
  accuracy: 0.0981
  date: 2020-11-13_14-51-36
  done: true
  experiment_id: a414f9ed4ef8407d8697df5bb0812786
  experiment_tag: 20_batch_size=2,l1=4,l2=256,lr=0.028648
  hostname: gpuserver
  iterations_since_restore: 1
  loss: 2.3256638288497924


[2m[36m(pid=7457)[0m Files already downloaded and verified
Result for DEFAULT_e1931_00036:
  accuracy: 0.4014
  date: 2020-11-13_14-51-45
  done: false
  experiment_id: 940e6a81aa124ac79f48a30cb7888abb
  experiment_tag: 36_batch_size=8,l1=16,l2=4,lr=0.0044137
  hostname: gpuserver
  iterations_since_restore: 1
  loss: 1.5968460078716278
  node_ip: 145.52.252.20
  pid: 5455
  should_checkpoint: true
  time_since_restore: 45.034544706344604
  time_this_iter_s: 45.034544706344604
  time_total_s: 45.034544706344604
  timestamp: 1605275505
  timesteps_since_restore: 0
  training_iteration: 1
  trial_id: e1931_00036
  
[2m[36m(pid=5397)[0m [6,  4000] loss: 0.497
[2m[36m(pid=7499)[0m Files already downloaded and verified
[2m[36m(pid=5383)[0m [2,  2000] loss: 1.442
[2m[36m(pid=7499)[0m Files already downloaded and verified
[2m[36m(pid=5378)[0m [1, 12000] loss: 0.321
[2m[36m(pid=5451)[0m [2,  8000] loss: 0.379
Result for DEFAULT_e1931_00032:
  accuracy: 0.1006
  date: 2020-

[2m[36m(pid=7667)[0m 2020-11-13 14:52:04,186	INFO (unknown file):0 -- gc.collect() freed 13 refs in 0.04820607230067253 seconds2020-11-13 14:52:04,365	INFO (unknown file):0 -- gc.collect() freed 272 refs in 0.22407881170511246 seconds



[2m[36m(pid=5389)[0m [1,  6000] loss: 0.611
[2m[36m(pid=5387)[0m [1, 10000] loss: 0.465
[2m[36m(pid=5379)[0m [2, 12000] loss: 0.253
[2m[36m(pid=5382)[0m [3,  6000] loss: 0.427
[2m[36m(pid=5397)[0m [7,  2000] loss: 0.904
[2m[36m(pid=5392)[0m [2,  4000] loss: 0.696
[2m[36m(pid=7457)[0m [1,  4000] loss: 1.150
[2m[36m(pid=5455)[0m [2,  4000] loss: 0.761
[2m[36m(pid=5383)[0m [2,  6000] loss: 0.469
[2m[36m(pid=7667)[0m Files already downloaded and verified
[2m[36m(pid=5378)[0m [1, 16000] loss: 0.221
[2m[36m(pid=7667)[0m Files already downloaded and verified
[2m[36m(pid=7603)[0m [1,  2000] loss: 2.298
Result for DEFAULT_e1931_00034:
  accuracy: 0.315
  date: 2020-11-13_14-52-13
  done: true
  experiment_id: 2cba9d591b0d464d8e397e038b44e754
  experiment_tag: 34_batch_size=8,l1=8,l2=128,lr=0.012123
  hostname: gpuserver
  iterations_since_restore: 2
  loss: 1.8348942591667174
  node_ip: 145.52.252.20
  pid: 5398
  should_checkpoint: true
  time_since_resto

2020-11-13 14:52:14,426	INFO (unknown file):0 -- gc.collect() freed 147 refs in 0.2398098148405552 seconds


[2m[36m(pid=5451)[0m [2, 12000] loss: 0.250
[2m[36m(pid=5374)[0m [1,  6000] loss: 0.586
[2m[36m(pid=7499)[0m [1,  4000] loss: 1.159
Result for DEFAULT_e1931_00033:
  accuracy: 0.1032
  date: 2020-11-13_14-52-15
  done: true
  experiment_id: 54b06bb70f8e4a5d8375d154468c0036
  experiment_tag: 33_batch_size=4,l1=4,l2=4,lr=0.041574
  hostname: gpuserver
  iterations_since_restore: 1
  loss: 2.3060657866477965
  node_ip: 145.52.252.20
  pid: 5387
  should_checkpoint: true
  time_since_restore: 83.120530128479
  time_this_iter_s: 83.120530128479
  time_total_s: 83.120530128479
  timestamp: 1605275535
  timesteps_since_restore: 0
  training_iteration: 1
  trial_id: e1931_00033
  
[2m[36m(pid=5389)[0m [1,  8000] loss: 0.455
[2m[36m(pid=5379)[0m [2, 14000] loss: 0.217
[2m[36m(pid=5382)[0m [3,  8000] loss: 0.315
Result for DEFAULT_e1931_00041:
  accuracy: 0.1514
  date: 2020-11-13_14-52-20
  done: true
  experiment_id: ecb025fe6726482f8df5cec1bcd85c6e
  experiment_tag: 41_batch

== Status ==
Memory usage on this node: 49.3/94.3 GiB
Using AsyncHyperBand: num_stopped=32
Bracket: Iter 16.000: None | Iter 8.000: -1.3700209853172303 | Iter 4.000: -1.3866280179023742 | Iter 2.000: -1.46796318025589 | Iter 1.000: -1.9422798272132873
Resources requested: 32/40 CPUs, 4.0/4 GPUs, 0.0/53.52 GiB heap, 0.0/18.46 GiB objects (0/1.0 accelerator_type:RTX)
Result logdir: /home/brian/ray_results/DEFAULT
Number of trials: 100 (51 PENDING, 16 RUNNING, 33 TERMINATED)
+---------------------+------------+--------------------+--------------+------+------+-------------+---------+------------+----------------------+
| Trial name          | status     | loc                |   batch_size |   l1 |   l2 |          lr |    loss |   accuracy |   training_iteration |
|---------------------+------------+--------------------+--------------+------+------+-------------+---------+------------+----------------------|
| DEFAULT_e1931_00049 | PENDING    |                    |            4 |  128 |   

[2m[36m(pid=5389)[0m [1, 12000] loss: 0.300
[2m[36m(pid=5379)[0m [2, 18000] loss: 0.162
[2m[36m(pid=7795)[0m [1,  2000] loss: 2.308
[2m[36m(pid=5397)[0m [8,  2000] loss: 0.826
[2m[36m(pid=7825)[0m [1,  2000] loss: 1.969
Result for DEFAULT_e1931_00045:
  accuracy: 0.1952
  date: 2020-11-13_14-52-43
  done: true
  experiment_id: 488c36dddabf4cc99cc4a34a04f8b853
  experiment_tag: 45_batch_size=16,l1=8,l2=16,lr=0.00055764
  hostname: gpuserver
  iterations_since_restore: 1
  loss: 2.189368620681763
  node_ip: 145.52.252.20
  pid: 7720
  should_checkpoint: true
  time_since_restore: 28.23756241798401
  time_this_iter_s: 28.23756241798401
  time_total_s: 28.23756241798401
  timestamp: 1605275563
  timesteps_since_restore: 0
  training_iteration: 1
  trial_id: e1931_00045
  
[2m[36m(pid=5392)[0m [3,  4000] loss: 0.631
[2m[36m(pid=5383)[0m [2, 12000] loss: 0.226
[2m[36m(pid=7603)[0m [1,  8000] loss: 0.488
[2m[36m(pid=7667)[0m [1,  6000] loss: 0.800
[2m[36m(pid=5451

[2m[36m(pid=5378)[0m [2,  2000] loss: 1.619
[2m[36m(pid=7829)[0m [1,  2000] loss: 2.304
[2m[36m(pid=7795)[0m [1,  6000] loss: 0.693
[2m[36m(pid=5392)[0m [4,  2000] loss: 1.148
Result for DEFAULT_e1931_00043:
  accuracy: 0.3547
  date: 2020-11-13_14-53-10
  done: false
  experiment_id: b67d5cfb7fe7487f910a5754534da3fb
  experiment_tag: 43_batch_size=4,l1=64,l2=8,lr=0.00045466
  hostname: gpuserver
  iterations_since_restore: 1
  loss: 1.7697985737085342
  node_ip: 145.52.252.20
  pid: 7603
  should_checkpoint: true
  time_since_restore: 78.69945621490479
  time_this_iter_s: 78.69945621490479
  time_total_s: 78.69945621490479
  timestamp: 1605275590
  timesteps_since_restore: 0
  training_iteration: 1
  trial_id: e1931_00043
  
== Status ==
Memory usage on this node: 49.4/94.3 GiB
Using AsyncHyperBand: num_stopped=33
Bracket: Iter 16.000: None | Iter 8.000: -1.2365930571973323 | Iter 4.000: -1.3866280179023742 | Iter 2.000: -1.46796318025589 | Iter 1.000: -1.8761511580228805


[2m[36m(pid=5392)[0m [4,  4000] loss: 0.587
[2m[36m(pid=5383)[0m [2, 18000] loss: 0.150
[2m[36m(pid=7603)[0m [2,  2000] loss: 1.715
[2m[36m(pid=5379)[0m [3,  2000] loss: 1.419
[2m[36m(pid=7667)[0m [1, 12000] loss: 0.400
[2m[36m(pid=7499)[0m [1, 16000] loss: 0.290
[2m[36m(pid=5374)[0m [1, 18000] loss: 0.175
[2m[36m(pid=7753)[0m [1, 10000] loss: 0.463
[2m[36m(pid=5382)[0m [4,  8000] loss: 0.296
[2m[36m(pid=7825)[0m [2,  4000] loss: 0.686
[2m[36m(pid=5397)[0m [9,  4000] loss: 0.410
[2m[36m(pid=5389)[0m [1, 20000] loss: 0.176
[2m[36m(pid=5378)[0m [2,  6000] loss: 0.521
[2m[36m(pid=7795)[0m [1, 10000] loss: 0.385
[2m[36m(pid=5451)[0m [3,  2000] loss: 1.453
Result for DEFAULT_e1931_00035:
  accuracy: 0.573
  date: 2020-11-13_14-53-31
  done: false
  experiment_id: 6e974a8676144a36aff7dc1bfff5d5ca
  experiment_tag: 35_batch_size=8,l1=256,l2=16,lr=0.0028954
  hostname: gpuserver
  iterations_since_restore: 4
  loss: 1.224947109913826
  node_ip: 145.

[2m[36m(pid=5374)[0m [1, 20000] loss: 0.158
Result for DEFAULT_e1931_00004:
  accuracy: 0.624
  date: 2020-11-13_14-53-38
  done: false
  experiment_id: d40c806e9bd146c7ab6985bbb3b9e8f2
  experiment_tag: 4_batch_size=8,l1=256,l2=64,lr=0.0012624
  hostname: gpuserver
  iterations_since_restore: 9
  loss: 1.1371944277822972
  node_ip: 145.52.252.20
  pid: 5397
  should_checkpoint: true
  time_since_restore: 320.95007824897766
  time_this_iter_s: 33.23570728302002
  time_total_s: 320.95007824897766
  timestamp: 1605275618
  timesteps_since_restore: 0
  training_iteration: 9
  trial_id: e1931_00004
  
[2m[36m(pid=7753)[0m [1, 12000] loss: 0.386
[2m[36m(pid=5382)[0m [4, 10000] loss: 0.236
[2m[36m(pid=5378)[0m [2,  8000] loss: 0.382
[2m[36m(pid=5451)[0m [3,  4000] loss: 0.731
[2m[36m(pid=7795)[0m [1, 12000] loss: 0.311
[2m[36m(pid=7829)[0m [1,  8000] loss: 0.560
[2m[36m(pid=5392)[0m [5,  2000] loss: 1.080
[2m[36m(pid=7603)[0m [2,  6000] loss: 0.519
Result for DEFAU

[2m[36m(pid=5378)[0m [2, 10000] loss: 0.307
[2m[36m(pid=5451)[0m [3,  6000] loss: 0.478
[2m[36m(pid=7795)[0m [1, 14000] loss: 0.265
[2m[36m(pid=7829)[0m [1, 10000] loss: 0.430
[2m[36m(pid=5392)[0m [5,  4000] loss: 0.546
Result for DEFAULT_e1931_00039:
  accuracy: 0.4243
  date: 2020-11-13_14-53-57
  done: false
  experiment_id: 7b64ec48082747aba769d71e62500020
  experiment_tag: 39_batch_size=2,l1=8,l2=128,lr=0.0012714
  hostname: gpuserver
  iterations_since_restore: 1
  loss: 1.565498595881462
  node_ip: 145.52.252.20
  pid: 5374
  should_checkpoint: true
  time_since_restore: 147.29898858070374
  time_this_iter_s: 147.29898858070374
  time_total_s: 147.29898858070374
  timestamp: 1605275637
  timesteps_since_restore: 0
  training_iteration: 1
  trial_id: e1931_00039
  
== Status ==
Memory usage on this node: 49.2/94.3 GiB
Using AsyncHyperBand: num_stopped=33
Bracket: Iter 16.000: None | Iter 8.000: -1.2365930571973323 | Iter 4.000: -1.2300583099722862 | Iter 2.000: -1.

Result for DEFAULT_e1931_00042:
  accuracy: 0.1024
  date: 2020-11-13_14-54-06
  done: true
  experiment_id: dc6edae1b76a458dbcbc95293a4b3388
  experiment_tag: 42_batch_size=2,l1=8,l2=4,lr=0.01402
  hostname: gpuserver
  iterations_since_restore: 1
  loss: 2.317559240818024
  node_ip: 145.52.252.20
  pid: 7499
  should_checkpoint: true
  time_since_restore: 144.99245190620422
  time_this_iter_s: 144.99245190620422
  time_total_s: 144.99245190620422
  timestamp: 1605275646
  timesteps_since_restore: 0
  training_iteration: 1
  trial_id: e1931_00042
  
[2m[36m(pid=5451)[0m [3,  8000] loss: 0.357
[2m[36m(pid=7795)[0m [1, 16000] loss: 0.235
Result for DEFAULT_e1931_00035:
  accuracy: 0.584
  date: 2020-11-13_14-54-07
  done: false
  experiment_id: 6e974a8676144a36aff7dc1bfff5d5ca
  experiment_tag: 35_batch_size=8,l1=256,l2=16,lr=0.0028954
  hostname: gpuserver
  iterations_since_restore: 5
  loss: 1.2439915586471557
  node_ip: 145.52.252.20
  pid: 5392
  should_checkpoint: true
  tim

[2m[36m(pid=5451)[0m [3, 10000] loss: 0.291
[2m[36m(pid=8438)[0m Files already downloaded and verified
[2m[36m(pid=7795)[0m [1, 18000] loss: 0.207
[2m[36m(pid=5392)[0m [6,  2000] loss: 1.003
[2m[36m(pid=8438)[0m Files already downloaded and verified
[2m[36m(pid=5374)[0m [2,  4000] loss: 0.765
[2m[36m(pid=7825)[0m [4,  2000] loss: 1.181
[2m[36m(pid=5389)[0m [2,  6000] loss: 0.595
[2m[36m(pid=5379)[0m [3, 12000] loss: 0.235
[2m[36m(pid=5382)[0m [5,  6000] loss: 0.370
[2m[36m(pid=8421)[0m Files already downloaded and verified
[2m[36m(pid=5383)[0m [3,  6000] loss: 0.415
[2m[36m(pid=8421)[0m Files already downloaded and verified
[2m[36m(pid=5378)[0m [2, 16000] loss: 0.182
[2m[36m(pid=7753)[0m [1, 20000] loss: 0.231
[2m[36m(pid=8424)[0m [1,  2000] loss: 1.948
[2m[36m(pid=8407)[0m [1,  2000] loss: 2.301
Result for DEFAULT_e1931_00044:
  accuracy: 0.0993
  date: 2020-11-13_14-54-31
  done: true
  experiment_id: 4c62a916da524beda398d8a56f177466

[2m[36m(pid=5451)[0m [3, 14000] loss: 0.206
[2m[36m(pid=8652)[0m Files already downloaded and verified
[2m[36m(pid=5389)[0m [2, 10000] loss: 0.353
[2m[36m(pid=5374)[0m [2,  8000] loss: 0.379
Result for DEFAULT_e1931_00046:
  accuracy: 0.0986
  date: 2020-11-13_14-54-46
  done: true
  experiment_id: 5d740899f11f410fb5eea764b2c9b997
  experiment_tag: 46_batch_size=2,l1=16,l2=8,lr=0.0087786
  hostname: gpuserver
  iterations_since_restore: 1
  loss: 2.319085218477249
  node_ip: 145.52.252.20
  pid: 7753
  should_checkpoint: true
  time_since_restore: 149.0549120903015
  time_this_iter_s: 149.0549120903015
  time_total_s: 149.0549120903015
  timestamp: 1605275686
  timesteps_since_restore: 0
  training_iteration: 1
  trial_id: e1931_00046
  
[2m[36m(pid=8438)[0m [1,  4000] loss: 1.157
[2m[36m(pid=5379)[0m [3, 16000] loss: 0.173
Result for DEFAULT_e1931_00053:
  accuracy: 0.365
  date: 2020-11-13_14-54-48
  done: false
  experiment_id: 265b3378216c4d74bc819fe2277d3dcf
  ex

[2m[36m(pid=5379)[0m [3, 18000] loss: 0.152
[2m[36m(pid=8438)[0m [1,  6000] loss: 0.769
[2m[36m(pid=8421)[0m [2,  2000] loss: 1.600
[2m[36m(pid=7795)[0m [2,  2000] loss: 1.810
[2m[36m(pid=5383)[0m [3, 12000] loss: 0.203
[2m[36m(pid=8424)[0m [2,  2000] loss: 1.682
[2m[36m(pid=8422)[0m [1,  4000] loss: 1.009
Result for DEFAULT_e1931_00053:
  accuracy: 0.4286
  date: 2020-11-13_14-55-06
  done: true
  experiment_id: 265b3378216c4d74bc819fe2277d3dcf
  experiment_tag: 53_batch_size=16,l1=8,l2=16,lr=0.011271
  hostname: gpuserver
  iterations_since_restore: 2
  loss: 1.6241672907829285
  node_ip: 145.52.252.20
  pid: 8421
  should_checkpoint: true
  time_since_restore: 46.20709538459778
  time_this_iter_s: 18.477535247802734
  time_total_s: 46.20709538459778
  timestamp: 1605275706
  timesteps_since_restore: 0
  training_iteration: 2
  trial_id: e1931_00053
  
== Status ==
Memory usage on this node: 49.2/94.3 GiB
Using AsyncHyperBand: num_stopped=40
Bracket: Iter 16.000:

Result for DEFAULT_e1931_00035:
  accuracy: 0.5904
  date: 2020-11-13_14-55-19
  done: false
  experiment_id: 6e974a8676144a36aff7dc1bfff5d5ca
  experiment_tag: 35_batch_size=8,l1=256,l2=16,lr=0.0028954
  hostname: gpuserver
  iterations_since_restore: 7
  loss: 1.234056989991665
  node_ip: 145.52.252.20
  pid: 5392
  should_checkpoint: true
  time_since_restore: 260.0631670951843
  time_this_iter_s: 35.97659420967102
  time_total_s: 260.0631670951843
  timestamp: 1605275719
  timesteps_since_restore: 0
  training_iteration: 7
  trial_id: e1931_00035
  
[2m[36m(pid=5378)[0m [3,  2000] loss: 1.416
[2m[36m(pid=5451)[0m [3, 20000] loss: 0.146
[2m[36m(pid=5374)[0m [2, 14000] loss: 0.221
[2m[36m(pid=5389)[0m [2, 16000] loss: 0.221
[2m[36m(pid=8750)[0m [1,  4000] loss: 1.114
[2m[36m(pid=8652)[0m [1,  6000] loss: 0.763
[2m[36m(pid=5382)[0m [6,  4000] loss: 0.523
[2m[36m(pid=8932)[0m Files already downloaded and verified
Result for DEFAULT_e1931_00051:
  accuracy: 0.402

2020-11-13 14:55:25,233	INFO (unknown file):0 -- gc.collect() freed 244 refs in 0.19218914955854416 seconds


[2m[36m(pid=8438)[0m [1, 10000] loss: 0.458
[2m[36m(pid=7795)[0m [2,  6000] loss: 0.612
[2m[36m(pid=8932)[0m Files already downloaded and verified
[2m[36m(pid=5383)[0m [3, 16000] loss: 0.153
[2m[36m(pid=7825)[0m [6,  2000] loss: 1.073
Result for DEFAULT_e1931_00011:
  accuracy: 0.5184
  date: 2020-11-13_14-55-29
  done: false
  experiment_id: a202681bb5104d24b0e06fd228b5343e
  experiment_tag: 11_batch_size=2,l1=16,l2=64,lr=0.00023134
  hostname: gpuserver
  iterations_since_restore: 3
  loss: 1.3226234712135048
  node_ip: 145.52.252.20
  pid: 5379
  should_checkpoint: true
  time_since_restore: 431.8637671470642
  time_this_iter_s: 136.85145139694214
  time_total_s: 431.8637671470642
  timestamp: 1605275729
  timesteps_since_restore: 0
  training_iteration: 3
  trial_id: e1931_00011
  
[2m[36m(pid=8851)[0m [1,  2000] loss: 2.120
== Status ==
Memory usage on this node: 48.2/94.3 GiB
Using AsyncHyperBand: num_stopped=42
Bracket: Iter 16.000: None | Iter 8.000: -1.236593

[2m[36m(pid=5383)[0m [3, 18000] loss: 0.136
[2m[36m(pid=7825)[0m [6,  4000] loss: 0.557
[2m[36m(pid=8932)[0m [1,  2000] loss: 1.921
[2m[36m(pid=5379)[0m [4,  2000] loss: 1.312
[2m[36m(pid=8851)[0m [1,  4000] loss: 1.009
[2m[36m(pid=5378)[0m [3,  6000] loss: 0.464
[2m[36m(pid=5392)[0m [8,  4000] loss: 0.464
[2m[36m(pid=5389)[0m [2, 20000] loss: 0.180
[2m[36m(pid=5374)[0m [2, 18000] loss: 0.166
Result for DEFAULT_e1931_00058:
  accuracy: 0.3274
  date: 2020-11-13_14-55-45
  done: false
  experiment_id: d4cbddf916974a0fbd437fdaee5c32e1
  experiment_tag: 58_batch_size=16,l1=256,l2=16,lr=0.02587
  hostname: gpuserver
  iterations_since_restore: 1
  loss: 1.7428031789779663
  node_ip: 145.52.252.20
  pid: 8932
  should_checkpoint: true
  time_since_restore: 26.91197371482849
  time_this_iter_s: 26.91197371482849
  time_total_s: 26.91197371482849
  timestamp: 1605275745
  timesteps_since_restore: 0
  training_iteration: 1
  trial_id: e1931_00058
  
== Status ==
Memo

2020-11-13 14:55:55,400	INFO (unknown file):0 -- gc.collect() freed 200 refs in 0.21981262788176537 seconds


[2m[36m(pid=5374)[0m [2, 20000] loss: 0.147
[2m[36m(pid=8932)[0m [2,  2000] loss: 1.780
[2m[36m(pid=8750)[0m [1, 10000] loss: 0.370
[2m[36m(pid=8652)[0m [1, 12000] loss: 0.347
[2m[36m(pid=8993)[0m [1,  4000] loss: 1.021
[2m[36m(pid=5382)[0m [6, 10000] loss: 0.209
[2m[36m(pid=7825)[0m [7,  2000] loss: 1.047
[2m[36m(pid=7795)[0m [2, 12000] loss: 0.303
[2m[36m(pid=8438)[0m [1, 16000] loss: 0.277
[2m[36m(pid=5451)[0m [4,  4000] loss: 0.703
[2m[36m(pid=9126)[0m Files already downloaded and verified
Result for DEFAULT_e1931_00038:
  accuracy: 0.3768
  date: 2020-11-13_14-56-02
  done: true
  experiment_id: ac894e4019ef4fe28b28e8ed9f4b8754
  experiment_tag: 38_batch_size=2,l1=32,l2=32,lr=0.003074
  hostname: gpuserver
  iterations_since_restore: 2
  loss: 1.715252740932256
  node_ip: 145.52.252.20
  pid: 5389
  should_checkpoint: true
  time_since_restore: 282.2733573913574
  time_this_iter_s: 136.12695598602295
  time_total_s: 282.2733573913574
  timestamp: 1

[2m[36m(pid=9184)[0m Files already downloaded and verified
[2m[36m(pid=8652)[0m [1, 14000] loss: 0.283
[2m[36m(pid=9204)[0m Files already downloaded and verified
[2m[36m(pid=7825)[0m [7,  4000] loss: 0.538
[2m[36m(pid=8993)[0m [1,  6000] loss: 0.666
[2m[36m(pid=9184)[0m Files already downloaded and verified
[2m[36m(pid=7795)[0m [2, 14000] loss: 0.260
[2m[36m(pid=9204)[0m Files already downloaded and verified
[2m[36m(pid=8438)[0m [1, 18000] loss: 0.244
[2m[36m(pid=5451)[0m [4,  6000] loss: 0.464
Result for DEFAULT_e1931_00039:
  accuracy: 0.4604
  date: 2020-11-13_14-56-15
  done: true
  experiment_id: 7b64ec48082747aba769d71e62500020
  experiment_tag: 39_batch_size=2,l1=8,l2=128,lr=0.0012714
  hostname: gpuserver
  iterations_since_restore: 2
  loss: 1.5099382144771516
  node_ip: 145.52.252.20
  pid: 5374
  should_checkpoint: true
  time_since_restore: 285.5686502456665
  time_this_iter_s: 138.26966166496277
  time_total_s: 285.5686502456665
  timestamp: 1

[2m[36m(pid=9216)[0m Files already downloaded and verified
Result for DEFAULT_e1931_00060:
  accuracy: 0.4765
  date: 2020-11-13_14-56-23
  done: false
  experiment_id: ec3769ae4df844378fab6a068b3f17ec
  experiment_tag: 60_batch_size=16,l1=64,l2=256,lr=0.007132
  hostname: gpuserver
  iterations_since_restore: 1
  loss: 1.4185985919952393
  node_ip: 145.52.252.20
  pid: 9126
  should_checkpoint: true
  time_since_restore: 26.655065298080444
  time_this_iter_s: 26.655065298080444
  time_total_s: 26.655065298080444
  timestamp: 1605275783
  timesteps_since_restore: 0
  training_iteration: 1
  trial_id: e1931_00060
  
[2m[36m(pid=8652)[0m [1, 16000] loss: 0.239
[2m[36m(pid=9216)[0m Files already downloaded and verified
[2m[36m(pid=8993)[0m [1,  8000] loss: 0.494
[2m[36m(pid=7795)[0m [2, 16000] loss: 0.226
[2m[36m(pid=9184)[0m [1,  2000] loss: 2.301
[2m[36m(pid=9204)[0m [1,  2000] loss: 2.345
[2m[36m(pid=5451)[0m [4,  8000] loss: 0.358
[2m[36m(pid=8438)[0m [1, 20

== Status ==
Memory usage on this node: 48.9/94.3 GiB
Using AsyncHyperBand: num_stopped=47
Bracket: Iter 16.000: None | Iter 8.000: -1.20817752943635 | Iter 4.000: -1.2275027099430562 | Iter 2.000: -1.46796318025589 | Iter 1.000: -1.8708154000163078
Resources requested: 32/40 CPUs, 4.0/4 GPUs, 0.0/53.52 GiB heap, 0.0/18.46 GiB objects (0/1.0 accelerator_type:RTX)
Result logdir: /home/brian/ray_results/DEFAULT
Number of trials: 100 (35 PENDING, 16 RUNNING, 49 TERMINATED)
+---------------------+------------+--------------------+--------------+------+------+-------------+---------+------------+----------------------+
| Trial name          | status     | loc                |   batch_size |   l1 |   l2 |          lr |    loss |   accuracy |   training_iteration |
|---------------------+------------+--------------------+--------------+------+------+-------------+---------+------------+----------------------|
| DEFAULT_e1931_00065 | PENDING    |                    |            2 |   64 |   32

[2m[36m(pid=8851)[0m [1, 18000] loss: 0.216
[2m[36m(pid=7825)[0m [9,  2000] loss: 1.001
Result for DEFAULT_e1931_00047:
  accuracy: 0.2988
  date: 2020-11-13_14-57-06
  done: true
  experiment_id: 6b77200f8c99447ba793fab2e4358013
  experiment_tag: 47_batch_size=2,l1=32,l2=4,lr=0.0028169
  hostname: gpuserver
  iterations_since_restore: 2
  loss: 1.8674825157981365
  node_ip: 145.52.252.20
  pid: 7795
  should_checkpoint: true
  time_since_restore: 284.9678361415863
  time_this_iter_s: 136.99152040481567
  time_total_s: 284.9678361415863
  timestamp: 1605275826
  timesteps_since_restore: 0
  training_iteration: 2
  trial_id: e1931_00047
  
[2m[36m(pid=5379)[0m [4, 16000] loss: 0.162
[2m[36m(pid=8750)[0m [2, 10000] loss: 0.321
[2m[36m(pid=9445)[0m [1,  2000] loss: 1.738
[2m[36m(pid=5382)[0m [7, 10000] loss: 0.211
[2m[36m(pid=9126)[0m [4,  2000] loss: 1.219
[2m[36m(pid=9216)[0m [1,  8000] loss: 0.486
[2m[36m(pid=8993)[0m [1, 16000] loss: 0.248
Result for DEFAULT

[2m[36m(pid=9216)[0m [1, 10000] loss: 0.365
Result for DEFAULT_e1931_00062:
  accuracy: 0.0961
  date: 2020-11-13_14-57-24
  done: true
  experiment_id: 16206ebabddd4a6da8a643375068b231
  experiment_tag: 62_batch_size=4,l1=16,l2=8,lr=0.072023
  hostname: gpuserver
  iterations_since_restore: 1
  loss: 2.3327603048801424
  node_ip: 145.52.252.20
  pid: 9204
  should_checkpoint: true
  time_since_restore: 78.56658911705017
  time_this_iter_s: 78.56658911705017
  time_total_s: 78.56658911705017
  timestamp: 1605275844
  timesteps_since_restore: 0
  training_iteration: 1
  trial_id: e1931_00062
  
[2m[36m(pid=9645)[0m Files already downloaded and verified
Result for DEFAULT_e1931_00061:
  accuracy: 0.256
  date: 2020-11-13_14-57-25
  done: true
  experiment_id: 681eb119e7a74cad9c4d25a543df0816
  experiment_tag: 61_batch_size=4,l1=64,l2=64,lr=0.00017459
  hostname: gpuserver
  iterations_since_restore: 1
  loss: 2.0275282989501955
  node_ip: 145.52.252.20
  pid: 9184
  should_checkpoi

[2m[36m(pid=9762)[0m Files already downloaded and verified
[2m[36m(pid=9741)[0m Files already downloaded and verified
[2m[36m(pid=9762)[0m Files already downloaded and verified
Result for DEFAULT_e1931_00057:
  accuracy: 0.2747
  date: 2020-11-13_14-57-36
  done: true
  experiment_id: 68f8fc0d25684175bdf8dc2a4d118587
  experiment_tag: 57_batch_size=2,l1=128,l2=64,lr=0.0049275
  hostname: gpuserver
  iterations_since_restore: 1
  loss: 1.9623720501363278
  node_ip: 145.52.252.20
  pid: 8851
  should_checkpoint: true
  time_since_restore: 148.42517590522766
  time_this_iter_s: 148.42517590522766
  time_total_s: 148.42517590522766
  timestamp: 1605275856
  timesteps_since_restore: 0
  training_iteration: 1
  trial_id: e1931_00057
  
[2m[36m(pid=8993)[0m [1, 20000] loss: 0.202
[2m[36m(pid=7825)[0m [10,  2000] loss: 0.973
[2m[36m(pid=9670)[0m [1,  2000] loss: 2.333
[2m[36m(pid=9645)[0m [1,  2000] loss: 1.916
[2m[36m(pid=5383)[0m [4, 16000] loss: 0.138
[2m[36m(pid=5

[2m[36m(pid=9952)[0m Files already downloaded and verified
[2m[36m(pid=5382)[0m [8,  6000] loss: 0.321
[2m[36m(pid=9952)[0m Files already downloaded and verified
Result for DEFAULT_e1931_00002:
  accuracy: 0.4972
  date: 2020-11-13_14-57-59
  done: true
  experiment_id: 1358c1471a804e3a8e1b43847cd66522
  experiment_tag: 2_batch_size=2,l1=4,l2=32,lr=0.00081123
  hostname: gpuserver
  iterations_since_restore: 4
  loss: 1.3786270138327033
  node_ip: 145.52.252.20
  pid: 5451
  should_checkpoint: true
  time_since_restore: 581.3290061950684
  time_this_iter_s: 141.02569389343262
  time_total_s: 581.3290061950684
  timestamp: 1605275879
  timesteps_since_restore: 0
  training_iteration: 4
  trial_id: e1931_00002
  
[2m[36m(pid=9645)[0m [2,  2000] loss: 1.808
[2m[36m(pid=9885)[0m [1,  2000] loss: 2.287
[2m[36m(pid=9741)[0m [1,  4000] loss: 1.147
Result for DEFAULT_e1931_00048:
  accuracy: 0.5937
  date: 2020-11-13_14-58-01
  done: false
  experiment_id: 97475105d8534707b72

[2m[36m(pid=9992)[0m [1,  2000] loss: 2.330
[2m[36m(pid=9558)[0m [1, 10000] loss: 0.358
Result for DEFAULT_e1931_00022:
  accuracy: 0.5898
  date: 2020-11-13_14-58-21
  done: false
  experiment_id: 404de1e772c348bbbb13fbf8b98542c2
  experiment_tag: 22_batch_size=2,l1=256,l2=32,lr=0.00073597
  hostname: gpuserver
  iterations_since_restore: 4
  loss: 1.1733361815563519
  node_ip: 145.52.252.20
  pid: 5383
  should_checkpoint: true
  time_since_restore: 552.0331761837006
  time_this_iter_s: 133.7221565246582
  time_total_s: 552.0331761837006
  timestamp: 1605275901
  timesteps_since_restore: 0
  training_iteration: 4
  trial_id: e1931_00022
  
== Status ==
Memory usage on this node: 49.2/94.3 GiB
Using AsyncHyperBand: num_stopped=58
Bracket: Iter 16.000: None | Iter 8.000: -1.20817752943635 | Iter 4.000: -1.2585972864810377 | Iter 2.000: -1.486377281832695 | Iter 1.000: -1.8708154000163078
Resources requested: 32/40 CPUs, 4.0/4 GPUs, 0.0/53.52 GiB heap, 0.0/18.46 GiB objects (0/1.0

[2m[36m(pid=8652)[0m [2, 14000] loss: 0.225
Result for DEFAULT_e1931_00075:
  accuracy: 0.4139
  date: 2020-11-13_14-58-34
  done: false
  experiment_id: 026c16fc9d22453192e6200a12ddedf9
  experiment_tag: 75_batch_size=16,l1=8,l2=256,lr=0.0042701
  hostname: gpuserver
  iterations_since_restore: 1
  loss: 1.561561541366577
  node_ip: 145.52.252.20
  pid: 10057
  should_checkpoint: true
  time_since_restore: 27.97012734413147
  time_this_iter_s: 27.97012734413147
  time_total_s: 27.97012734413147
  timestamp: 1605275914
  timesteps_since_restore: 0
  training_iteration: 1
  trial_id: e1931_00075
  
[2m[36m(pid=10032)[0m [1,  4000] loss: 0.836
[2m[36m(pid=9885)[0m [1,  8000] loss: 0.565
[2m[36m(pid=10055)[0m [1,  4000] loss: 1.136
[2m[36m(pid=9952)[0m [1,  6000] loss: 0.627
[2m[36m(pid=9741)[0m [1, 10000] loss: 0.381
[2m[36m(pid=9670)[0m [1, 12000] loss: 0.389
Result for DEFAULT_e1931_00063:
  accuracy: 0.4622
  date: 2020-11-13_14-58-40
  done: true
  experiment_id:

[2m[36m(pid=8652)[0m [2, 16000] loss: 0.195
[2m[36m(pid=10275)[0m Files already downloaded and verified
[2m[36m(pid=10057)[0m [2,  2000] loss: 1.457
Result for DEFAULT_e1931_00074:
  accuracy: 0.247
  date: 2020-11-13_14-58-48
  done: true
  experiment_id: 2b94fef4f24048968652a8b6a227499d
  experiment_tag: 74_batch_size=8,l1=128,l2=32,lr=0.00029838
  hostname: gpuserver
  iterations_since_restore: 1
  loss: 2.0770970610618593
  node_ip: 145.52.252.20
  pid: 10055
  should_checkpoint: true
  time_since_restore: 45.25376605987549
  time_this_iter_s: 45.25376605987549
  time_total_s: 45.25376605987549
  timestamp: 1605275928
  timesteps_since_restore: 0
  training_iteration: 1
  trial_id: e1931_00074
  
[2m[36m(pid=10275)[0m Files already downloaded and verified
[2m[36m(pid=9885)[0m [1, 10000] loss: 0.448
[2m[36m(pid=9952)[0m [1,  8000] loss: 0.437
[2m[36m(pid=9670)[0m [1, 14000] loss: 0.333
[2m[36m(pid=10317)[0m Files already downloaded and verified
Result for DEF

[2m[36m(pid=10418)[0m Files already downloaded and verified
[2m[36m(pid=10275)[0m [1,  2000] loss: 2.248
[2m[36m(pid=9670)[0m [1, 16000] loss: 0.291
[2m[36m(pid=9952)[0m [1, 10000] loss: 0.333
[2m[36m(pid=9741)[0m [1, 14000] loss: 0.253
[2m[36m(pid=10142)[0m [2,  2000] loss: 1.689
[2m[36m(pid=10317)[0m [1,  2000] loss: 2.309
[2m[36m(pid=5378)[0m [4, 18000] loss: 0.137
[2m[36m(pid=10057)[0m [3,  2000] loss: 1.358
[2m[36m(pid=10486)[0m Files already downloaded and verified
[2m[36m(pid=10234)[0m [1,  4000] loss: 1.125
[2m[36m(pid=10486)[0m Files already downloaded and verified
[2m[36m(pid=5383)[0m [5,  8000] loss: 0.263
[2m[36m(pid=9558)[0m [1, 18000] loss: 0.175
[2m[36m(pid=10376)[0m [1,  2000] loss: 1.846
[2m[36m(pid=10032)[0m [2,  4000] loss: 0.705
[2m[36m(pid=8652)[0m [2, 20000] loss: 0.152
Result for DEFAULT_e1931_00075:
  accuracy: 0.4828
  date: 2020-11-13_14-59-12
  done: false
  experiment_id: 026c16fc9d22453192e6200a12ddedf9
  e

Result for DEFAULT_e1931_00081:
  accuracy: 0.3933
  date: 2020-11-13_14-59-20
  done: false
  experiment_id: d149b3316d9647859ed7c65f048bc884
  experiment_tag: 81_batch_size=16,l1=8,l2=8,lr=0.0034765
  hostname: gpuserver
  iterations_since_restore: 1
  loss: 1.6131854351997374
  node_ip: 145.52.252.20
  pid: 10418
  should_checkpoint: true
  time_since_restore: 27.63779306411743
  time_this_iter_s: 27.63779306411743
  time_total_s: 27.63779306411743
  timestamp: 1605275960
  timesteps_since_restore: 0
  training_iteration: 1
  trial_id: e1931_00081
  
[2m[36m(pid=5383)[0m [5, 10000] loss: 0.207
[2m[36m(pid=9558)[0m [1, 20000] loss: 0.154
Result for DEFAULT_e1931_00073:
  accuracy: 0.5187
  date: 2020-11-13_14-59-21
  done: false
  experiment_id: 6a04558712dc4649bed35a6da7fba193
  experiment_tag: 73_batch_size=8,l1=32,l2=256,lr=0.0013334
  hostname: gpuserver
  iterations_since_restore: 2
  loss: 1.343193664240837
  node_ip: 145.52.252.20
  pid: 10032
  should_checkpoint: true
 



Result for DEFAULT_e1931_00076:
  accuracy: 0.4054
  date: 2020-11-13_14-59-25
  done: true
  experiment_id: a12b4e1a466546ce944d57ddef2250c9
  experiment_tag: 76_batch_size=8,l1=4,l2=32,lr=0.0063324
  hostname: gpuserver
  iterations_since_restore: 2
  loss: 1.5930275287628173
  node_ip: 145.52.252.20
  pid: 10142
  should_checkpoint: true
  time_since_restore: 74.40002608299255
  time_this_iter_s: 33.54141545295715
  time_total_s: 74.40002608299255
  timestamp: 1605275965
  timesteps_since_restore: 0
  training_iteration: 2
  trial_id: e1931_00076
  
[2m[36m(pid=10057)[0m [4,  2000] loss: 1.300


2020-11-13 14:59:26,418	INFO (unknown file):0 -- gc.collect() freed 236 refs in 0.2513187304139137 seconds


[2m[36m(pid=9670)[0m [1, 20000] loss: 0.233
[2m[36m(pid=10597)[0m Files already downloaded and verified
[2m[36m(pid=9952)[0m [1, 14000] loss: 0.222
[2m[36m(pid=9741)[0m [1, 18000] loss: 0.186
[2m[36m(pid=10597)[0m Files already downloaded and verified
Result for DEFAULT_e1931_00079:
  accuracy: 0.1004
  date: 2020-11-13_14-59-28
  done: true
  experiment_id: a0fa005f0c404fad83fb2b0f2e41661f
  experiment_tag: 79_batch_size=8,l1=32,l2=16,lr=0.00012859
  hostname: gpuserver
  iterations_since_restore: 1
  loss: 2.2975608350753784
  node_ip: 145.52.252.20
  pid: 10317
  should_checkpoint: true
  time_since_restore: 43.5386323928833
  time_this_iter_s: 43.5386323928833
  time_total_s: 43.5386323928833
  timestamp: 1605275968
  timesteps_since_restore: 0
  training_iteration: 1
  trial_id: e1931_00079
  
[2m[36m(pid=10376)[0m [2,  2000] loss: 1.414
Result for DEFAULT_e1931_00082:
  accuracy: 0.4592
  date: 2020-11-13_14-59-29
  done: false
  experiment_id: 10f0e250dce744708

[2m[36m(pid=10787)[0m Files already downloaded and verified
[2m[36m(pid=10275)[0m [2,  2000] loss: 1.527
Result for DEFAULT_e1931_00081:
  accuracy: 0.4389
  date: 2020-11-13_14-59-40
  done: true
  experiment_id: d149b3316d9647859ed7c65f048bc884
  experiment_tag: 81_batch_size=16,l1=8,l2=8,lr=0.0034765
  hostname: gpuserver
  iterations_since_restore: 2
  loss: 1.5085203742027282
  node_ip: 145.52.252.20
  pid: 10418
  should_checkpoint: true
  time_since_restore: 47.27505350112915
  time_this_iter_s: 19.63726043701172
  time_total_s: 47.27505350112915
  timestamp: 1605275980
  timesteps_since_restore: 0
  training_iteration: 2
  trial_id: e1931_00081
  
== Status ==
Memory usage on this node: 48.9/94.3 GiB
Using AsyncHyperBand: num_stopped=69
Bracket: Iter 16.000: None | Iter 8.000: -1.2510012845462188 | Iter 4.000: -1.2585972864810377 | Iter 2.000: -1.4855667536824941 | Iter 1.000: -1.865479642009735
Resources requested: 32/40 CPUs, 4.0/4 GPUs, 0.0/53.52 GiB heap, 0.0/18.46 Gi

[2m[36m(pid=10744)[0m [1,  2000] loss: 1.934
[2m[36m(pid=10926)[0m Files already downloaded and verified
[2m[36m(pid=10275)[0m [2,  4000] loss: 0.733
[2m[36m(pid=10787)[0m [1,  2000] loss: 1.964
Result for DEFAULT_e1931_00080:
  accuracy: 0.5513
  date: 2020-11-13_14-59-52
  done: false
  experiment_id: 408692bcd20d47d1a5943f691daef7d1
  experiment_tag: 80_batch_size=16,l1=128,l2=128,lr=0.0034125
  hostname: gpuserver
  iterations_since_restore: 3
  loss: 1.2758308347702025
  node_ip: 145.52.252.20
  pid: 10376
  should_checkpoint: true
  time_since_restore: 62.531853914260864
  time_this_iter_s: 17.544098615646362
  time_total_s: 62.531853914260864
  timestamp: 1605275992
  timesteps_since_restore: 0
  training_iteration: 3
  trial_id: e1931_00080
  
[2m[36m(pid=10978)[0m Files already downloaded and verified
[2m[36m(pid=9558)[0m [2,  2000] loss: 1.516
[2m[36m(pid=9952)[0m [1, 18000] loss: 0.171
[2m[36m(pid=10597)[0m [1,  4000] loss: 0.994
[2m[36m(pid=10978)

[2m[36m(pid=10486)[0m [3,  2000] loss: 1.226
[2m[36m(pid=10787)[0m [1,  4000] loss: 0.786
[2m[36m(pid=10926)[0m [1,  2000] loss: 2.283
[2m[36m(pid=11071)[0m Files already downloaded and verified
[2m[36m(pid=10376)[0m [4,  2000] loss: 1.139
[2m[36m(pid=11071)[0m Files already downloaded and verified
[2m[36m(pid=9558)[0m [2,  4000] loss: 0.748
[2m[36m(pid=9952)[0m [1, 20000] loss: 0.149
[2m[36m(pid=10597)[0m [1,  6000] loss: 0.624
[2m[36m(pid=8652)[0m [3,  6000] loss: 0.486
[2m[36m(pid=10978)[0m [1,  2000] loss: 2.301
Result for DEFAULT_e1931_00082:
  accuracy: 0.5625
  date: 2020-11-13_15-00-07
  done: false
  experiment_id: 10f0e250dce744708149535be64b5baf
  experiment_tag: 82_batch_size=16,l1=256,l2=256,lr=0.0034061
  hostname: gpuserver
  iterations_since_restore: 3
  loss: 1.2363892024040222
  node_ip: 145.52.252.20
  pid: 10486
  should_checkpoint: true
  time_since_restore: 66.17424154281616
  time_this_iter_s: 18.963034629821777
  time_total_s: 66

[2m[36m(pid=10926)[0m [1,  4000] loss: 1.052
[2m[36m(pid=9558)[0m [2,  6000] loss: 0.490
[2m[36m(pid=10597)[0m [1,  8000] loss: 0.451
[2m[36m(pid=11071)[0m [1,  2000] loss: 2.241
[2m[36m(pid=10978)[0m [1,  4000] loss: 1.140
[2m[36m(pid=8652)[0m [3,  8000] loss: 0.364
[2m[36m(pid=10486)[0m [4,  2000] loss: 1.114
[2m[36m(pid=5383)[0m [5, 20000] loss: 0.110
[2m[36m(pid=10848)[0m [1,  6000] loss: 0.776
[2m[36m(pid=10032)[0m [4,  4000] loss: 0.604
[2m[36m(pid=10376)[0m [5,  2000] loss: 1.056
[2m[36m(pid=9741)[0m [2,  4000] loss: 0.800
[2m[36m(pid=5378)[0m [5,  8000] loss: 0.301
[2m[36m(pid=10275)[0m [3,  4000] loss: 0.694
Result for DEFAULT_e1931_00071:
  accuracy: 0.4846
  date: 2020-11-13_15-00-24
  done: false
  experiment_id: 23398555c4374eddb57f04adf07f73e7
  experiment_tag: 71_batch_size=2,l1=256,l2=64,lr=0.0006568
  hostname: gpuserver
  iterations_since_restore: 1
  loss: 1.4321192227229476
  node_ip: 145.52.252.20
  pid: 9952
  should_check

2020-11-13 15:00:26,626	INFO (unknown file):0 -- gc.collect() freed 245 refs in 0.1704423502087593 seconds


Result for DEFAULT_e1931_00080:
  accuracy: 0.5984
  date: 2020-11-13_15-00-27
  done: false
  experiment_id: 408692bcd20d47d1a5943f691daef7d1
  experiment_tag: 80_batch_size=16,l1=128,l2=128,lr=0.0034125
  hostname: gpuserver
  iterations_since_restore: 5
  loss: 1.1685956188201905
  node_ip: 145.52.252.20
  pid: 10376
  should_checkpoint: true
  time_since_restore: 97.50431728363037
  time_this_iter_s: 17.502463340759277
  time_total_s: 97.50431728363037
  timestamp: 1605276027
  timesteps_since_restore: 0
  training_iteration: 5
  trial_id: e1931_00080
  
[2m[36m(pid=9558)[0m [2,  8000] loss: 0.364
[2m[36m(pid=10597)[0m [1, 10000] loss: 0.355
[2m[36m(pid=11071)[0m [1,  4000] loss: 1.012
Result for DEFAULT_e1931_00088:
  accuracy: 0.2231
  date: 2020-11-13_15-00-30
  done: true
  experiment_id: 41c985855a4742939caa5a56193b0174
  experiment_tag: 88_batch_size=8,l1=16,l2=256,lr=0.00017206
  hostname: gpuserver
  iterations_since_restore: 1
  loss: 2.131662745475769
  node_ip: 

[2m[36m(pid=9741)[0m [2,  6000] loss: 0.525
[2m[36m(pid=11261)[0m Files already downloaded and verified
[2m[36m(pid=10787)[0m [2,  4000] loss: 0.671
[2m[36m(pid=9952)[0m [2,  2000] loss: 1.435
Result for DEFAULT_e1931_00022:
  accuracy: 0.5965
  date: 2020-11-13_15-00-38
  done: false
  experiment_id: 404de1e772c348bbbb13fbf8b98542c2
  experiment_tag: 22_batch_size=2,l1=256,l2=32,lr=0.00073597
  hostname: gpuserver
  iterations_since_restore: 5
  loss: 1.1714350928676547
  node_ip: 145.52.252.20
  pid: 5383
  should_checkpoint: true
  time_since_restore: 688.6652851104736
  time_this_iter_s: 136.63210892677307
  time_total_s: 688.6652851104736
  timestamp: 1605276038
  timesteps_since_restore: 0
  training_iteration: 5
  trial_id: e1931_00022
  
[2m[36m(pid=11302)[0m Files already downloaded and verified
[2m[36m(pid=10486)[0m [5,  2000] loss: 1.018
[2m[36m(pid=10376)[0m [6,  2000] loss: 0.973
[2m[36m(pid=11302)[0m Files already downloaded and verified
[2m[36m(

[2m[36m(pid=9952)[0m [2,  6000] loss: 0.469
Result for DEFAULT_e1931_00082:
  accuracy: 0.6196
  date: 2020-11-13_15-01-02
  done: false
  experiment_id: 10f0e250dce744708149535be64b5baf
  experiment_tag: 82_batch_size=16,l1=256,l2=256,lr=0.0034061
  hostname: gpuserver
  iterations_since_restore: 6
  loss: 1.0958491794109344
  node_ip: 145.52.252.20
  pid: 10486
  should_checkpoint: true
  time_since_restore: 121.00583791732788
  time_this_iter_s: 18.104461908340454
  time_total_s: 121.00583791732788
  timestamp: 1605276062
  timesteps_since_restore: 0
  training_iteration: 6
  trial_id: e1931_00082
  
== Status ==
Memory usage on this node: 49.1/94.3 GiB
Using AsyncHyperBand: num_stopped=73
Bracket: Iter 16.000: None | Iter 8.000: -1.2510012845462188 | Iter 4.000: -1.228159960180521 | Iter 2.000: -1.46796318025589 | Iter 1.000: -1.865479642009735
Resources requested: 32/40 CPUs, 4.0/4 GPUs, 0.0/53.52 GiB heap, 0.0/18.46 GiB objects (0/1.0 accelerator_type:RTX)
Result logdir: /home

[2m[36m(pid=10787)[0m [3,  4000] loss: 0.599
[2m[36m(pid=5378)[0m [5, 16000] loss: 0.147
[2m[36m(pid=10848)[0m [1, 14000] loss: 0.332
Result for DEFAULT_e1931_00090:
  accuracy: 0.458
  date: 2020-11-13_15-01-11
  done: false
  experiment_id: a3ed4b479675481e8f7d4ce3e5fbbcd7
  experiment_tag: 90_batch_size=8,l1=16,l2=32,lr=0.0016719
  hostname: gpuserver
  iterations_since_restore: 1
  loss: 1.4772080944538117
  node_ip: 145.52.252.20
  pid: 11261
  should_checkpoint: true
  time_since_restore: 43.80416798591614
  time_this_iter_s: 43.80416798591614
  time_total_s: 43.80416798591614
  timestamp: 1605276071
  timesteps_since_restore: 0
  training_iteration: 1
  trial_id: e1931_00090
  
[2m[36m(pid=9741)[0m [2, 12000] loss: 0.256
[2m[36m(pid=5383)[0m [6,  6000] loss: 0.328
[2m[36m(pid=9952)[0m [2,  8000] loss: 0.341
[2m[36m(pid=10376)[0m [8,  2000] loss: 0.862
[2m[36m(pid=10486)[0m [7,  2000] loss: 0.854
Result for DEFAULT_e1931_00091:
  accuracy: 0.4769
  date: 2

Result for DEFAULT_e1931_00080:
  accuracy: 0.6305
  date: 2020-11-13_15-01-20
  done: false
  experiment_id: 408692bcd20d47d1a5943f691daef7d1
  experiment_tag: 80_batch_size=16,l1=128,l2=128,lr=0.0034125
  hostname: gpuserver
  iterations_since_restore: 8
  loss: 1.106956447839737
  node_ip: 145.52.252.20
  pid: 10376
  should_checkpoint: true
  time_since_restore: 150.28827333450317
  time_this_iter_s: 17.48623490333557
  time_total_s: 150.28827333450317
  timestamp: 1605276080
  timesteps_since_restore: 0
  training_iteration: 8
  trial_id: e1931_00080
  
Result for DEFAULT_e1931_00082:
  accuracy: 0.6142
  date: 2020-11-13_15-01-20
  done: false
  experiment_id: 10f0e250dce744708149535be64b5baf
  experiment_tag: 82_batch_size=16,l1=256,l2=256,lr=0.0034061
  hostname: gpuserver
  iterations_since_restore: 7
  loss: 1.1427586791038513
  node_ip: 145.52.252.20
  pid: 10486
  should_checkpoint: true
  time_since_restore: 139.57081246376038
  time_this_iter_s: 18.564974546432495
  time_

[2m[36m(pid=9558)[0m [2, 20000] loss: 0.135
[2m[36m(pid=10787)[0m [4,  4000] loss: 0.562
[2m[36m(pid=11493)[0m [1,  4000] loss: 1.159
Result for DEFAULT_e1931_00090:
  accuracy: 0.5231
  date: 2020-11-13_15-01-46
  done: false
  experiment_id: a3ed4b479675481e8f7d4ce3e5fbbcd7
  experiment_tag: 90_batch_size=8,l1=16,l2=32,lr=0.0016719
  hostname: gpuserver
  iterations_since_restore: 2
  loss: 1.3261580924749374
  node_ip: 145.52.252.20
  pid: 11261
  should_checkpoint: true
  time_since_restore: 78.25902271270752
  time_this_iter_s: 34.45485472679138
  time_total_s: 78.25902271270752
  timestamp: 1605276106
  timesteps_since_restore: 0
  training_iteration: 2
  trial_id: e1931_00090
  
== Status ==
Memory usage on this node: 48.9/94.3 GiB
Using AsyncHyperBand: num_stopped=74
Bracket: Iter 16.000: None | Iter 8.000: -1.1616001242041587 | Iter 4.000: -1.2300583099722862 | Iter 2.000: -1.4646864913463593 | Iter 1.000: -1.8478457763671876
Resources requested: 32/40 CPUs, 4.0/4 GPU

[2m[36m(pid=10486)[0m [9,  2000] loss: 0.713
[2m[36m(pid=11071)[0m [1, 18000] loss: 0.170
[2m[36m(pid=10032)[0m [7,  2000] loss: 1.063
Result for DEFAULT_e1931_00085:
  accuracy: 0.5807
  date: 2020-11-13_15-01-53
  done: false
  experiment_id: 30eec32b237741a4a0e140cbd0602ca6
  experiment_tag: 85_batch_size=8,l1=128,l2=128,lr=0.0026019
  hostname: gpuserver
  iterations_since_restore: 4
  loss: 1.2098377489089966
  node_ip: 145.52.252.20
  pid: 10787
  should_checkpoint: true
  time_since_restore: 143.49812602996826
  time_this_iter_s: 33.45432233810425
  time_total_s: 143.49812602996826
  timestamp: 1605276113
  timesteps_since_restore: 0
  training_iteration: 4
  trial_id: e1931_00085
  
[2m[36m(pid=11493)[0m [1,  6000] loss: 0.771
Result for DEFAULT_e1931_00080:
  accuracy: 0.6163
  date: 2020-11-13_15-01-55
  done: false
  experiment_id: 408692bcd20d47d1a5943f691daef7d1
  experiment_tag: 80_batch_size=16,l1=128,l2=128,lr=0.0034125
  hostname: gpuserver
  iterations_sin

[2m[36m(pid=11493)[0m [1,  8000] loss: 0.578
[2m[36m(pid=10486)[0m [10,  2000] loss: 0.646
[2m[36m(pid=11261)[0m [3,  4000] loss: 0.655
[2m[36m(pid=10597)[0m [2,  4000] loss: 0.835
[2m[36m(pid=5383)[0m [6, 16000] loss: 0.129
[2m[36m(pid=9558)[0m [3,  2000] loss: 1.309
[2m[36m(pid=11854)[0m Files already downloaded and verified
[2m[36m(pid=11302)[0m [3,  4000] loss: 0.605
[2m[36m(pid=5378)[0m [6,  4000] loss: 0.570
[2m[36m(pid=11854)[0m Files already downloaded and verified
Result for DEFAULT_e1931_00082:
  accuracy: 0.6011
  date: 2020-11-13_15-02-15
  done: false
  experiment_id: 10f0e250dce744708149535be64b5baf
  experiment_tag: 82_batch_size=16,l1=256,l2=256,lr=0.0034061
  hostname: gpuserver
  iterations_since_restore: 10
  loss: 1.2565842367172242
  node_ip: 145.52.252.20
  pid: 10486
  should_checkpoint: true
  time_since_restore: 194.26350235939026
  time_this_iter_s: 18.21313762664795
  time_total_s: 194.26350235939026
  timestamp: 1605276135
  tim

[2m[36m(pid=10597)[0m [2,  6000] loss: 0.554
[2m[36m(pid=11905)[0m Files already downloaded and verified
[2m[36m(pid=5383)[0m [6, 18000] loss: 0.112
Result for DEFAULT_e1931_00091:
  accuracy: 0.5737
  date: 2020-11-13_15-02-24
  done: false
  experiment_id: f75cb8613c494c268bb1378a294938d2
  experiment_tag: 91_batch_size=8,l1=256,l2=64,lr=0.0025626
  hostname: gpuserver
  iterations_since_restore: 3
  loss: 1.211514049220085
  node_ip: 145.52.252.20
  pid: 11302
  should_checkpoint: true
  time_since_restore: 112.62610673904419
  time_this_iter_s: 35.143972396850586
  time_total_s: 112.62610673904419
  timestamp: 1605276144
  timesteps_since_restore: 0
  training_iteration: 3
  trial_id: e1931_00091
  
[2m[36m(pid=11905)[0m Files already downloaded and verified
[2m[36m(pid=9558)[0m [3,  4000] loss: 0.644
[2m[36m(pid=5378)[0m [6,  6000] loss: 0.382
[2m[36m(pid=11954)[0m Files already downloaded and verified
Result for DEFAULT_e1931_00085:
  accuracy: 0.5871
  date:

[2m[36m(pid=10597)[0m [2,  8000] loss: 0.417
[2m[36m(pid=12033)[0m Files already downloaded and verified
[2m[36m(pid=5383)[0m [6, 20000] loss: 0.101
[2m[36m(pid=11302)[0m [4,  2000] loss: 1.101
[2m[36m(pid=12033)[0m Files already downloaded and verified
[2m[36m(pid=9558)[0m [3,  6000] loss: 0.433
[2m[36m(pid=5378)[0m [6,  8000] loss: 0.283
[2m[36m(pid=11905)[0m [1,  2000] loss: 2.040
Result for DEFAULT_e1931_00093:
  accuracy: 0.3679
  date: 2020-11-13_15-02-38
  done: false
  experiment_id: 02639f49b2f844258a1719fe86f9881a
  experiment_tag: 93_batch_size=8,l1=8,l2=256,lr=0.0086422
  hostname: gpuserver
  iterations_since_restore: 1
  loss: 1.7177105865955353
  node_ip: 145.52.252.20
  pid: 11784
  should_checkpoint: true
  time_since_restore: 41.10854768753052
  time_this_iter_s: 41.10854768753052
  time_total_s: 41.10854768753052
  timestamp: 1605276158
  timesteps_since_restore: 0
  training_iteration: 1
  trial_id: e1931_00093
  
[2m[36m(pid=10787)[0m [6,

[2m[36m(pid=12161)[0m Files already downloaded and verified
[2m[36m(pid=11954)[0m [1,  4000] loss: 1.162
[2m[36m(pid=8652)[0m [4, 10000] loss: 0.263
[2m[36m(pid=12161)[0m Files already downloaded and verified
Result for DEFAULT_e1931_00022:
  accuracy: 0.6035
  date: 2020-11-13_15-02-54
  done: false
  experiment_id: 404de1e772c348bbbb13fbf8b98542c2
  experiment_tag: 22_batch_size=2,l1=256,l2=32,lr=0.00073597
  hostname: gpuserver
  iterations_since_restore: 6
  loss: 1.1860738186916207
  node_ip: 145.52.252.20
  pid: 5383
  should_checkpoint: true
  time_since_restore: 824.6319661140442
  time_this_iter_s: 135.96668100357056
  time_total_s: 824.6319661140442
  timestamp: 1605276174
  timesteps_since_restore: 0
  training_iteration: 6
  trial_id: e1931_00022
  
Result for DEFAULT_e1931_00090:
  accuracy: 0.5591
  date: 2020-11-13_15-02-55
  done: true
  experiment_id: a3ed4b479675481e8f7d4ce3e5fbbcd7
  experiment_tag: 90_batch_size=8,l1=16,l2=32,lr=0.0016719
  hostname: gpu

[2m[36m(pid=10597)[0m [2, 14000] loss: 0.238
[2m[36m(pid=11302)[0m [5,  2000] loss: 0.988
[2m[36m(pid=10787)[0m [7,  2000] loss: 0.918
[2m[36m(pid=5378)[0m [6, 14000] loss: 0.160
[2m[36m(pid=9558)[0m [3, 12000] loss: 0.209
[2m[36m(pid=12033)[0m [1,  6000] loss: 0.774
[2m[36m(pid=8652)[0m [4, 14000] loss: 0.188
[2m[36m(pid=5383)[0m [7,  4000] loss: 0.438
[2m[36m(pid=12161)[0m [1,  4000] loss: 0.800
[2m[36m(pid=11071)[0m [2, 10000] loss: 0.294
[2m[36m(pid=9952)[0m [3,  6000] loss: 0.419
[2m[36m(pid=12100)[0m [1,  6000] loss: 0.767
[2m[36m(pid=10597)[0m [2, 16000] loss: 0.209
[2m[36m(pid=10787)[0m [7,  4000] loss: 0.479
[2m[36m(pid=11302)[0m [5,  4000] loss: 0.515
[2m[36m(pid=5378)[0m [6, 16000] loss: 0.142
[2m[36m(pid=9558)[0m [3, 14000] loss: 0.185
[2m[36m(pid=12033)[0m [1,  8000] loss: 0.580
[2m[36m(pid=8652)[0m [4, 16000] loss: 0.161
[2m[36m(pid=5383)[0m [7,  6000] loss: 0.298
Result for DEFAULT_e1931_00099:
  accuracy: 0.471

== Status ==
Memory usage on this node: 38.0/94.3 GiB
Using AsyncHyperBand: num_stopped=83
Bracket: Iter 16.000: None | Iter 8.000: -1.1630976619422435 | Iter 4.000: -1.228159960180521 | Iter 2.000: -1.4614098024368287 | Iter 1.000: -1.8566627091884613
Resources requested: 24/40 CPUs, 3.0/4 GPUs, 0.0/53.52 GiB heap, 0.0/18.46 GiB objects (0/1.0 accelerator_type:RTX)
Result logdir: /home/brian/ray_results/DEFAULT
Number of trials: 100 (12 RUNNING, 88 TERMINATED)
+---------------------+------------+---------------------+--------------+------+------+-------------+---------+------------+----------------------+
| Trial name          | status     | loc                 |   batch_size |   l1 |   l2 |          lr |    loss |   accuracy |   training_iteration |
|---------------------+------------+---------------------+--------------+------+------+-------------+---------+------------+----------------------|
| DEFAULT_e1931_00022 | RUNNING    | 145.52.252.20:5383  |            2 |  256 |   32 | 0.

[2m[36m(pid=12100)[0m [1, 14000] loss: 0.302
[2m[36m(pid=9952)[0m [3, 14000] loss: 0.177
[2m[36m(pid=5378)[0m [7,  2000] loss: 1.075
[2m[36m(pid=5383)[0m [7, 14000] loss: 0.133
[2m[36m(pid=12033)[0m [1, 16000] loss: 0.290
[2m[36m(pid=11071)[0m [2, 20000] loss: 0.142
[2m[36m(pid=12161)[0m [3,  2000] loss: 1.250
[2m[36m(pid=11302)[0m [7,  2000] loss: 0.840
Result for DEFAULT_e1931_00065:
  accuracy: 0.5606
  date: 2020-11-13_15-04-18
  done: false
  experiment_id: b01972942689499c8185bc4668ba47fc
  experiment_tag: 65_batch_size=2,l1=64,l2=32,lr=0.00044146
  hostname: gpuserver
  iterations_since_restore: 3
  loss: 1.2565351666620002
  node_ip: 145.52.252.20
  pid: 9558
  should_checkpoint: true
  time_since_restore: 429.21035146713257
  time_this_iter_s: 137.34790086746216
  time_total_s: 429.21035146713257
  timestamp: 1605276258
  timesteps_since_restore: 0
  training_iteration: 3
  trial_id: e1931_00065
  
== Status ==
Memory usage on this node: 30.1/94.3 GiB
U

[2m[36m(pid=11302)[0m [7,  4000] loss: 0.454
[2m[36m(pid=12100)[0m [1, 18000] loss: 0.224
[2m[36m(pid=9558)[0m [4,  2000] loss: 1.170
[2m[36m(pid=9952)[0m [3, 18000] loss: 0.134
[2m[36m(pid=5378)[0m [7,  6000] loss: 0.357
[2m[36m(pid=5383)[0m [7, 18000] loss: 0.103
[2m[36m(pid=12033)[0m [1, 20000] loss: 0.232
Result for DEFAULT_e1931_00099:
  accuracy: 0.5565
  date: 2020-11-13_15-04-36
  done: false
  experiment_id: 89d07c4d0c5f4dd9bf3bdb99a5e5a074
  experiment_tag: 99_batch_size=8,l1=256,l2=32,lr=0.0035387
  hostname: gpuserver
  iterations_since_restore: 3
  loss: 1.2445476999521254
  node_ip: 145.52.252.20
  pid: 12161
  should_checkpoint: true
  time_since_restore: 111.03524041175842
  time_this_iter_s: 32.974355697631836
  time_total_s: 111.03524041175842
  timestamp: 1605276276
  timesteps_since_restore: 0
  training_iteration: 3
  trial_id: e1931_00099
  
== Status ==
Memory usage on this node: 30.1/94.3 GiB
Using AsyncHyperBand: num_stopped=86
Bracket: Ite

Result for DEFAULT_e1931_00098:
  accuracy: 0.2594
  date: 2020-11-13_15-04-53
  done: true
  experiment_id: 4b670baea5c3433ebac79574acd13122
  experiment_tag: 98_batch_size=2,l1=128,l2=8,lr=0.00016041
  hostname: gpuserver
  iterations_since_restore: 1
  loss: 1.9386106283307076
  node_ip: 145.52.252.20
  pid: 12100
  should_checkpoint: true
  time_since_restore: 136.74322533607483
  time_this_iter_s: 136.74322533607483
  time_total_s: 136.74322533607483
  timestamp: 1605276293
  timesteps_since_restore: 0
  training_iteration: 1
  trial_id: e1931_00098
  
[2m[36m(pid=9558)[0m [4,  6000] loss: 0.399
Result for DEFAULT_e1931_00022:
  accuracy: 0.5788
  date: 2020-11-13_15-04-56
  done: false
  experiment_id: 404de1e772c348bbbb13fbf8b98542c2
  experiment_tag: 22_batch_size=2,l1=256,l2=32,lr=0.00073597
  hostname: gpuserver
  iterations_since_restore: 7
  loss: 1.280665869098861
  node_ip: 145.52.252.20
  pid: 5383
  should_checkpoint: true
  time_since_restore: 946.9602155685425
  ti

[2m[36m(pid=11071)[0m [3,  8000] loss: 0.345
[2m[36m(pid=9952)[0m [4,  2000] loss: 1.087
Result for DEFAULT_e1931_00099:
  accuracy: 0.5995
  date: 2020-11-13_15-05-09
  done: false
  experiment_id: 89d07c4d0c5f4dd9bf3bdb99a5e5a074
  experiment_tag: 99_batch_size=8,l1=256,l2=32,lr=0.0035387
  hostname: gpuserver
  iterations_since_restore: 4
  loss: 1.150946010285616
  node_ip: 145.52.252.20
  pid: 12161
  should_checkpoint: true
  time_since_restore: 143.9420759677887
  time_this_iter_s: 32.90683555603027
  time_total_s: 143.9420759677887
  timestamp: 1605276309
  timesteps_since_restore: 0
  training_iteration: 4
  trial_id: e1931_00099
  
[2m[36m(pid=5378)[0m [7, 14000] loss: 0.156
[2m[36m(pid=9558)[0m [4, 10000] loss: 0.237
[2m[36m(pid=5383)[0m [8,  4000] loss: 0.407
[2m[36m(pid=11071)[0m [3, 10000] loss: 0.276
[2m[36m(pid=11302)[0m [9,  2000] loss: 0.736
[2m[36m(pid=9952)[0m [4,  4000] loss: 0.555
[2m[36m(pid=12161)[0m [5,  2000] loss: 1.064
[2m[36m(pi

[2m[36m(pid=5383)[0m [8, 12000] loss: 0.148
[2m[36m(pid=11071)[0m [3, 18000] loss: 0.152
[2m[36m(pid=9558)[0m [4, 18000] loss: 0.134
[2m[36m(pid=11302)[0m [10,  4000] loss: 0.383
[2m[36m(pid=12161)[0m [6,  4000] loss: 0.517
[2m[36m(pid=9952)[0m [4, 12000] loss: 0.194
[2m[36m(pid=5378)[0m [8,  2000] loss: 1.061
[2m[36m(pid=5383)[0m [8, 14000] loss: 0.129
[2m[36m(pid=11071)[0m [3, 20000] loss: 0.138
Result for DEFAULT_e1931_00091:
  accuracy: 0.6047
  date: 2020-11-13_15-06-09
  done: false
  experiment_id: f75cb8613c494c268bb1378a294938d2
  experiment_tag: 91_batch_size=8,l1=256,l2=64,lr=0.0025626
  hostname: gpuserver
  iterations_since_restore: 10
  loss: 1.294284700459242
  node_ip: 145.52.252.20
  pid: 11302
  should_checkpoint: true
  time_since_restore: 337.63283133506775
  time_this_iter_s: 30.3942551612854
  time_total_s: 337.63283133506775
  timestamp: 1605276369
  timesteps_since_restore: 0
  training_iteration: 10
  trial_id: e1931_00091
  
== Statu

[2m[36m(pid=9952)[0m [4, 16000] loss: 0.139
[2m[36m(pid=5378)[0m [8,  6000] loss: 0.357
Result for DEFAULT_e1931_00065:
  accuracy: 0.5428
  date: 2020-11-13_15-06-27
  done: true
  experiment_id: b01972942689499c8185bc4668ba47fc
  experiment_tag: 65_batch_size=2,l1=64,l2=32,lr=0.00044146
  hostname: gpuserver
  iterations_since_restore: 4
  loss: 1.2881728448329492
  node_ip: 145.52.252.20
  pid: 9558
  should_checkpoint: true
  time_since_restore: 558.2624471187592
  time_this_iter_s: 129.0520956516266
  time_total_s: 558.2624471187592
  timestamp: 1605276387
  timesteps_since_restore: 0
  training_iteration: 4
  trial_id: e1931_00065
  
[2m[36m(pid=5383)[0m [8, 18000] loss: 0.100
[2m[36m(pid=11071)[0m [4,  2000] loss: 1.322
[2m[36m(pid=9952)[0m [4, 18000] loss: 0.122
[2m[36m(pid=12161)[0m [7,  4000] loss: 0.493
[2m[36m(pid=5378)[0m [8,  8000] loss: 0.265
[2m[36m(pid=5383)[0m [8, 20000] loss: 0.093
Result for DEFAULT_e1931_00099:
  accuracy: 0.5927
  date: 202

[2m[36m(pid=11071)[0m [4,  6000] loss: 0.449
[2m[36m(pid=12161)[0m [8,  2000] loss: 0.896
[2m[36m(pid=5378)[0m [8, 12000] loss: 0.178
Result for DEFAULT_e1931_00071:
  accuracy: 0.5885
  date: 2020-11-13_15-06-57
  done: false
  experiment_id: 23398555c4374eddb57f04adf07f73e7
  experiment_tag: 71_batch_size=2,l1=256,l2=64,lr=0.0006568
  hostname: gpuserver
  iterations_since_restore: 4
  loss: 1.1859949432839174
  node_ip: 145.52.252.20
  pid: 9952
  should_checkpoint: true
  time_since_restore: 546.2173924446106
  time_this_iter_s: 118.61144280433655
  time_total_s: 546.2173924446106
  timestamp: 1605276417
  timesteps_since_restore: 0
  training_iteration: 4
  trial_id: e1931_00071
  
[2m[36m(pid=11071)[0m [4,  8000] loss: 0.337
[2m[36m(pid=12161)[0m [8,  4000] loss: 0.466
[2m[36m(pid=5378)[0m [8, 14000] loss: 0.151
[2m[36m(pid=9952)[0m [5,  2000] loss: 1.027
[2m[36m(pid=11071)[0m [4, 10000] loss: 0.264
Result for DEFAULT_e1931_00099:
  accuracy: 0.5918
  date

[2m[36m(pid=9952)[0m [5, 10000] loss: 0.206
[2m[36m(pid=11071)[0m [4, 18000] loss: 0.149
[2m[36m(pid=5378)[0m [9,  2000] loss: 0.986
[2m[36m(pid=9952)[0m [5, 12000] loss: 0.174
[2m[36m(pid=11071)[0m [4, 20000] loss: 0.132
[2m[36m(pid=5378)[0m [9,  4000] loss: 0.515
[2m[36m(pid=9952)[0m [5, 14000] loss: 0.149
Result for DEFAULT_e1931_00089:
  accuracy: 0.531
  date: 2020-11-13_15-08-10
  done: true
  experiment_id: 546e9685646d4721ae65bebbbd8a8f04
  experiment_tag: 89_batch_size=2,l1=16,l2=64,lr=0.0010276
  hostname: gpuserver
  iterations_since_restore: 4
  loss: 1.3219737589376048
  node_ip: 145.52.252.20
  pid: 11071
  should_checkpoint: true
  time_since_restore: 493.25907373428345
  time_this_iter_s: 107.36341834068298
  time_total_s: 493.25907373428345
  timestamp: 1605276490
  timesteps_since_restore: 0
  training_iteration: 4
  trial_id: e1931_00089
  
== Status ==
Memory usage on this node: 14.0/94.3 GiB
Using AsyncHyperBand: num_stopped=92
Bracket: Iter 16

[2m[36m(pid=5378)[0m [9, 14000] loss: 0.147
[2m[36m(pid=9952)[0m [6,  2000] loss: 0.891
[2m[36m(pid=5378)[0m [9, 16000] loss: 0.130
[2m[36m(pid=9952)[0m [6,  4000] loss: 0.481
[2m[36m(pid=5378)[0m [9, 18000] loss: 0.116
[2m[36m(pid=9952)[0m [6,  6000] loss: 0.311
[2m[36m(pid=5378)[0m [9, 20000] loss: 0.105
[2m[36m(pid=9952)[0m [6,  8000] loss: 0.240
Result for DEFAULT_e1931_00031:
  accuracy: 0.6121
  date: 2020-11-13_15-09-28
  done: false
  experiment_id: 6a69e15f8e724840bef97b4a131e30f1
  experiment_tag: 31_batch_size=2,l1=32,l2=128,lr=0.00016403
  hostname: gpuserver
  iterations_since_restore: 9
  loss: 1.0976547864989377
  node_ip: 145.52.252.20
  pid: 5378
  should_checkpoint: true
  time_since_restore: 1138.325258731842
  time_this_iter_s: 104.34226298332214
  time_total_s: 1138.325258731842
  timestamp: 1605276568
  timesteps_since_restore: 0
  training_iteration: 9
  trial_id: e1931_00031
  
== Status ==
Memory usage on this node: 11.3/94.3 GiB
Using A

[2m[36m(pid=5378)[0m [10, 14000] loss: 0.144
[2m[36m(pid=9952)[0m [7,  2000] loss: 0.838
[2m[36m(pid=5378)[0m [10, 16000] loss: 0.126
[2m[36m(pid=9952)[0m [7,  4000] loss: 0.430
[2m[36m(pid=5378)[0m [10, 18000] loss: 0.110
[2m[36m(pid=9952)[0m [7,  6000] loss: 0.289
[2m[36m(pid=5378)[0m [10, 20000] loss: 0.102
[2m[36m(pid=9952)[0m [7,  8000] loss: 0.224
Result for DEFAULT_e1931_00031:
  accuracy: 0.6162
  date: 2020-11-13_15-11-10
  done: false
  experiment_id: 6a69e15f8e724840bef97b4a131e30f1
  experiment_tag: 31_batch_size=2,l1=32,l2=128,lr=0.00016403
  hostname: gpuserver
  iterations_since_restore: 10
  loss: 1.0928039968871512
  node_ip: 145.52.252.20
  pid: 5378
  should_checkpoint: true
  time_since_restore: 1240.8409352302551
  time_this_iter_s: 102.51567649841309
  time_total_s: 1240.8409352302551
  timestamp: 1605276670
  timesteps_since_restore: 0
  training_iteration: 10
  trial_id: e1931_00031
  
== Status ==
Memory usage on this node: 11.3/94.3 GiB

[2m[36m(pid=9952)[0m [8,  2000] loss: 0.801
[2m[36m(pid=9952)[0m [8,  4000] loss: 0.396
[2m[36m(pid=9952)[0m [8,  6000] loss: 0.272
[2m[36m(pid=9952)[0m [8,  8000] loss: 0.208
[2m[36m(pid=9952)[0m [8, 10000] loss: 0.175
[2m[36m(pid=9952)[0m [8, 12000] loss: 0.149
[2m[36m(pid=9952)[0m [8, 14000] loss: 0.121
[2m[36m(pid=9952)[0m [8, 16000] loss: 0.111
[2m[36m(pid=9952)[0m [8, 18000] loss: 0.096
[2m[36m(pid=9952)[0m [8, 20000] loss: 0.088
Result for DEFAULT_e1931_00071:
  accuracy: 0.6104
  date: 2020-11-13_15-14-01
  done: true
  experiment_id: 23398555c4374eddb57f04adf07f73e7
  experiment_tag: 71_batch_size=2,l1=256,l2=64,lr=0.0006568
  hostname: gpuserver
  iterations_since_restore: 8
  loss: 1.1834242239820676
  node_ip: 145.52.252.20
  pid: 9952
  should_checkpoint: true
  time_since_restore: 970.477646112442
  time_this_iter_s: 105.68485283851624
  time_total_s: 970.477646112442
  timestamp: 1605276841
  timesteps_since_restore: 0
  training_iteration: 

Best trial config: {'num_gpus': 0.25, 'num_cpus_for_driver': 1, 'num_cpus_per_worker': 1, 'num_workers': 2, 'l1': 32, 'l2': 128, 'lr': 0.00016403435434371365, 'batch_size': 2}
Best trial final validation loss: 1.0928039968871512
Best trial final validation accuracy: 0.6162
Files already downloaded and verified
Files already downloaded and verified
Best trial test set accuracy: 0.6147
