## Install Libraries


In [33]:
%pip install "ray[tune]"
# %pip install torch torchvision torchaudio # Uncomment this to install PyTorch 2.0+ on ilab (required version to run this program)

Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/


## Import Libraries


In [34]:
from filelock import FileLock
from ray import tune
from ray.air import session
from ray.air.checkpoint import Checkpoint
from torch.utils.data import random_split
import os
import torch
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as optim
import torchvision
import torchvision.transforms as transforms
from collections import OrderedDict


## Data loaders


In [35]:
def load_data(data_dir="./data"):
    transform = transforms.Compose(
        [transforms.ToTensor(), transforms.Normalize((0.5, 0.5, 0.5), (0.5, 0.5, 0.5))]
    )

    with FileLock(os.path.expanduser("~/.data.lock")):
        trainset = torchvision.datasets.CIFAR10(
            root=data_dir, train=True, download=True, transform=transform
        )

        testset = torchvision.datasets.CIFAR10(
            root=data_dir, train=False, download=True, transform=transform
        )

    return trainset, testset


## Configurable neural network


In [36]:
def flatten(x, start_dim=1, end_dim=-1):
    return x.flatten(start_dim=start_dim, end_dim=end_dim)


In [37]:
# Will need to modify the parameters and the network depending on what you are experimenting with

C, H, W = 3, 32, 32
num_classes = 10

channel_1 = 32
channel_2 = 64
channel_3 = 128
pool_kernel_size = 2

kernel_size_1 = 3
kernel_size_2 = 5
kernel_size_3 = 7

pad_size_1 = 2
pad_size_2 = 3
pad_size_3 = 3

fc_count_1 = 1024

class Net(nn.Module):
    def __init__(self):
        super(Net, self).__init__()
        self.conv1 = nn.Conv2d(3, channel_1, kernel_size_1, padding=pad_size_1)
        self.norm1 = nn.BatchNorm2d(channel_1)
        self.pool1 = nn.MaxPool2d(pool_kernel_size)
        self.conv2 = nn.Conv2d(channel_1, channel_2, kernel_size_2, padding=pad_size_2)
        self.norm2 = nn.BatchNorm2d(channel_2)
        self.pool2 = nn.MaxPool2d(pool_kernel_size)
        self.conv3 = nn.Conv2d(channel_2, channel_3, kernel_size_3, padding=pad_size_3)
        self.norm3 = nn.BatchNorm2d(channel_3)
        self.pool3 = nn.MaxPool2d(pool_kernel_size)        

        H_after_conv1 = int(H + 2*pad_size_1 - 1*(kernel_size_1-1) - 1 + 1)
        W_after_conv1 = int(W + 2*pad_size_1 - 1*(kernel_size_1-1) - 1 + 1)
        H_after_pool1 = int((H_after_conv1 + 2*0 - 1*(pool_kernel_size-1) - 1) / pool_kernel_size + 1)
        W_after_pool1 = int((W_after_conv1 + 2*0 - 1*(pool_kernel_size-1) - 1) / pool_kernel_size + 1)
        H_after_conv2 = int(H_after_pool1 + 2*pad_size_2 - 1*(kernel_size_2-1) - 1 + 1)
        W_after_conv2 = int(W_after_pool1 + 2*pad_size_2 - 1*(kernel_size_2-1) - 1 + 1)
        H_after_pool2 = int((H_after_conv2 + 2*0 - 1*(pool_kernel_size-1) - 1) / pool_kernel_size + 1)
        W_after_pool2 = int((W_after_conv2 + 2*0 - 1*(pool_kernel_size-1) - 1) / pool_kernel_size + 1)  
        H_after_conv3 = int(H_after_pool2 + 2*pad_size_3 - 1*(kernel_size_3-1) - 1 + 1)
        W_after_conv3 = int(W_after_pool2 + 2*pad_size_3 - 1*(kernel_size_3-1) - 1 + 1)
        H_after_pool3 = int((H_after_conv3 + 2*0 - 1*(pool_kernel_size-1) - 1) / pool_kernel_size + 1)
        W_after_pool3 = int((W_after_conv3 + 2*0 - 1*(pool_kernel_size-1) - 1) / pool_kernel_size + 1)

        self.fc1 = nn.Linear(H_after_pool3*W_after_pool3*channel_3, fc_count_1)
        self.fc2 = nn.Linear(fc_count_1, fc_count_1)
        self.fc3 = nn.Linear(fc_count_1, 10)


    def forward(self, x):
        x = self.conv1(x)
        x = self.norm1(x)
        x = F.relu(x)
        x = self.pool1(x)
        x = self.conv2(x)
        x = self.norm2(x)
        x = F.relu(x)
        x = self.pool2(x)
        x = self.conv3(x)
        x = self.norm3(x)
        x = F.relu(x)
        x = self.pool3(x)
        x = flatten(x)
        x = self.fc1(x)
        #x = F.relu(x)
        x = self.fc2(x)
        #x = F.relu(x)
        x = self.fc3(x)

        return x



## The train function


In [38]:
def train_cifar(config):
    net = Net()  # Will need to modify the parameters depending on what you are experimenting with

    learning_rate = config['learning_rate']
    momentum = 0.5
    weight_decay = 1e-4

    device = "cpu"
    if torch.cuda.is_available():
        device = "cuda:0"
        if torch.cuda.device_count() > 1:
            net = nn.DataParallel(net)
    net.to(device)

    

    criterion = nn.CrossEntropyLoss()

    if config['opt'] == 'sgd':
      optimizer = optim.SGD(net.parameters(), lr=learning_rate, 
                        weight_decay=weight_decay,
                        momentum=0, nesterov=False)
    
    elif config['opt'] == 'sgd_nes':
      optimizer = optim.SGD(net.parameters(), lr=learning_rate, 
                  weight_decay=weight_decay,
                  momentum=0, nesterov=False)
      
    elif config['opt'] == 'adagrad':
      optimizer = optim.Adagrad(net.parameters(), lr=learning_rate, 
                      weight_decay=weight_decay)
      
    elif config['opt'] == 'rms':
      optimizer = optim.RMSprop(net.parameters(), lr=learning_rate, 
                      weight_decay=weight_decay, momentum=momentum)
      
    elif config['opt'] == 'adam':
      optimizer = optim.Adam(net.parameters(), lr=learning_rate, 
                      weight_decay=weight_decay)

    #optimizer = optim.SGD(net.parameters(), lr=1e-2)

    # Do not modify any code below!
    loaded_checkpoint = session.get_checkpoint()
    if loaded_checkpoint:
        with loaded_checkpoint.as_directory() as loaded_checkpoint_dir:
            model_state, optimizer_state = torch.load(
                os.path.join(loaded_checkpoint_dir, "checkpoint.pt")
            )
            net.load_state_dict(model_state)
            optimizer.load_state_dict(optimizer_state)

    data_dir = os.path.abspath("./data")
    trainset, testset = load_data(data_dir)

    test_abs = int(len(trainset) * 0.8)
    train_subset, val_subset = random_split(
        trainset, [test_abs, len(trainset) - test_abs]
    )

    trainloader = torch.utils.data.DataLoader(
        train_subset, batch_size=64, shuffle=True, num_workers=8
    )
    valloader = torch.utils.data.DataLoader(
        val_subset, batch_size=64, shuffle=True, num_workers=8
    )

    for epoch in range(10):
        running_loss = 0.0
        epoch_steps = 0
        for i, data in enumerate(trainloader, 0):
            inputs, labels = data
            inputs, labels = inputs.to(device), labels.to(device)

            optimizer.zero_grad()

            outputs = net(inputs)
            loss = criterion(outputs, labels)
            loss.backward()
            optimizer.step()

            running_loss += loss.item()
            epoch_steps += 1
            if i % 2000 == 1999:
                print(
                    f"[{epoch + 1}, {i + 1:>5} loss: {running_loss / epoch_steps:.3f}]"
                )
                running_loss = 0.0

        val_loss = 0.0
        val_steps = 0
        total = 0
        correct = 0
        for i, data in enumerate(valloader, 0):
            with torch.no_grad():
                inputs, labels = data
                inputs, labels = inputs.to(device), labels.to(device)

                outputs = net(inputs)
                _, predicted = torch.max(outputs.data, 1)
                total += labels.size(0)
                correct += (predicted == labels).sum().item()

                loss = criterion(outputs, labels)
                val_loss += loss.cpu().numpy()
                val_steps += 1

        os.makedirs("my_model", exist_ok=True)
        torch.save((net.state_dict(), optimizer.state_dict()), "my_model/checkpoint.pt")
        checkpoint = Checkpoint.from_directory("my_model")
        session.report(
            {"loss": (val_loss / val_steps), "accuracy": correct / total},
            checkpoint=checkpoint,
        )
    print("Finished Training")


## Test set accuracy


In [39]:
def test_best_model(best_result):
    best_trained_model = Net(
     )  # Will need to modify the parameters depending on what you are experimenting with

    # Do not modify any code below!
    device = "cuda:0" if torch.cuda.is_available() else "cpu"
    best_trained_model.to(device)

    checkpoint_path = os.path.join(
        best_result.checkpoint.to_directory(), "checkpoint.pt"
    )

    model_state, optimizer_state = torch.load(checkpoint_path)
    best_trained_model.load_state_dict(model_state)

    trainset, testset = load_data()

    testloader = torch.utils.data.DataLoader(
        testset, batch_size=4, shuffle=False, num_workers=2
    )

    correct = 0
    total = 0
    with torch.no_grad():
        for data in testloader:
            images, labels = data
            images, labels = images.to(device), labels.to(device)
            outputs = best_trained_model(images)
            _, predicted = torch.max(outputs.data, 1)
            total += labels.size(0)
            correct += (predicted == labels).sum().item()

    print(f"Best trial test set accuracy: {correct / total}")


## Configuring the search space


In [40]:
# You will be experimenting with the hyperparameters here
# Use tune.grid_search to specify what values you want to experiment with a hyperparameter
config = {"opt": tune.grid_search(['sgd', 'sgd_nes', 'adagrad', 'rms', 'adam']), 
          "learning_rate": tune.grid_search([6e-2, 4e-2, 2e-2, 1e-2, 5e-3])}



In [41]:
# Do not modify any code below!
def main(config):
    tuner = tune.Tuner(
        tune.with_resources(
            tune.with_parameters(train_cifar),
            resources={"gpu": 1},
        ),
        param_space=config,
    )
    results = tuner.fit()

    best_result = results.get_best_result("accuracy", "max")

    print(f"Best trial config: {best_result.config}")
    print(f"Best trial final validation loss: {best_result.metrics['loss']}")
    print(f"Best trial final validation accuracy: {best_result.metrics['accuracy']}")

    test_best_model(best_result)

    return results.get_dataframe("accuracy", "max")


results_df = main(config)


0,1
Current time:,2023-04-12 08:15:54
Running for:,00:29:06.46
Memory:,9.1/83.5 GiB

Trial name,status,loc,learning_rate,opt,iter,total time (s),loss,accuracy
train_cifar_2dffa_00000,TERMINATED,172.28.0.12:112437,0.06,sgd,10,70.9051,0.937693,0.7525
train_cifar_2dffa_00001,TERMINATED,172.28.0.12:112437,0.04,sgd,10,67.5219,0.861384,0.7679
train_cifar_2dffa_00002,TERMINATED,172.28.0.12:112437,0.02,sgd,10,66.8174,0.859859,0.7536
train_cifar_2dffa_00003,TERMINATED,172.28.0.12:112437,0.01,sgd,10,66.5761,0.830985,0.735
train_cifar_2dffa_00004,TERMINATED,172.28.0.12:112437,0.005,sgd,10,66.9281,0.815518,0.7241
train_cifar_2dffa_00005,TERMINATED,172.28.0.12:112437,0.06,sgd_nes,10,65.6858,0.922352,0.7646
train_cifar_2dffa_00006,TERMINATED,172.28.0.12:112437,0.04,sgd_nes,10,66.1114,0.930633,0.7468
train_cifar_2dffa_00007,TERMINATED,172.28.0.12:112437,0.02,sgd_nes,10,70.0672,1.04738,0.7096
train_cifar_2dffa_00008,TERMINATED,172.28.0.12:112437,0.01,sgd_nes,10,65.3148,0.813094,0.7388
train_cifar_2dffa_00009,TERMINATED,172.28.0.12:112437,0.005,sgd_nes,10,67.5177,0.83487,0.728


[2m[36m(train_cifar pid=112437)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00000_0_learning_rate=0.0600,opt=sgd_2023-04-12_07-46-48/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 32768/170498071 [00:00<18:07, 156707.38it/s]
  0%|          | 65536/170498071 [00:00<18:03, 157263.77it/s]
  0%|          | 98304/170498071 [00:00<18:02, 157411.65it/s]
  0%|          | 229376/170498071 [00:00<08:16, 343010.93it/s]
  0%|          | 458752/170498071 [00:01<04:36, 615531.35it/s]
  1%|          | 917504/170498071 [00:01<02:27, 1152913.31it/s]
  1%|          | 1835008/170498071 [00:01<01:16, 2212238.73it/s]
  2%|▏         | 3702784/170498071 [00:01<00:38, 4340241.19it/s]
  4%|▍         | 6815744/170498071 [00:01<00:21, 7633656.65it/s]
  6%|▌         | 9961472/170498071 [00:02<00:16, 9909368.50it/s]
  8%|▊         | 13074432/170498071 [00:02<00:13, 11434018.66it/s]
 10%|▉         | 16220160/170498071 [00:02<00:12, 12513784.08it/s]
 11%|█▏        | 19333120/170498071 [00:02<00:11, 13266441.10it/s]
 13%|█▎        | 22478848/170498071 [00:02<00:10, 13771285.03it/s]
 15%|█▌        | 25624576/170498071 [00:03<00:10, 

[2m[36m(train_cifar pid=112437)[0m Extracting /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00000_0_learning_rate=0.0600,opt=sgd_2023-04-12_07-46-48/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00000_0_learning_rate=0.0600,opt=sgd_2023-04-12_07-46-48/data
[2m[36m(train_cifar pid=112437)[0m Files already downloaded and verified


Trial name,accuracy,date,done,episodes_total,experiment_id,experiment_tag,hostname,iterations_since_restore,loss,node_ip,pid,should_checkpoint,time_since_restore,time_this_iter_s,time_total_s,timestamp,timesteps_since_restore,timesteps_total,training_iteration,trial_id,warmup_time
train_cifar_2dffa_00000,0.7525,2023-04-12_07-48-02,True,,9df85343eca142f69857be6fefe122b4,"0_learning_rate=0.0600,opt=sgd",ec71ef1e9740,10,0.937693,172.28.0.12,112437,True,70.9051,4.91554,70.9051,1681285682,0,,10,2dffa_00000,0.00400162
train_cifar_2dffa_00001,0.7679,2023-04-12_07-49-10,True,,9df85343eca142f69857be6fefe122b4,"1_learning_rate=0.0400,opt=sgd",ec71ef1e9740,10,0.861384,172.28.0.12,112437,True,67.5219,4.95054,67.5219,1681285750,0,,10,2dffa_00001,0.00400162
train_cifar_2dffa_00002,0.7536,2023-04-12_07-50-17,True,,9df85343eca142f69857be6fefe122b4,"2_learning_rate=0.0200,opt=sgd",ec71ef1e9740,10,0.859859,172.28.0.12,112437,True,66.8174,4.82784,66.8174,1681285817,0,,10,2dffa_00002,0.00400162
train_cifar_2dffa_00003,0.735,2023-04-12_07-51-23,True,,9df85343eca142f69857be6fefe122b4,"3_learning_rate=0.0100,opt=sgd",ec71ef1e9740,10,0.830985,172.28.0.12,112437,True,66.5761,4.79484,66.5761,1681285883,0,,10,2dffa_00003,0.00400162
train_cifar_2dffa_00004,0.7241,2023-04-12_07-52-30,True,,9df85343eca142f69857be6fefe122b4,"4_learning_rate=0.0050,opt=sgd",ec71ef1e9740,10,0.815518,172.28.0.12,112437,True,66.9281,4.68343,66.9281,1681285950,0,,10,2dffa_00004,0.00400162
train_cifar_2dffa_00005,0.7646,2023-04-12_07-53-36,True,,9df85343eca142f69857be6fefe122b4,"5_learning_rate=0.0600,opt=sgd_nes",ec71ef1e9740,10,0.922352,172.28.0.12,112437,True,65.6858,4.66239,65.6858,1681286016,0,,10,2dffa_00005,0.00400162
train_cifar_2dffa_00006,0.7468,2023-04-12_07-54-42,True,,9df85343eca142f69857be6fefe122b4,"6_learning_rate=0.0400,opt=sgd_nes",ec71ef1e9740,10,0.930633,172.28.0.12,112437,True,66.1114,4.75691,66.1114,1681286082,0,,10,2dffa_00006,0.00400162
train_cifar_2dffa_00007,0.7096,2023-04-12_07-55-52,True,,9df85343eca142f69857be6fefe122b4,"7_learning_rate=0.0200,opt=sgd_nes",ec71ef1e9740,10,1.04738,172.28.0.12,112437,True,70.0672,4.77523,70.0672,1681286152,0,,10,2dffa_00007,0.00400162
train_cifar_2dffa_00008,0.7388,2023-04-12_07-56-57,True,,9df85343eca142f69857be6fefe122b4,"8_learning_rate=0.0100,opt=sgd_nes",ec71ef1e9740,10,0.813094,172.28.0.12,112437,True,65.3148,4.75657,65.3148,1681286217,0,,10,2dffa_00008,0.00400162
train_cifar_2dffa_00009,0.728,2023-04-12_07-58-05,True,,9df85343eca142f69857be6fefe122b4,"9_learning_rate=0.0050,opt=sgd_nes",ec71ef1e9740,10,0.83487,172.28.0.12,112437,True,67.5177,4.83101,67.5177,1681286285,0,,10,2dffa_00009,0.00400162


[2m[36m(train_cifar pid=112437)[0m Finished Training
[2m[36m(train_cifar pid=112437)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00001_1_learning_rate=0.0400,opt=sgd_2023-04-12_07-48-02/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 32768/170498071 [00:00<18:04, 157123.91it/s]
  0%|          | 65536/170498071 [00:00<18:03, 157232.71it/s]
  0%|          | 98304/170498071 [00:00<18:01, 157526.29it/s]
  0%|          | 229376/170498071 [00:00<08:15, 343460.69it/s]
  0%|          | 458752/170498071 [00:01<04:35, 616591.98it/s]
  1%|          | 917504/170498071 [00:01<02:26, 1155706.41it/s]
  1%|          | 1835008/170498071 [00:01<01:16, 2217965.72it/s]
  2%|▏         | 3702784/170498071 [00:01<00:38, 4364035.72it/s]
  4%|▍         | 6815744/170498071 [00:01<00:21, 7673758.37it/s]
  6%|▌         | 9961472/170498071 [00:02<00:16, 9950207.83it/s]
  8%|▊         | 13074432/170498071 [00:02<00:13, 11491956.42it/s]
 10%|▉         | 16220160/170498071 [00:02<00:12, 12550703.73it/s]
 11%|█▏        | 19333120/170498071 [00:02<00:11, 13308795.67it/s]
 13%|█▎        | 22478848/170498071 [00:02<00:10, 13826164.18it/s]
 15%|█▌        | 25591808/170498071 [00:03<00:10, 

[2m[36m(train_cifar pid=112437)[0m Extracting /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00001_1_learning_rate=0.0400,opt=sgd_2023-04-12_07-48-02/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00001_1_learning_rate=0.0400,opt=sgd_2023-04-12_07-48-02/data
[2m[36m(train_cifar pid=112437)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=112437)[0m Finished Training
[2m[36m(train_cifar pid=112437)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00002_2_learning_rate=0.0200,opt=sgd_2023-04-12_07-49-10/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 32768/170498071 [00:00<18:39, 152328.62it/s]
  0%|          | 65536/170498071 [00:00<18:28, 153721.38it/s]
  0%|          | 98304/170498071 [00:00<18:07, 156727.11it/s]
  0%|          | 229376/170498071 [00:00<08:22, 338533.59it/s]
  0%|          | 458752/170498071 [00:01<04:39, 607836.43it/s]
  0%|          | 819200/170498071 [00:01<02:23, 1185965.48it/s]
  1%|          | 983040/170498071 [00:01<02:16, 1245980.24it/s]
  1%|          | 1605632/170498071 [00:01<01:10, 2398255.51it/s]
  1%|          | 1933312/170498071 [00:01<01:05, 2569152.14it/s]
  2%|▏         | 3080192/170498071 [00:01<00:34, 4849487.88it/s]
  2%|▏         | 3702784/170498071 [00:01<00:31, 5215306.33it/s]
  3%|▎         | 5799936/170498071 [00:01<00:17, 9580885.39it/s]
  4%|▍         | 6848512/170498071 [00:01<00:18, 8984852.74it/s]
  5%|▌         | 9207808/170498071 [00:02<00:12, 12900604.48it/s]
  6%|▌         | 10616832/170498071 [00:02<00:13, 11608485

[2m[36m(train_cifar pid=112437)[0m Extracting /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00002_2_learning_rate=0.0200,opt=sgd_2023-04-12_07-49-10/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00002_2_learning_rate=0.0200,opt=sgd_2023-04-12_07-49-10/data
[2m[36m(train_cifar pid=112437)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=112437)[0m Finished Training
[2m[36m(train_cifar pid=112437)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00003_3_learning_rate=0.0100,opt=sgd_2023-04-12_07-50-17/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 32768/170498071 [00:00<18:21, 154798.70it/s]
  0%|          | 65536/170498071 [00:00<18:14, 155786.14it/s]
  0%|          | 98304/170498071 [00:00<18:05, 156908.44it/s]
  0%|          | 229376/170498071 [00:00<08:17, 342123.20it/s]
  0%|          | 458752/170498071 [00:01<04:37, 613431.47it/s]
  1%|          | 917504/170498071 [00:01<02:27, 1149792.97it/s]
  1%|          | 1835008/170498071 [00:01<01:16, 2205835.33it/s]
  2%|▏         | 3702784/170498071 [00:01<00:38, 4340532.55it/s]
  4%|▍         | 6455296/170498071 [00:01<00:23, 7077248.42it/s]
  6%|▌         | 9568256/170498071 [00:02<00:16, 9477550.69it/s]
  7%|▋         | 12713984/170498071 [00:02<00:14, 11099811.91it/s]
  9%|▉         | 15826944/170498071 [00:02<00:12, 12309957.63it/s]
 11%|█         | 18972672/170498071 [00:02<00:11, 12971064.84it/s]
 13%|█▎        | 22085632/170498071 [00:02<00:10, 13615090.16it/s]
 15%|█▍        | 25231360/170498071 [00:03<00:10, 

[2m[36m(train_cifar pid=112437)[0m Extracting /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00003_3_learning_rate=0.0100,opt=sgd_2023-04-12_07-50-17/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00003_3_learning_rate=0.0100,opt=sgd_2023-04-12_07-50-17/data
[2m[36m(train_cifar pid=112437)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=112437)[0m Finished Training
[2m[36m(train_cifar pid=112437)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00004_4_learning_rate=0.0050,opt=sgd_2023-04-12_07-51-23/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 32768/170498071 [00:00<18:02, 157439.07it/s]
  0%|          | 65536/170498071 [00:00<18:02, 157455.73it/s]
  0%|          | 98304/170498071 [00:00<18:00, 157663.29it/s]
  0%|          | 229376/170498071 [00:00<08:15, 343399.76it/s]
  0%|          | 458752/170498071 [00:01<04:35, 617205.98it/s]
  1%|          | 917504/170498071 [00:01<02:26, 1156330.34it/s]
  1%|          | 1835008/170498071 [00:01<01:16, 2217882.49it/s]
  2%|▏         | 3702784/170498071 [00:01<00:38, 4365798.63it/s]
  4%|▍         | 6815744/170498071 [00:01<00:21, 7667919.89it/s]
  6%|▌         | 9961472/170498071 [00:02<00:16, 9952951.83it/s]
  8%|▊         | 13074432/170498071 [00:02<00:13, 11498378.15it/s]
 10%|▉         | 16220160/170498071 [00:02<00:12, 12557996.28it/s]
 11%|█▏        | 19365888/170498071 [00:02<00:11, 13306546.09it/s]
 13%|█▎        | 22478848/170498071 [00:02<00:10, 13834581.78it/s]
 15%|█▌        | 25624576/170498071 [00:03<00:10, 

[2m[36m(train_cifar pid=112437)[0m Extracting /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00004_4_learning_rate=0.0050,opt=sgd_2023-04-12_07-51-23/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00004_4_learning_rate=0.0050,opt=sgd_2023-04-12_07-51-23/data
[2m[36m(train_cifar pid=112437)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=112437)[0m Finished Training
[2m[36m(train_cifar pid=112437)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00005_5_learning_rate=0.0600,opt=sgd_nes_2023-04-12_07-52-30/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 32768/170498071 [00:00<18:08, 156569.21it/s]
  0%|          | 65536/170498071 [00:00<18:07, 156783.53it/s]
  0%|          | 98304/170498071 [00:00<18:12, 155942.97it/s]
  0%|          | 229376/170498071 [00:00<08:24, 337430.73it/s]
  0%|          | 458752/170498071 [00:01<04:38, 610501.07it/s]
  0%|          | 819200/170498071 [00:01<02:21, 1195048.83it/s]
  1%|          | 983040/170498071 [00:01<02:17, 1228771.57it/s]
  1%|          | 1769472/170498071 [00:01<01:02, 2721308.19it/s]
  1%|          | 2129920/170498071 [00:01<01:00, 2774159.42it/s]
  2%|▏         | 3670016/170498071 [00:01<00:33, 4953366.01it/s]
  3%|▎         | 5898240/170498071 [00:01<00:18, 8917268.24it/s]
  4%|▍         | 6946816/170498071 [00:01<00:19, 8560473.04it/s]
  6%|▌         | 9437184/170498071 [00:02<00:16, 9995490.92it/s]
  7%|▋         | 11927552/170498071 [00:02<00:12, 13187023.67it/s]
  8%|▊         | 13402112/170498071 [00:02<00:13, 1202808

[2m[36m(train_cifar pid=112437)[0m Extracting /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00005_5_learning_rate=0.0600,opt=sgd_nes_2023-04-12_07-52-30/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00005_5_learning_rate=0.0600,opt=sgd_nes_2023-04-12_07-52-30/data
[2m[36m(train_cifar pid=112437)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=112437)[0m Finished Training
[2m[36m(train_cifar pid=112437)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00006_6_learning_rate=0.0400,opt=sgd_nes_2023-04-12_07-53-36/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 32768/170498071 [00:00<18:08, 156584.72it/s]
  0%|          | 65536/170498071 [00:00<18:09, 156374.60it/s]
  0%|          | 98304/170498071 [00:00<18:04, 157113.76it/s]
  0%|          | 229376/170498071 [00:00<08:17, 342513.17it/s]
  0%|          | 458752/170498071 [00:01<04:36, 614348.28it/s]
  1%|          | 917504/170498071 [00:01<02:28, 1145323.80it/s]
  1%|          | 1835008/170498071 [00:01<01:16, 2206106.98it/s]
  2%|▏         | 3702784/170498071 [00:01<00:38, 4328132.83it/s]
  4%|▍         | 6815744/170498071 [00:01<00:21, 7613796.43it/s]
  6%|▌         | 9961472/170498071 [00:02<00:16, 9865970.34it/s]
  8%|▊         | 13008896/170498071 [00:02<00:11, 13385506.52it/s]
  9%|▊         | 14614528/170498071 [00:02<00:12, 12269619.28it/s]
  9%|▉         | 16187392/170498071 [00:02<00:13, 11853093.31it/s]
 11%|█         | 18317312/170498071 [00:02<00:11, 13798081.71it/s]
 12%|█▏        | 19890176/170498071 [00:02<00:12, 

[2m[36m(train_cifar pid=112437)[0m Extracting /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00006_6_learning_rate=0.0400,opt=sgd_nes_2023-04-12_07-53-36/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00006_6_learning_rate=0.0400,opt=sgd_nes_2023-04-12_07-53-36/data
[2m[36m(train_cifar pid=112437)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=112437)[0m Finished Training
[2m[36m(train_cifar pid=112437)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00007_7_learning_rate=0.0200,opt=sgd_nes_2023-04-12_07-54-42/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 32768/170498071 [00:00<18:35, 152850.40it/s]
  0%|          | 65536/170498071 [00:00<18:23, 154417.62it/s]
  0%|          | 98304/170498071 [00:00<18:03, 157306.22it/s]
  0%|          | 229376/170498071 [00:00<08:20, 340113.87it/s]
  0%|          | 458752/170498071 [00:01<04:38, 611561.20it/s]
  0%|          | 851968/170498071 [00:01<02:15, 1253135.82it/s]
  1%|          | 1048576/170498071 [00:01<02:07, 1327511.23it/s]
  1%|          | 1769472/170498071 [00:01<01:03, 2656104.14it/s]
  1%|          | 2129920/170498071 [00:01<01:04, 2593575.20it/s]
  2%|▏         | 2686976/170498071 [00:01<00:51, 3277586.93it/s]
  2%|▏         | 3080192/170498071 [00:01<00:50, 3321237.79it/s]
  2%|▏         | 3670016/170498071 [00:01<00:46, 3611873.24it/s]
  2%|▏         | 4259840/170498071 [00:01<00:40, 4135006.82it/s]
  3%|▎         | 4718592/170498071 [00:02<00:40, 4104627.13it/s]
  3%|▎         | 5308416/170498071 [00:02<00:36, 4567071.8

[2m[36m(train_cifar pid=112437)[0m Extracting /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00007_7_learning_rate=0.0200,opt=sgd_nes_2023-04-12_07-54-42/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00007_7_learning_rate=0.0200,opt=sgd_nes_2023-04-12_07-54-42/data
[2m[36m(train_cifar pid=112437)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=112437)[0m Finished Training
[2m[36m(train_cifar pid=112437)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00008_8_learning_rate=0.0100,opt=sgd_nes_2023-04-12_07-55-52/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 32768/170498071 [00:00<18:42, 151929.37it/s]
  0%|          | 65536/170498071 [00:00<18:09, 156473.10it/s]
  0%|          | 98304/170498071 [00:00<17:57, 158071.49it/s]
  0%|          | 229376/170498071 [00:00<08:15, 343850.83it/s]
  0%|          | 458752/170498071 [00:01<04:35, 616515.04it/s]
  1%|          | 917504/170498071 [00:01<02:26, 1155680.46it/s]
  1%|          | 1835008/170498071 [00:01<01:16, 2214005.39it/s]
  2%|▏         | 3702784/170498071 [00:01<00:38, 4356754.19it/s]
  4%|▍         | 6815744/170498071 [00:01<00:21, 7654679.08it/s]
  6%|▌         | 9961472/170498071 [00:02<00:16, 9895888.20it/s]
  8%|▊         | 13074432/170498071 [00:02<00:13, 11454241.88it/s]
 10%|▉         | 16220160/170498071 [00:02<00:12, 12481096.80it/s]
 11%|█▏        | 19333120/170498071 [00:02<00:11, 13290082.93it/s]
 13%|█▎        | 22446080/170498071 [00:02<00:10, 13812447.45it/s]
 15%|█▍        | 25395200/170498071 [00:03<00:08, 

[2m[36m(train_cifar pid=112437)[0m Extracting /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00008_8_learning_rate=0.0100,opt=sgd_nes_2023-04-12_07-55-52/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00008_8_learning_rate=0.0100,opt=sgd_nes_2023-04-12_07-55-52/data
[2m[36m(train_cifar pid=112437)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=112437)[0m Finished Training
[2m[36m(train_cifar pid=112437)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00009_9_learning_rate=0.0050,opt=sgd_nes_2023-04-12_07-56-57/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 32768/170498071 [00:00<18:11, 156110.20it/s]
  0%|          | 65536/170498071 [00:00<18:08, 156516.48it/s]
  0%|          | 98304/170498071 [00:00<18:07, 156740.03it/s]
  0%|          | 229376/170498071 [00:00<08:18, 341742.08it/s]
  0%|          | 458752/170498071 [00:01<04:37, 613281.38it/s]
  1%|          | 917504/170498071 [00:01<02:27, 1149369.25it/s]
  1%|          | 1835008/170498071 [00:01<01:16, 2204746.04it/s]
  2%|▏         | 3702784/170498071 [00:01<00:38, 4336479.49it/s]
  4%|▍         | 6815744/170498071 [00:01<00:21, 7626637.48it/s]
  6%|▌         | 9928704/170498071 [00:02<00:16, 9854975.59it/s]
  8%|▊         | 13074432/170498071 [00:02<00:13, 11407739.68it/s]
 10%|▉         | 16220160/170498071 [00:02<00:12, 12489744.15it/s]
 11%|█▏        | 19333120/170498071 [00:02<00:11, 13216503.87it/s]
 13%|█▎        | 22478848/170498071 [00:02<00:10, 13706649.73it/s]
 15%|█▌        | 25624576/170498071 [00:03<00:10, 

[2m[36m(train_cifar pid=112437)[0m Extracting /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00009_9_learning_rate=0.0050,opt=sgd_nes_2023-04-12_07-56-57/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00009_9_learning_rate=0.0050,opt=sgd_nes_2023-04-12_07-56-57/data
[2m[36m(train_cifar pid=112437)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=112437)[0m Finished Training
[2m[36m(train_cifar pid=112437)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00010_10_learning_rate=0.0600,opt=adagrad_2023-04-12_07-58-05/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 32768/170498071 [00:00<18:53, 150371.18it/s]
  0%|          | 65536/170498071 [00:00<18:30, 153540.31it/s]
  0%|          | 98304/170498071 [00:00<18:05, 157049.49it/s]
  0%|          | 229376/170498071 [00:00<08:17, 342502.41it/s]
  0%|          | 458752/170498071 [00:01<04:38, 610751.82it/s]
  0%|          | 851968/170498071 [00:01<02:14, 1258111.36it/s]
  1%|          | 1048576/170498071 [00:01<02:09, 1309391.70it/s]
  1%|          | 1703936/170498071 [00:01<01:08, 2471263.08it/s]
  1%|          | 2064384/170498071 [00:01<01:01, 2735264.97it/s]
  2%|▏         | 3211264/170498071 [00:01<00:33, 4958841.19it/s]
  2%|▏         | 3801088/170498071 [00:01<00:34, 4857364.63it/s]
  3%|▎         | 4718592/170498071 [00:01<00:27, 5986521.23it/s]
  3%|▎         | 5406720/170498071 [00:01<00:26, 6123803.46it/s]
  4%|▎         | 6356992/170498071 [00:02<00:23, 7041353.12it/s]
  4%|▍         | 7110656/170498071 [00:02<00:23, 7023189.8

[2m[36m(train_cifar pid=112437)[0m Extracting /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00010_10_learning_rate=0.0600,opt=adagrad_2023-04-12_07-58-05/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00010_10_learning_rate=0.0600,opt=adagrad_2023-04-12_07-58-05/data
[2m[36m(train_cifar pid=112437)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=112437)[0m Finished Training
[2m[36m(train_cifar pid=112437)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00011_11_learning_rate=0.0400,opt=adagrad_2023-04-12_07-59-20/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 32768/170498071 [00:00<18:03, 157338.68it/s]
  0%|          | 65536/170498071 [00:00<18:03, 157301.92it/s]
  0%|          | 98304/170498071 [00:00<18:03, 157285.65it/s]
  0%|          | 229376/170498071 [00:00<08:15, 343461.41it/s]
  0%|          | 458752/170498071 [00:01<04:36, 616048.34it/s]
  1%|          | 917504/170498071 [00:01<02:26, 1155000.34it/s]
  1%|          | 1835008/170498071 [00:01<01:16, 2215333.17it/s]
  2%|▏         | 3702784/170498071 [00:01<00:38, 4353142.90it/s]
  4%|▍         | 6717440/170498071 [00:01<00:22, 7409877.20it/s]
  6%|▌         | 9764864/170498071 [00:02<00:16, 9560779.29it/s]
  8%|▊         | 12910592/170498071 [00:02<00:14, 11197093.12it/s]
  9%|▉         | 16056320/170498071 [00:02<00:12, 12200496.92it/s]
 11%|█         | 19038208/170498071 [00:02<00:11, 12767821.76it/s]
 13%|█▎        | 22183936/170498071 [00:02<00:11, 13365317.70it/s]
 15%|█▍        | 25329664/170498071 [00:03<00:10, 

[2m[36m(train_cifar pid=112437)[0m Extracting /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00011_11_learning_rate=0.0400,opt=adagrad_2023-04-12_07-59-20/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00011_11_learning_rate=0.0400,opt=adagrad_2023-04-12_07-59-20/data
[2m[36m(train_cifar pid=112437)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=112437)[0m Finished Training
[2m[36m(train_cifar pid=112437)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00012_12_learning_rate=0.0200,opt=adagrad_2023-04-12_08-00-34/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 32768/170498071 [00:00<18:07, 156768.51it/s]
  0%|          | 65536/170498071 [00:00<18:07, 156734.12it/s]
  0%|          | 98304/170498071 [00:00<18:05, 156944.59it/s]
  0%|          | 229376/170498071 [00:00<08:17, 342336.25it/s]
  0%|          | 458752/170498071 [00:01<04:36, 613888.16it/s]
  1%|          | 917504/170498071 [00:01<02:27, 1151718.82it/s]
  1%|          | 1835008/170498071 [00:01<01:16, 2210141.61it/s]
  2%|▏         | 3702784/170498071 [00:01<00:38, 4348204.37it/s]
  4%|▍         | 6815744/170498071 [00:01<00:21, 7644520.80it/s]
  6%|▌         | 9961472/170498071 [00:02<00:16, 9913188.07it/s]
  8%|▊         | 13074432/170498071 [00:02<00:13, 11346604.67it/s]
 10%|▉         | 16220160/170498071 [00:02<00:12, 12384900.79it/s]
 11%|█▏        | 19365888/170498071 [00:02<00:11, 12924831.78it/s]
 13%|█▎        | 22478848/170498071 [00:02<00:10, 13862459.96it/s]
 15%|█▍        | 25559040/170498071 [00:03<00:08, 

[2m[36m(train_cifar pid=112437)[0m Extracting /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00012_12_learning_rate=0.0200,opt=adagrad_2023-04-12_08-00-34/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00012_12_learning_rate=0.0200,opt=adagrad_2023-04-12_08-00-34/data
[2m[36m(train_cifar pid=112437)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=112437)[0m Finished Training
[2m[36m(train_cifar pid=112437)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00013_13_learning_rate=0.0100,opt=adagrad_2023-04-12_08-01-48/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 32768/170498071 [00:00<18:03, 157369.48it/s]
  0%|          | 65536/170498071 [00:00<18:03, 157304.75it/s]
  0%|          | 98304/170498071 [00:00<18:02, 157465.34it/s]
  0%|          | 229376/170498071 [00:00<08:15, 343301.02it/s]
  0%|          | 458752/170498071 [00:01<04:35, 616276.21it/s]
  1%|          | 917504/170498071 [00:01<02:27, 1153603.36it/s]
  1%|          | 1835008/170498071 [00:01<01:16, 2214341.78it/s]
  2%|▏         | 3702784/170498071 [00:01<00:38, 4359709.85it/s]
  4%|▍         | 6815744/170498071 [00:01<00:21, 7661568.73it/s]
  6%|▌         | 9961472/170498071 [00:02<00:16, 9784309.95it/s]
  8%|▊         | 13074432/170498071 [00:02<00:13, 11341667.95it/s]
 10%|▉         | 16220160/170498071 [00:02<00:12, 12397518.95it/s]
 11%|█▏        | 19333120/170498071 [00:02<00:11, 13447178.97it/s]
 13%|█▎        | 22446080/170498071 [00:02<00:10, 13902290.93it/s]
 15%|█▌        | 25591808/170498071 [00:03<00:10, 

[2m[36m(train_cifar pid=112437)[0m Extracting /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00013_13_learning_rate=0.0100,opt=adagrad_2023-04-12_08-01-48/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00013_13_learning_rate=0.0100,opt=adagrad_2023-04-12_08-01-48/data
[2m[36m(train_cifar pid=112437)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=112437)[0m Finished Training
[2m[36m(train_cifar pid=112437)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00014_14_learning_rate=0.0050,opt=adagrad_2023-04-12_08-03-01/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 32768/170498071 [00:00<18:04, 157121.03it/s]
  0%|          | 65536/170498071 [00:00<18:16, 155493.99it/s]
  0%|          | 98304/170498071 [00:00<18:04, 157118.57it/s]
  0%|          | 229376/170498071 [00:00<08:17, 342485.58it/s]
  0%|          | 458752/170498071 [00:01<04:36, 614475.29it/s]
  1%|          | 917504/170498071 [00:01<02:27, 1152628.87it/s]
  1%|          | 1835008/170498071 [00:01<01:16, 2210883.81it/s]
  2%|▏         | 3702784/170498071 [00:01<00:38, 4341660.50it/s]
  4%|▍         | 6815744/170498071 [00:01<00:21, 7646285.31it/s]
  6%|▌         | 9961472/170498071 [00:02<00:16, 9909576.90it/s]
  8%|▊         | 13074432/170498071 [00:02<00:13, 11457606.97it/s]
 10%|▉         | 16220160/170498071 [00:02<00:12, 12502905.33it/s]
 11%|█▏        | 19333120/170498071 [00:02<00:11, 13274204.42it/s]
 13%|█▎        | 22478848/170498071 [00:02<00:10, 13775149.70it/s]
 15%|█▌        | 25624576/170498071 [00:03<00:10, 

[2m[36m(train_cifar pid=112437)[0m Extracting /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00014_14_learning_rate=0.0050,opt=adagrad_2023-04-12_08-03-01/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00014_14_learning_rate=0.0050,opt=adagrad_2023-04-12_08-03-01/data
[2m[36m(train_cifar pid=112437)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=112437)[0m Finished Training
[2m[36m(train_cifar pid=112437)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00015_15_learning_rate=0.0600,opt=rms_2023-04-12_08-04-14/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 32768/170498071 [00:00<18:18, 155200.05it/s]
  0%|          | 65536/170498071 [00:00<18:04, 157140.17it/s]
  0%|          | 98304/170498071 [00:00<18:04, 157192.16it/s]
  0%|          | 229376/170498071 [00:00<08:16, 342646.03it/s]
  0%|          | 458752/170498071 [00:01<04:36, 614795.28it/s]
  1%|          | 917504/170498071 [00:01<02:27, 1152201.45it/s]
  1%|          | 1835008/170498071 [00:01<01:16, 2210145.88it/s]
  2%|▏         | 3702784/170498071 [00:01<00:38, 4348817.62it/s]
  4%|▍         | 6488064/170498071 [00:01<00:22, 7135353.12it/s]
  6%|▌         | 9633792/170498071 [00:02<00:16, 9512447.06it/s]
  7%|▋         | 12713984/170498071 [00:02<00:14, 11027009.11it/s]
  9%|▉         | 15794176/170498071 [00:02<00:12, 12065619.01it/s]
 11%|█         | 18907136/170498071 [00:02<00:11, 12902088.51it/s]
 13%|█▎        | 22052864/170498071 [00:02<00:10, 13531882.31it/s]
 15%|█▍        | 25165824/170498071 [00:03<00:10, 

[2m[36m(train_cifar pid=112437)[0m Extracting /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00015_15_learning_rate=0.0600,opt=rms_2023-04-12_08-04-14/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00015_15_learning_rate=0.0600,opt=rms_2023-04-12_08-04-14/data
[2m[36m(train_cifar pid=112437)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=112437)[0m Finished Training
[2m[36m(train_cifar pid=112437)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00016_16_learning_rate=0.0400,opt=rms_2023-04-12_08-05-24/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 32768/170498071 [00:00<17:59, 157936.78it/s]
  0%|          | 65536/170498071 [00:00<18:01, 157604.28it/s]
  0%|          | 98304/170498071 [00:00<17:58, 157964.98it/s]
  0%|          | 229376/170498071 [00:00<08:14, 344079.43it/s]
  0%|          | 458752/170498071 [00:01<04:35, 618062.15it/s]
  1%|          | 917504/170498071 [00:01<02:26, 1158739.16it/s]
  1%|          | 1835008/170498071 [00:01<01:15, 2222380.23it/s]
  2%|▏         | 3702784/170498071 [00:01<00:38, 4372323.66it/s]
  4%|▍         | 6750208/170498071 [00:01<00:21, 7537777.09it/s]
  6%|▌         | 9797632/170498071 [00:02<00:16, 9661538.89it/s]
  8%|▊         | 12943360/170498071 [00:02<00:14, 11218738.31it/s]
  9%|▉         | 16056320/170498071 [00:02<00:12, 12336504.53it/s]
 11%|█         | 19136512/170498071 [00:02<00:11, 12913716.00it/s]
 13%|█▎        | 22085632/170498071 [00:02<00:11, 13205727.73it/s]
 15%|█▍        | 25100288/170498071 [00:03<00:10, 

[2m[36m(train_cifar pid=112437)[0m Extracting /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00016_16_learning_rate=0.0400,opt=rms_2023-04-12_08-05-24/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00016_16_learning_rate=0.0400,opt=rms_2023-04-12_08-05-24/data
[2m[36m(train_cifar pid=112437)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=112437)[0m Finished Training
[2m[36m(train_cifar pid=112437)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00017_17_learning_rate=0.0200,opt=rms_2023-04-12_08-06-32/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 32768/170498071 [00:00<18:06, 156828.62it/s]
  0%|          | 65536/170498071 [00:00<18:07, 156749.50it/s]
  0%|          | 98304/170498071 [00:00<18:05, 156983.75it/s]
  0%|          | 229376/170498071 [00:00<08:17, 342287.53it/s]
  0%|          | 458752/170498071 [00:01<04:36, 614321.63it/s]
  1%|          | 917504/170498071 [00:01<02:27, 1151416.28it/s]
  1%|          | 1835008/170498071 [00:01<01:16, 2208459.01it/s]
  2%|▏         | 3702784/170498071 [00:01<00:38, 4345551.64it/s]
  4%|▍         | 6815744/170498071 [00:01<00:21, 7634966.09it/s]
  6%|▌         | 9961472/170498071 [00:02<00:16, 9906939.98it/s]
  8%|▊         | 13074432/170498071 [00:02<00:13, 11451845.34it/s]
 10%|▉         | 16220160/170498071 [00:02<00:12, 12505607.29it/s]
 11%|█▏        | 19333120/170498071 [00:02<00:11, 13246394.93it/s]
 13%|█▎        | 22478848/170498071 [00:02<00:10, 13734483.73it/s]
 15%|█▌        | 25591808/170498071 [00:03<00:10, 

[2m[36m(train_cifar pid=112437)[0m Extracting /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00017_17_learning_rate=0.0200,opt=rms_2023-04-12_08-06-32/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00017_17_learning_rate=0.0200,opt=rms_2023-04-12_08-06-32/data
[2m[36m(train_cifar pid=112437)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=112437)[0m Finished Training
[2m[36m(train_cifar pid=112437)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00018_18_learning_rate=0.0100,opt=rms_2023-04-12_08-07-39/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 32768/170498071 [00:00<18:01, 157683.64it/s]
  0%|          | 65536/170498071 [00:00<18:03, 157364.82it/s]
  0%|          | 98304/170498071 [00:00<18:02, 157463.85it/s]
  0%|          | 229376/170498071 [00:00<08:19, 340722.17it/s]
  0%|          | 458752/170498071 [00:01<04:37, 612785.55it/s]
  1%|          | 917504/170498071 [00:01<02:27, 1153192.16it/s]
  1%|          | 1835008/170498071 [00:01<01:16, 2216941.77it/s]
  2%|▏         | 3702784/170498071 [00:01<00:38, 4363654.25it/s]
  4%|▎         | 6324224/170498071 [00:01<00:23, 6930396.96it/s]
  6%|▌         | 9404416/170498071 [00:02<00:17, 9266051.14it/s]
  7%|▋         | 12550144/170498071 [00:02<00:14, 11026435.09it/s]
  9%|▉         | 15630336/170498071 [00:02<00:12, 11994074.81it/s]
 11%|█         | 18776064/170498071 [00:02<00:11, 12903169.06it/s]
 13%|█▎        | 21889024/170498071 [00:02<00:11, 13502291.88it/s]
 15%|█▍        | 25001984/170498071 [00:03<00:10, 

[2m[36m(train_cifar pid=112437)[0m Extracting /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00018_18_learning_rate=0.0100,opt=rms_2023-04-12_08-07-39/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00018_18_learning_rate=0.0100,opt=rms_2023-04-12_08-07-39/data
[2m[36m(train_cifar pid=112437)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=112437)[0m Finished Training
[2m[36m(train_cifar pid=112437)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00019_19_learning_rate=0.0050,opt=rms_2023-04-12_08-08-50/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 32768/170498071 [00:00<18:00, 157794.98it/s]
  0%|          | 65536/170498071 [00:00<18:00, 157671.03it/s]
  0%|          | 98304/170498071 [00:00<18:01, 157487.94it/s]
  0%|          | 229376/170498071 [00:00<08:15, 343832.97it/s]
  0%|          | 458752/170498071 [00:01<04:35, 617420.45it/s]
  1%|          | 917504/170498071 [00:01<02:26, 1157757.67it/s]
  1%|          | 1835008/170498071 [00:01<01:15, 2221398.17it/s]
  2%|▏         | 3702784/170498071 [00:01<00:38, 4372832.01it/s]
  4%|▍         | 6684672/170498071 [00:01<00:21, 7451326.30it/s]
  6%|▌         | 9797632/170498071 [00:02<00:16, 9696957.63it/s]
  8%|▊         | 12877824/170498071 [00:02<00:14, 11107000.92it/s]
  9%|▉         | 15859712/170498071 [00:02<00:12, 12030341.44it/s]
 11%|█         | 19005440/170498071 [00:02<00:11, 12941502.27it/s]
 13%|█▎        | 22020096/170498071 [00:02<00:11, 13223396.07it/s]
 15%|█▍        | 25034752/170498071 [00:03<00:10, 

[2m[36m(train_cifar pid=112437)[0m Extracting /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00019_19_learning_rate=0.0050,opt=rms_2023-04-12_08-08-50/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00019_19_learning_rate=0.0050,opt=rms_2023-04-12_08-08-50/data
[2m[36m(train_cifar pid=112437)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=112437)[0m Finished Training
[2m[36m(train_cifar pid=112437)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00020_20_learning_rate=0.0600,opt=adam_2023-04-12_08-10-00/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 32768/170498071 [00:00<18:33, 153101.04it/s]
  0%|          | 65536/170498071 [00:00<18:24, 154289.78it/s]
  0%|          | 98304/170498071 [00:00<18:07, 156759.89it/s]
  0%|          | 229376/170498071 [00:00<08:16, 342632.74it/s]
  0%|          | 458752/170498071 [00:01<04:35, 616198.63it/s]
  1%|          | 917504/170498071 [00:01<02:26, 1154590.04it/s]
  1%|          | 1835008/170498071 [00:01<01:16, 2214964.20it/s]
  2%|▏         | 3702784/170498071 [00:01<00:38, 4358670.46it/s]
  4%|▍         | 6815744/170498071 [00:01<00:21, 7660425.25it/s]
  6%|▌         | 9928704/170498071 [00:02<00:16, 9761201.28it/s]
  8%|▊         | 13008896/170498071 [00:02<00:14, 11213442.84it/s]
  9%|▉         | 16089088/170498071 [00:02<00:12, 12209671.34it/s]
 11%|█▏        | 19202048/170498071 [00:02<00:11, 13025079.21it/s]
 13%|█▎        | 22347776/170498071 [00:02<00:11, 13456467.83it/s]
 15%|█▍        | 25460736/170498071 [00:03<00:10, 

[2m[36m(train_cifar pid=112437)[0m Extracting /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00020_20_learning_rate=0.0600,opt=adam_2023-04-12_08-10-00/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00020_20_learning_rate=0.0600,opt=adam_2023-04-12_08-10-00/data
[2m[36m(train_cifar pid=112437)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=112437)[0m Finished Training
[2m[36m(train_cifar pid=112437)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00021_21_learning_rate=0.0400,opt=adam_2023-04-12_08-11-09/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 32768/170498071 [00:00<18:43, 151687.41it/s]
  0%|          | 65536/170498071 [00:00<18:28, 153701.48it/s]
  0%|          | 98304/170498071 [00:00<18:05, 156946.15it/s]
  0%|          | 229376/170498071 [00:00<08:16, 342819.96it/s]
  0%|          | 458752/170498071 [00:01<04:35, 616888.59it/s]
  1%|          | 917504/170498071 [00:01<02:26, 1155684.26it/s]
  1%|          | 1835008/170498071 [00:01<01:16, 2216801.53it/s]
  2%|▏         | 3702784/170498071 [00:01<00:38, 4359833.81it/s]
  4%|▍         | 6455296/170498071 [00:01<00:23, 7106348.61it/s]
  6%|▌         | 9568256/170498071 [00:02<00:16, 9512459.32it/s]
  7%|▋         | 12681216/170498071 [00:02<00:14, 11019721.12it/s]
  9%|▉         | 15761408/170498071 [00:02<00:12, 12072510.31it/s]
 11%|█         | 18874368/170498071 [00:02<00:11, 12926890.68it/s]
 13%|█▎        | 21921792/170498071 [00:02<00:11, 13283840.72it/s]
 15%|█▍        | 24936448/170498071 [00:03<00:10, 

[2m[36m(train_cifar pid=112437)[0m Extracting /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00021_21_learning_rate=0.0400,opt=adam_2023-04-12_08-11-09/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00021_21_learning_rate=0.0400,opt=adam_2023-04-12_08-11-09/data
[2m[36m(train_cifar pid=112437)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=112437)[0m Finished Training
[2m[36m(train_cifar pid=112437)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00022_22_learning_rate=0.0200,opt=adam_2023-04-12_08-12-20/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 32768/170498071 [00:00<18:03, 157299.96it/s]
  0%|          | 65536/170498071 [00:00<18:05, 157003.36it/s]
  0%|          | 98304/170498071 [00:00<18:03, 157255.65it/s]
  0%|          | 229376/170498071 [00:00<08:16, 343058.00it/s]
  0%|          | 458752/170498071 [00:01<04:36, 615527.27it/s]
  1%|          | 917504/170498071 [00:01<02:26, 1154065.34it/s]
  1%|          | 1835008/170498071 [00:01<01:16, 2213776.51it/s]
  2%|▏         | 3702784/170498071 [00:01<00:38, 4356857.53it/s]
  4%|▍         | 6815744/170498071 [00:01<00:21, 7659845.71it/s]
  6%|▌         | 9961472/170498071 [00:02<00:16, 9932474.21it/s]
  8%|▊         | 13074432/170498071 [00:02<00:13, 11455954.65it/s]
 10%|▉         | 16220160/170498071 [00:02<00:12, 12534570.03it/s]
 11%|█▏        | 19365888/170498071 [00:02<00:11, 13280730.52it/s]
 13%|█▎        | 22478848/170498071 [00:02<00:10, 13773688.29it/s]
 15%|█▌        | 25624576/170498071 [00:03<00:10, 

[2m[36m(train_cifar pid=112437)[0m Extracting /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00022_22_learning_rate=0.0200,opt=adam_2023-04-12_08-12-20/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00022_22_learning_rate=0.0200,opt=adam_2023-04-12_08-12-20/data
[2m[36m(train_cifar pid=112437)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=112437)[0m Finished Training
[2m[36m(train_cifar pid=112437)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00023_23_learning_rate=0.0100,opt=adam_2023-04-12_08-13-31/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 32768/170498071 [00:00<18:06, 156869.61it/s]
  0%|          | 65536/170498071 [00:00<18:03, 157329.63it/s]
  0%|          | 98304/170498071 [00:00<18:02, 157370.28it/s]
  0%|          | 229376/170498071 [00:00<08:16, 343112.63it/s]
  0%|          | 458752/170498071 [00:01<04:36, 614119.12it/s]
  1%|          | 917504/170498071 [00:01<02:27, 1151888.48it/s]
  1%|          | 1835008/170498071 [00:01<01:16, 2212354.76it/s]
  2%|▏         | 3702784/170498071 [00:01<00:38, 4353575.48it/s]
  4%|▍         | 6782976/170498071 [00:01<00:21, 7535885.87it/s]
  6%|▌         | 9830400/170498071 [00:02<00:16, 9647068.05it/s]
  8%|▊         | 12976128/170498071 [00:02<00:13, 11275957.00it/s]
  9%|▉         | 15958016/170498071 [00:02<00:12, 12022751.90it/s]
 11%|█         | 18972672/170498071 [00:02<00:11, 12673006.70it/s]
 13%|█▎        | 22020096/170498071 [00:02<00:11, 13179021.22it/s]
 15%|█▍        | 25100288/170498071 [00:03<00:10, 

[2m[36m(train_cifar pid=112437)[0m Extracting /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00023_23_learning_rate=0.0100,opt=adam_2023-04-12_08-13-31/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00023_23_learning_rate=0.0100,opt=adam_2023-04-12_08-13-31/data
[2m[36m(train_cifar pid=112437)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=112437)[0m Finished Training
[2m[36m(train_cifar pid=112437)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00024_24_learning_rate=0.0050,opt=adam_2023-04-12_08-14-42/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 32768/170498071 [00:00<18:31, 153431.76it/s]
  0%|          | 65536/170498071 [00:00<18:22, 154552.95it/s]
  0%|          | 98304/170498071 [00:00<18:02, 157423.58it/s]
  0%|          | 229376/170498071 [00:00<08:18, 341293.89it/s]
  0%|          | 458752/170498071 [00:01<04:37, 611904.36it/s]
  0%|          | 851968/170498071 [00:01<02:15, 1253427.34it/s]
  1%|          | 1048576/170498071 [00:01<02:07, 1333925.45it/s]
  1%|          | 1769472/170498071 [00:01<01:03, 2655426.03it/s]
  1%|          | 2129920/170498071 [00:01<01:04, 2591681.90it/s]
  2%|▏         | 2686976/170498071 [00:01<00:51, 3279952.47it/s]
  2%|▏         | 3080192/170498071 [00:01<00:50, 3337983.17it/s]
  2%|▏         | 3637248/170498071 [00:01<00:42, 3881748.43it/s]
  2%|▏         | 4063232/170498071 [00:01<00:42, 3877882.15it/s]
  3%|▎         | 4587520/170498071 [00:02<00:39, 4235508.12it/s]
  3%|▎         | 5079040/170498071 [00:02<00:37, 4359235.4

[2m[36m(train_cifar pid=112437)[0m Extracting /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00024_24_learning_rate=0.0050,opt=adam_2023-04-12_08-14-42/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-12_07-46-48/train_cifar_2dffa_00024_24_learning_rate=0.0050,opt=adam_2023-04-12_08-14-42/data
[2m[36m(train_cifar pid=112437)[0m Files already downloaded and verified


2023-04-12 08:15:54,784	INFO tune.py:798 -- Total run time: 1746.48 seconds (1746.45 seconds for the tuning loop).


[2m[36m(train_cifar pid=112437)[0m Finished Training
Best trial config: {'opt': 'sgd', 'learning_rate': 0.04}
Best trial final validation loss: 0.8613837703018431
Best trial final validation accuracy: 0.7679
Files already downloaded and verified
Files already downloaded and verified
Best trial test set accuracy: 0.7377


In [42]:
final_df = results_df.drop(
    columns=[
        "should_checkpoint",
        "timesteps_total",
        "episodes_total",
        "training_iteration",
        "trial_id",
        "experiment_id",
        "date",
        "timestamp",
        "pid",
        "hostname",
        "node_ip",
        "time_since_restore",
        "timesteps_since_restore",
        "iterations_since_restore",
        "warmup_time",
        "logdir",
    ]
)
final_df.sort_values(by=['accuracy'], ascending=False).head(10)

Unnamed: 0,loss,accuracy,time_this_iter_s,done,time_total_s,config/learning_rate,config/opt
1,0.861384,0.7679,4.950539,False,67.521874,0.04,sgd
5,0.922352,0.7646,4.662392,False,65.685817,0.06,sgd_nes
0,0.790352,0.7626,4.917248,False,61.076888,0.06,sgd
6,0.720641,0.759,4.804915,False,51.770998,0.04,sgd_nes
2,0.859859,0.7536,4.827842,False,66.81744,0.02,sgd
7,0.786104,0.7524,4.701315,False,65.291944,0.02,sgd_nes
3,0.753906,0.751,4.809244,False,61.781293,0.01,sgd
14,0.842639,0.7456,5.38312,False,73.301125,0.005,adagrad
24,0.807828,0.7394,5.030855,False,72.149987,0.005,adam
8,0.813094,0.7388,4.756567,False,65.314794,0.01,sgd_nes


In [43]:
final_df.sort_values(by=['accuracy']).head(10)

Unnamed: 0,loss,accuracy,time_this_iter_s,done,time_total_s,config/learning_rate,config/opt
16,95.911038,0.101,5.029337,False,58.150253,0.04,rms
20,2.563361,0.1019,5.126347,False,48.344251,0.06,adam
15,190.961538,0.104,4.946035,False,64.229026,0.06,rms
17,246.195076,0.1046,22.71291,False,22.71291,0.02,rms
18,2.329547,0.1048,4.909046,False,55.113385,0.01,rms
19,2.148173,0.1922,4.967229,False,50.002054,0.005,rms
10,2.058584,0.3446,5.63182,False,74.970793,0.06,adagrad
21,1.609014,0.4304,5.139658,False,71.336181,0.04,adam
11,1.390852,0.5015,5.671218,False,74.313518,0.04,adagrad
22,1.099801,0.6132,5.139256,False,65.543417,0.02,adam
