## Install Libraries


In [41]:
%pip install ray[tune]
# %pip install bayesian-optimization
#!pip install git+https://github.com/yfw/starter-code
%pip install ray[tune] bayesian-optimization==1.2.0
%pip install hyperopt
%pip install scikit-optimize
# %pip install torch torchvision torchaudio # Uncomment this to install PyTorch 2.0+ on ilab (required version to run this program)

Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/
Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/
Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/
Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/


## Import Libraries


In [42]:
from filelock import FileLock
from ray import tune
from ray.air import session
from ray.air.checkpoint import Checkpoint
from torch.utils.data import random_split



import os
import torch
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as optim
import torchvision
import torchvision.transforms as transforms
from collections import OrderedDict

from ray.tune.schedulers import ASHAScheduler

from ray.tune.search import ConcurrencyLimiter
from ray.tune.search.bayesopt import BayesOptSearch

from hyperopt import hp
from ray.tune.search.hyperopt import HyperOptSearch
from ray.tune.search.skopt import SkOptSearch

## Data loaders


In [43]:
def load_data(data_dir="./data"):
    transform = transforms.Compose(
        [transforms.ToTensor(), transforms.Normalize((0.5, 0.5, 0.5), (0.5, 0.5, 0.5))]
    )

    with FileLock(os.path.expanduser("~/.data.lock")):
        trainset = torchvision.datasets.CIFAR10(
            root=data_dir, train=True, download=True, transform=transform
        )

        testset = torchvision.datasets.CIFAR10(
            root=data_dir, train=False, download=True, transform=transform
        )

    return trainset, testset


## Configurable neural network


In [44]:
def flatten(x, start_dim=1, end_dim=-1):
    return x.flatten(start_dim=start_dim, end_dim=end_dim)


In [45]:
# Will need to modify the parameters and the network depending on what you are experimenting with

C, H, W = 3, 32, 32
num_classes = 10

channel_1 = 32
channel_2 = 64
channel_3 = 128
pool_kernel_size = 2

kernel_size_1 = 3
kernel_size_2 = 5
kernel_size_3 = 7

pad_size_1 = 2
pad_size_2 = 3
pad_size_3 = 3

fc_count_1 = 1024

class Net(nn.Module):
    def __init__(self):
        super(Net, self).__init__()
        self.conv1 = nn.Conv2d(3, channel_1, kernel_size_1, padding=pad_size_1)
        self.norm1 = nn.BatchNorm2d(channel_1)
        self.pool1 = nn.MaxPool2d(pool_kernel_size)
        self.conv2 = nn.Conv2d(channel_1, channel_2, kernel_size_2, padding=pad_size_2)
        self.norm2 = nn.BatchNorm2d(channel_2)
        self.pool2 = nn.MaxPool2d(pool_kernel_size)
        self.conv3 = nn.Conv2d(channel_2, channel_3, kernel_size_3, padding=pad_size_3)
        self.norm3 = nn.BatchNorm2d(channel_3)
        self.pool3 = nn.MaxPool2d(pool_kernel_size)        

        H_after_conv1 = int(H + 2*pad_size_1 - 1*(kernel_size_1-1) - 1 + 1)
        W_after_conv1 = int(W + 2*pad_size_1 - 1*(kernel_size_1-1) - 1 + 1)
        H_after_pool1 = int((H_after_conv1 + 2*0 - 1*(pool_kernel_size-1) - 1) / pool_kernel_size + 1)
        W_after_pool1 = int((W_after_conv1 + 2*0 - 1*(pool_kernel_size-1) - 1) / pool_kernel_size + 1)
        H_after_conv2 = int(H_after_pool1 + 2*pad_size_2 - 1*(kernel_size_2-1) - 1 + 1)
        W_after_conv2 = int(W_after_pool1 + 2*pad_size_2 - 1*(kernel_size_2-1) - 1 + 1)
        H_after_pool2 = int((H_after_conv2 + 2*0 - 1*(pool_kernel_size-1) - 1) / pool_kernel_size + 1)
        W_after_pool2 = int((W_after_conv2 + 2*0 - 1*(pool_kernel_size-1) - 1) / pool_kernel_size + 1)  
        H_after_conv3 = int(H_after_pool2 + 2*pad_size_3 - 1*(kernel_size_3-1) - 1 + 1)
        W_after_conv3 = int(W_after_pool2 + 2*pad_size_3 - 1*(kernel_size_3-1) - 1 + 1)
        H_after_pool3 = int((H_after_conv3 + 2*0 - 1*(pool_kernel_size-1) - 1) / pool_kernel_size + 1)
        W_after_pool3 = int((W_after_conv3 + 2*0 - 1*(pool_kernel_size-1) - 1) / pool_kernel_size + 1)

        self.fc1 = nn.Linear(H_after_pool3*W_after_pool3*channel_3, fc_count_1)
        self.fc2 = nn.Linear(fc_count_1, fc_count_1)
        self.fc3 = nn.Linear(fc_count_1, 10)


    def forward(self, x):
        x = self.conv1(x)
        x = self.norm1(x)
        x = F.relu(x)
        x = self.pool1(x)
        x = self.conv2(x)
        x = self.norm2(x)
        x = F.relu(x)
        x = self.pool2(x)
        x = self.conv3(x)
        x = self.norm3(x)
        x = F.relu(x)
        x = self.pool3(x)
        x = flatten(x)
        x = self.fc1(x)
        #x = F.relu(x)
        x = self.fc2(x)
        #x = F.relu(x)
        x = self.fc3(x)

        return x



## The train function


In [46]:
def train_cifar(config):
    net = Net()  # Will need to modify the parameters depending on what you are experimenting with

    learning_rate = config['learning_rate']
    momentum = config['momentum']
    weight_decay = 0.001

    device = "cpu"
    if torch.cuda.is_available():
        device = "cuda:0"
        if torch.cuda.device_count() > 1:
            net = nn.DataParallel(net)
    net.to(device)

    

    criterion = nn.CrossEntropyLoss()

    optimizer = optim.SGD(net.parameters(), lr=learning_rate, 
                weight_decay=weight_decay,
                momentum=momentum, nesterov=True)    




    # Do not modify any code below!
    loaded_checkpoint = session.get_checkpoint()
    if loaded_checkpoint:
        with loaded_checkpoint.as_directory() as loaded_checkpoint_dir:
            model_state, optimizer_state = torch.load(
                os.path.join(loaded_checkpoint_dir, "checkpoint.pt")
            )
            net.load_state_dict(model_state)
            optimizer.load_state_dict(optimizer_state)

    data_dir = os.path.abspath("./data")
    trainset, testset = load_data(data_dir)

    test_abs = int(len(trainset) * 0.8)
    train_subset, val_subset = random_split(
        trainset, [test_abs, len(trainset) - test_abs]
    )

    trainloader = torch.utils.data.DataLoader(
        train_subset, batch_size=64, shuffle=True, num_workers=8
    )
    valloader = torch.utils.data.DataLoader(
        val_subset, batch_size=64, shuffle=True, num_workers=8
    )

    for epoch in range(10):
        running_loss = 0.0
        epoch_steps = 0
        for i, data in enumerate(trainloader, 0):
            inputs, labels = data
            inputs, labels = inputs.to(device), labels.to(device)

            optimizer.zero_grad()

            outputs = net(inputs)
            loss = criterion(outputs, labels)
            loss.backward()
            optimizer.step()

            running_loss += loss.item()
            epoch_steps += 1
            if i % 2000 == 1999:
                print(
                    f"[{epoch + 1}, {i + 1:>5} loss: {running_loss / epoch_steps:.3f}]"
                )
                running_loss = 0.0

        val_loss = 0.0
        val_steps = 0
        total = 0
        correct = 0
        for i, data in enumerate(valloader, 0):
            with torch.no_grad():
                inputs, labels = data
                inputs, labels = inputs.to(device), labels.to(device)

                outputs = net(inputs)
                _, predicted = torch.max(outputs.data, 1)
                total += labels.size(0)
                correct += (predicted == labels).sum().item()

                loss = criterion(outputs, labels)
                val_loss += loss.cpu().numpy()
                val_steps += 1

        os.makedirs("my_model", exist_ok=True)
        torch.save((net.state_dict(), optimizer.state_dict()), "my_model/checkpoint.pt")
        checkpoint = Checkpoint.from_directory("my_model")
        session.report(
            {"loss": (val_loss / val_steps), "accuracy": correct / total},
            checkpoint=checkpoint,
        )
    print("Finished Training")


## Test set accuracy


In [47]:
def test_best_model(best_result):
    best_trained_model = Net(
     )  # Will need to modify the parameters depending on what you are experimenting with

    # Do not modify any code below!
    device = "cuda:0" if torch.cuda.is_available() else "cpu"
    best_trained_model.to(device)

    checkpoint_path = os.path.join(
        best_result.checkpoint.to_directory(), "checkpoint.pt"
    )

    model_state, optimizer_state = torch.load(checkpoint_path)
    best_trained_model.load_state_dict(model_state)

    trainset, testset = load_data()

    testloader = torch.utils.data.DataLoader(
        testset, batch_size=4, shuffle=False, num_workers=2
    )

    correct = 0
    total = 0
    with torch.no_grad():
        for data in testloader:
            images, labels = data
            images, labels = images.to(device), labels.to(device)
            outputs = best_trained_model(images)
            _, predicted = torch.max(outputs.data, 1)
            total += labels.size(0)
            correct += (predicted == labels).sum().item()

    print(f"Best trial test set accuracy: {correct / total}")


## Configuring the search space


In [48]:
# You will be experimenting with the hyperparameters here
# Use tune.grid_search to specify what values you want to experiment with a hyperparameter
config = { 
          "learning_rate": tune.uniform(1e-3, 1e-1),
          "momentum": tune.uniform(0.1, 0.9),
          }



In [49]:
# Do not modify any code below!
def main(config):

  #hyperopt_search = HyperOptSearch(config, metric="accuracy", mode="max")
  #algo = BayesOptSearch(utility_kwargs={"kind": "ucb", "kappa": 2.5, "xi": 0.0})
  #algo = ConcurrencyLimiter(algo, max_concurrent=4)

  current_best_params = [
    {
        "learning_rate": 0.053306,
        "momentum": 0.570568,
    },
    {
        "learning_rate": 0.028210,
        "momentum": 0.338465,
    },
    {
        "learning_rate": 0.013342,
        "momentum": 0.605203,
    }
  ]

  skopt_search = SkOptSearch(
    metric="accuracy",
    mode="max",
    points_to_evaluate=current_best_params)

  tuner = tune.Tuner(
    tune.with_resources(
      tune.with_parameters(train_cifar),
      resources={"gpu": 1},
    ),
    # tune_config=tune.TuneConfig(
    #   metric="accuracy",
    #   mode="max",
    #   search_alg=algo,
    # ),
    tune_config=tune.TuneConfig(
      num_samples = 30,
      search_alg=skopt_search,
    ),
      param_space=config,
    )
  results = tuner.fit()

  best_result = results.get_best_result("accuracy", "max")

  print(f"Best trial config: {best_result.config}")
  print(f"Best trial final validation loss: {best_result.metrics['loss']}")
  print(f"Best trial final validation accuracy: {best_result.metrics['accuracy']}")

  test_best_model(best_result)

  return results.get_dataframe("accuracy", "max")


results_df = main(config)


0,1
Current time:,2023-04-13 07:59:43
Running for:,00:30:35.48
Memory:,9.1/83.5 GiB

Trial name,status,loc,learning_rate,momentum,iter,total time (s),loss,accuracy
train_cifar_683fcf7c,TERMINATED,172.28.0.12:21616,0.053306,0.570568,10,63.2249,0.930889,0.7446
train_cifar_58540319,TERMINATED,172.28.0.12:21616,0.02821,0.338465,10,59.3073,0.95153,0.736
train_cifar_d060044d,TERMINATED,172.28.0.12:21616,0.013342,0.605203,10,59.8174,0.893706,0.7588
train_cifar_259d1be5,TERMINATED,172.28.0.12:21616,0.086741,0.624554,10,61.4143,,0.1011
train_cifar_055f429e,TERMINATED,172.28.0.12:21616,0.03469,0.503823,10,60.0488,0.842427,0.7594
train_cifar_c4b0e93b,TERMINATED,172.28.0.12:21616,0.0421257,0.16247,10,60.0322,0.825719,0.7616
train_cifar_b85f79ac,TERMINATED,172.28.0.12:21616,0.00825901,0.119263,10,58.8852,0.825457,0.737
train_cifar_63107a09,TERMINATED,172.28.0.12:21616,0.0255391,0.210218,10,62.4969,0.814002,0.756
train_cifar_dc6442a7,TERMINATED,172.28.0.12:21616,0.0733451,0.759311,10,60.5044,,0.1003
train_cifar_47e13a05,TERMINATED,172.28.0.12:21616,0.0962448,0.455211,10,59.2864,,0.0986


[2m[36m(train_cifar pid=21616)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_683fcf7c_1_learning_rate=0.0533,momentum=0.5706_2023-04-13_07-29-08/data/cifar-10-python.tar.gz


[2m[36m(train_cifar pid=21616)[0m   0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 65536/170498071 [00:00<07:53, 360299.99it/s]
  0%|          | 229376/170498071 [00:00<04:11, 675733.28it/s]
  1%|          | 917504/170498071 [00:00<01:21, 2086203.77it/s]
  2%|▏         | 2752512/170498071 [00:00<00:26, 6362875.45it/s]
  3%|▎         | 5570560/170498071 [00:00<00:13, 12317752.66it/s]
  5%|▌         | 8978432/170498071 [00:00<00:08, 18415036.91it/s]
  7%|▋         | 12648448/170498071 [00:00<00:06, 23622808.33it/s]
  9%|▉         | 16056320/170498071 [00:01<00:05, 26641188.39it/s]
 11%|█▏        | 19333120/170498071 [00:01<00:06, 24862389.86it/s]
 14%|█▎        | 23068672/170498071 [00:01<00:05, 28159109.71it/s]
 16%|█▌        | 26574848/170498071 [00:01<00:04, 29304575.71it/s]
 18%|█▊        | 30277632/170498071 [00:01<00:04, 31432131.42it/s]
 20%|█▉        | 33980416/170498071 [00:01<00:04, 33008877.32it/s]
 22%|██▏       | 37552128/170498071 [00:01<00:04, 32945042.35

[2m[36m(train_cifar pid=21616)[0m Extracting /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_683fcf7c_1_learning_rate=0.0533,momentum=0.5706_2023-04-13_07-29-08/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_683fcf7c_1_learning_rate=0.0533,momentum=0.5706_2023-04-13_07-29-08/data
[2m[36m(train_cifar pid=21616)[0m Files already downloaded and verified


Trial name,accuracy,date,done,episodes_total,experiment_id,experiment_tag,hostname,iterations_since_restore,loss,node_ip,pid,should_checkpoint,time_since_restore,time_this_iter_s,time_total_s,timestamp,timesteps_since_restore,timesteps_total,training_iteration,trial_id,warmup_time
train_cifar_055f429e,0.7594,2023-04-13_07-34-15,True,,5a843aadb3794948bfd80fe491aa1888,"5_learning_rate=0.0347,momentum=0.5038",ed1eb21d0f80,10,0.842427,172.28.0.12,21616,True,60.0488,4.96094,60.0488,1681371255,0,,10,055f429e,0.00421739
train_cifar_05fba8d5,0.6613,2023-04-13_07-57-42,True,,5a843aadb3794948bfd80fe491aa1888,"28_learning_rate=0.0010,momentum=0.1000",ed1eb21d0f80,10,0.98104,172.28.0.12,21616,True,61.6278,4.98777,61.6278,1681372662,0,,10,05fba8d5,0.00421739
train_cifar_21a435ff,0.7591,2023-04-13_07-49-24,True,,5a843aadb3794948bfd80fe491aa1888,"20_learning_rate=0.0152,momentum=0.9000",ed1eb21d0f80,10,0.829659,172.28.0.12,21616,True,59.3178,4.96435,59.3178,1681372164,0,,10,21a435ff,0.00421739
train_cifar_22b5e68d,0.6661,2023-04-13_07-56-40,True,,5a843aadb3794948bfd80fe491aa1888,"27_learning_rate=0.0010,momentum=0.1000",ed1eb21d0f80,10,0.957105,172.28.0.12,21616,True,73.4537,4.89127,73.4537,1681372600,0,,10,22b5e68d,0.00421739
train_cifar_259d1be5,0.1011,2023-04-13_07-33-15,True,,5a843aadb3794948bfd80fe491aa1888,"4_learning_rate=0.0867,momentum=0.6246",ed1eb21d0f80,10,,172.28.0.12,21616,True,61.4143,5.01028,61.4143,1681371195,0,,10,259d1be5,0.00421739
train_cifar_26ad1bb6,0.7448,2023-04-13_07-48-25,True,,5a843aadb3794948bfd80fe491aa1888,"19_learning_rate=0.0376,momentum=0.9000",ed1eb21d0f80,10,0.76854,172.28.0.12,21616,True,59.0038,4.93554,59.0038,1681372105,0,,10,26ad1bb6,0.00421739
train_cifar_2c66be32,0.7622,2023-04-13_07-46-25,True,,5a843aadb3794948bfd80fe491aa1888,"17_learning_rate=0.0371,momentum=0.1000",ed1eb21d0f80,10,0.805857,172.28.0.12,21616,True,60.0794,5.0006,60.0794,1681371985,0,,10,2c66be32,0.00421739
train_cifar_32a9852d,0.7589,2023-04-13_07-43-20,True,,5a843aadb3794948bfd80fe491aa1888,"14_learning_rate=0.0186,momentum=0.1000",ed1eb21d0f80,10,0.778791,172.28.0.12,21616,True,62.2223,4.98443,62.2223,1681371800,0,,10,32a9852d,0.00421739
train_cifar_3bd26127,0.7501,2023-04-13_07-50-24,True,,5a843aadb3794948bfd80fe491aa1888,"21_learning_rate=0.0152,momentum=0.9000",ed1eb21d0f80,10,0.891411,172.28.0.12,21616,True,59.1667,5.04606,59.1667,1681372224,0,,10,3bd26127,0.00421739
train_cifar_4613e3c4,0.7371,2023-04-13_07-41-16,True,,5a843aadb3794948bfd80fe491aa1888,"12_learning_rate=0.0479,momentum=0.7562",ed1eb21d0f80,10,0.841592,172.28.0.12,21616,True,59.0522,4.8759,59.0522,1681371676,0,,10,4613e3c4,0.00421739


[2m[36m(train_cifar pid=21616)[0m Finished Training
[2m[36m(train_cifar pid=21616)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_58540319_2_learning_rate=0.0282,momentum=0.3385_2023-04-13_07-30-14/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 65536/170498071 [00:00<07:57, 356916.62it/s]
  0%|          | 229376/170498071 [00:00<04:13, 672090.48it/s]
  0%|          | 688128/170498071 [00:00<01:29, 1899923.71it/s]
  1%|          | 1638400/170498071 [00:00<00:39, 4249262.85it/s]
  2%|▏         | 3702784/170498071 [00:00<00:21, 7625385.45it/s]
  4%|▍         | 7077888/170498071 [00:00<00:11, 14500639.75it/s]
  6%|▋         | 10780672/170498071 [00:00<00:07, 20662230.52it/s]
  8%|▊         | 14319616/170498071 [00:01<00:06, 24107455.00it/s]
 10%|█         | 17596416/170498071 [00:01<00:05, 26500781.41it/s]
 12%|█▏        | 21200896/170498071 [00:01<00:05, 29226309.85it/s]
 15%|█▍        | 24870912/170498071 [00:01<00:04, 31363210.97it/s]
 17%|█▋        | 28344320/170498071 [00:01<00:04, 29458303.35it/s]
 19%|█▊        | 31588352/170498071 [00:01<00:04, 30249293.47it/s]
 20%|██        | 34799616/170498071 [00:01<00:04, 30610986.60it/s]
 22%|██▏       | 37945344/1704980

[2m[36m(train_cifar pid=21616)[0m Extracting /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_58540319_2_learning_rate=0.0282,momentum=0.3385_2023-04-13_07-30-14/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_58540319_2_learning_rate=0.0282,momentum=0.3385_2023-04-13_07-30-14/data
[2m[36m(train_cifar pid=21616)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=21616)[0m Finished Training
[2m[36m(train_cifar pid=21616)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_d060044d_3_learning_rate=0.0133,momentum=0.6052_2023-04-13_07-31-14/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 65536/170498071 [00:00<08:22, 339075.39it/s]
  0%|          | 163840/170498071 [00:00<04:45, 596202.54it/s]
  0%|          | 360448/170498071 [00:00<02:37, 1080743.16it/s]
  0%|          | 720896/170498071 [00:00<01:28, 1921098.45it/s]
  1%|          | 1540096/170498071 [00:00<00:42, 3942502.54it/s]
  2%|▏         | 3080192/170498071 [00:00<00:22, 7554650.76it/s]
  3%|▎         | 5537792/170498071 [00:00<00:12, 12766405.86it/s]
  5%|▍         | 8028160/170498071 [00:00<00:09, 16409882.69it/s]
  6%|▌         | 10551296/170498071 [00:01<00:08, 18989215.41it/s]
  8%|▊         | 13271040/170498071 [00:01<00:07, 21461842.90it/s]
  9%|▉         | 15564800/170498071 [00:01<00:07, 21890789.78it/s]
 11%|█         | 18087936/170498071 [00:01<00:06, 22864189.49it/s]
 12%|█▏        | 20447232/170498071 [00:01<00:06, 23042696.30it/s]
 13%|█▎        | 22970368/170498071 [00:01<00:06, 23688689.02it/s]
 15%|█▍        | 25362432/170498071 [

[2m[36m(train_cifar pid=21616)[0m Extracting /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_d060044d_3_learning_rate=0.0133,momentum=0.6052_2023-04-13_07-31-14/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_d060044d_3_learning_rate=0.0133,momentum=0.6052_2023-04-13_07-31-14/data
[2m[36m(train_cifar pid=21616)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=21616)[0m Finished Training
[2m[36m(train_cifar pid=21616)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_259d1be5_4_learning_rate=0.0867,momentum=0.6246_2023-04-13_07-32-14/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 65536/170498071 [00:00<07:59, 355715.73it/s]
  0%|          | 229376/170498071 [00:00<04:14, 668479.33it/s]
  1%|          | 917504/170498071 [00:00<01:22, 2064891.12it/s]
  1%|▏         | 2523136/170498071 [00:00<00:29, 5717144.39it/s]
  3%|▎         | 5111808/170498071 [00:00<00:14, 11189596.87it/s]
  5%|▌         | 8552448/170498071 [00:00<00:09, 17665110.87it/s]
  7%|▋         | 11993088/170498071 [00:00<00:07, 22412504.74it/s]
  9%|▉         | 15466496/170498071 [00:01<00:05, 25961892.53it/s]
 11%|█         | 18808832/170498071 [00:01<00:05, 28140974.60it/s]
 13%|█▎        | 22315008/170498071 [00:01<00:04, 30161921.70it/s]
 15%|█▍        | 25526272/170498071 [00:01<00:05, 28188320.94it/s]
 17%|█▋        | 28868608/170498071 [00:01<00:04, 29607409.63it/s]
 19%|█▉        | 32571392/170498071 [00:01<00:04, 31704797.28it/s]
 21%|██        | 35848192/170498071 [00:01<00:04, 29430082.30it/s]
 23%|██▎       | 39288832/170498

[2m[36m(train_cifar pid=21616)[0m Extracting /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_259d1be5_4_learning_rate=0.0867,momentum=0.6246_2023-04-13_07-32-14/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_259d1be5_4_learning_rate=0.0867,momentum=0.6246_2023-04-13_07-32-14/data
[2m[36m(train_cifar pid=21616)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=21616)[0m Finished Training
[2m[36m(train_cifar pid=21616)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_055f429e_5_learning_rate=0.0347,momentum=0.5038_2023-04-13_07-33-15/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 65536/170498071 [00:00<08:12, 345881.06it/s]
  0%|          | 229376/170498071 [00:00<04:13, 671491.01it/s]
  0%|          | 622592/170498071 [00:00<01:40, 1685309.48it/s]
  1%|          | 1376256/170498071 [00:00<00:48, 3477529.15it/s]
  2%|▏         | 3309568/170498071 [00:00<00:20, 8312300.32it/s]
  4%|▎         | 6029312/170498071 [00:00<00:11, 14039884.58it/s]
  5%|▌         | 9043968/170498071 [00:00<00:08, 18858236.92it/s]
  7%|▋         | 12353536/170498071 [00:00<00:06, 23068501.69it/s]
  9%|▉         | 15728640/170498071 [00:01<00:05, 26248906.23it/s]
 11%|█▏        | 19202048/170498071 [00:01<00:05, 27093547.84it/s]
 13%|█▎        | 22577152/170498071 [00:01<00:05, 28990782.15it/s]
 15%|█▌        | 25985024/170498071 [00:01<00:04, 30402331.74it/s]
 17%|█▋        | 29327360/170498071 [00:01<00:04, 30686037.90it/s]
 19%|█▉        | 32473088/170498071 [00:01<00:04, 30892888.31it/s]
 21%|██        | 35618816/17049807

[2m[36m(train_cifar pid=21616)[0m Extracting /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_055f429e_5_learning_rate=0.0347,momentum=0.5038_2023-04-13_07-33-15/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_055f429e_5_learning_rate=0.0347,momentum=0.5038_2023-04-13_07-33-15/data
[2m[36m(train_cifar pid=21616)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=21616)[0m Finished Training
[2m[36m(train_cifar pid=21616)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_c4b0e93b_6_learning_rate=0.0421,momentum=0.1625_2023-04-13_07-34-15/data/cifar-10-python.tar.gz


[2m[36m(train_cifar pid=21616)[0m   0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 65536/170498071 [00:00<07:57, 357092.35it/s]
  0%|          | 229376/170498071 [00:00<04:13, 671521.61it/s]
  1%|          | 917504/170498071 [00:00<01:21, 2070325.79it/s]
  1%|▏         | 2293760/170498071 [00:00<00:32, 5128055.97it/s]
  3%|▎         | 4849664/170498071 [00:00<00:15, 10657263.53it/s]
  5%|▍         | 8159232/170498071 [00:00<00:09, 16909358.93it/s]
  7%|▋         | 11698176/170498071 [00:00<00:07, 22160947.70it/s]
  9%|▉         | 15269888/170498071 [00:01<00:05, 26068749.92it/s]
 11%|█         | 18776064/170498071 [00:01<00:06, 25072854.04it/s]
 13%|█▎        | 21921792/170498071 [00:01<00:05, 26732949.80it/s]
 15%|█▍        | 25133056/170498071 [00:01<00:05, 28169362.22it/s]
 17%|█▋        | 28606464/170498071 [00:01<00:04, 30009369.00it/s]
 19%|█▉        | 32112640/170498071 [00:01<00:04, 31407866.55it/s]
 21%|██        | 35749888/170498071 [00:01<00:04, 31500281.28

[2m[36m(train_cifar pid=21616)[0m Extracting /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_c4b0e93b_6_learning_rate=0.0421,momentum=0.1625_2023-04-13_07-34-15/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_c4b0e93b_6_learning_rate=0.0421,momentum=0.1625_2023-04-13_07-34-15/data
[2m[36m(train_cifar pid=21616)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=21616)[0m Finished Training
[2m[36m(train_cifar pid=21616)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_b85f79ac_7_learning_rate=0.0083,momentum=0.1193_2023-04-13_07-35-15/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 65536/170498071 [00:00<07:52, 361027.81it/s]
  0%|          | 229376/170498071 [00:00<04:10, 679328.25it/s]
  1%|          | 917504/170498071 [00:00<01:20, 2099010.78it/s]
  2%|▏         | 2916352/170498071 [00:00<00:24, 6823074.28it/s]
  3%|▎         | 5636096/170498071 [00:00<00:13, 12403721.07it/s]
  5%|▌         | 9273344/170498071 [00:00<00:08, 19134599.93it/s]
  7%|▋         | 12681216/170498071 [00:01<00:07, 20020363.05it/s]
  9%|▉         | 15990784/170498071 [00:01<00:06, 23247260.94it/s]
 12%|█▏        | 19726336/170498071 [00:01<00:05, 27034560.61it/s]
 14%|█▍        | 23461888/170498071 [00:01<00:04, 29880230.58it/s]
 16%|█▌        | 27197440/170498071 [00:01<00:04, 31976913.27it/s]
 18%|█▊        | 30965760/170498071 [00:01<00:04, 33605664.83it/s]
 20%|██        | 34471936/170498071 [00:01<00:04, 31305162.91it/s]
 22%|██▏       | 37715968/170498071 [00:01<00:04, 31092406.93it/s]
 24%|██▍       | 41320448/170498

[2m[36m(train_cifar pid=21616)[0m Extracting /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_b85f79ac_7_learning_rate=0.0083,momentum=0.1193_2023-04-13_07-35-15/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_b85f79ac_7_learning_rate=0.0083,momentum=0.1193_2023-04-13_07-35-15/data
[2m[36m(train_cifar pid=21616)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=21616)[0m Finished Training
[2m[36m(train_cifar pid=21616)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_63107a09_8_learning_rate=0.0255,momentum=0.2102_2023-04-13_07-36-14/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 65536/170498071 [00:00<08:25, 337100.20it/s]
  0%|          | 163840/170498071 [00:00<04:46, 593576.72it/s]
  0%|          | 327680/170498071 [00:00<02:57, 958880.33it/s]
  0%|          | 720896/170498071 [00:00<01:26, 1961133.38it/s]
  1%|          | 1114112/170498071 [00:00<01:06, 2551640.71it/s]
  1%|          | 1605632/170498071 [00:00<00:52, 3240923.87it/s]
  1%|          | 2097152/170498071 [00:00<00:45, 3741001.80it/s]
  2%|▏         | 2654208/170498071 [00:00<00:39, 4225012.77it/s]
  2%|▏         | 3211264/170498071 [00:01<00:36, 4581520.45it/s]
  2%|▏         | 3801088/170498071 [00:01<00:33, 4910271.47it/s]
  3%|▎         | 4423680/170498071 [00:01<00:31, 5278783.70it/s]
  3%|▎         | 5079040/170498071 [00:01<00:29, 5626813.50it/s]
  3%|▎         | 5767168/170498071 [00:01<00:27, 5994961.25it/s]
  4%|▍         | 6520832/170498071 [00:01<00:25, 6403136.98it/s]
  4%|▍         | 7307264/170498071 [00:01<00:24, 673

[2m[36m(train_cifar pid=21616)[0m Extracting /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_63107a09_8_learning_rate=0.0255,momentum=0.2102_2023-04-13_07-36-14/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_63107a09_8_learning_rate=0.0255,momentum=0.2102_2023-04-13_07-36-14/data
[2m[36m(train_cifar pid=21616)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=21616)[0m Finished Training
[2m[36m(train_cifar pid=21616)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_dc6442a7_9_learning_rate=0.0733,momentum=0.7593_2023-04-13_07-37-17/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 65536/170498071 [00:00<07:59, 355597.46it/s]
  0%|          | 131072/170498071 [00:00<05:55, 478744.93it/s]
  0%|          | 360448/170498071 [00:00<02:28, 1141941.53it/s]
  0%|          | 819200/170498071 [00:00<01:12, 2325169.37it/s]
  1%|          | 1671168/170498071 [00:00<00:38, 4369095.50it/s]
  2%|▏         | 3112960/170498071 [00:00<00:22, 7509683.70it/s]
  3%|▎         | 4849664/170498071 [00:00<00:15, 10566107.18it/s]
  4%|▍         | 7045120/170498071 [00:00<00:11, 14061851.34it/s]
  5%|▌         | 9043968/170498071 [00:01<00:10, 15818631.84it/s]
  7%|▋         | 11370496/170498071 [00:01<00:08, 17970223.40it/s]
  8%|▊         | 13664256/170498071 [00:01<00:08, 19460990.22it/s]
  9%|▉         | 16187392/170498071 [00:01<00:07, 21175894.36it/s]
 11%|█         | 18644992/170498071 [00:01<00:06, 22102807.02it/s]
 13%|█▎        | 21397504/170498071 [00:01<00:06, 23640057.69it/s]
 14%|█▍        | 23822336/170498071 [0

[2m[36m(train_cifar pid=21616)[0m Extracting /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_dc6442a7_9_learning_rate=0.0733,momentum=0.7593_2023-04-13_07-37-17/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_dc6442a7_9_learning_rate=0.0733,momentum=0.7593_2023-04-13_07-37-17/data
[2m[36m(train_cifar pid=21616)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=21616)[0m Finished Training
[2m[36m(train_cifar pid=21616)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_47e13a05_10_learning_rate=0.0962,momentum=0.4552_2023-04-13_07-38-17/data/cifar-10-python.tar.gz


[2m[36m(train_cifar pid=21616)[0m   0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 65536/170498071 [00:00<07:58, 356430.67it/s]
  0%|          | 229376/170498071 [00:00<04:14, 669612.11it/s]
  1%|          | 884736/170498071 [00:00<01:07, 2509798.40it/s]
  1%|          | 1835008/170498071 [00:00<00:44, 3778744.67it/s]
  3%|▎         | 4423680/170498071 [00:00<00:17, 9595178.57it/s]
  5%|▍         | 8093696/170498071 [00:00<00:09, 16999305.63it/s]
  7%|▋         | 11403264/170498071 [00:00<00:07, 21499284.11it/s]
  9%|▊         | 14876672/170498071 [00:01<00:06, 25285098.20it/s]
 11%|█         | 18153472/170498071 [00:01<00:05, 27380307.93it/s]
 13%|█▎        | 21495808/170498071 [00:01<00:05, 29146364.03it/s]
 15%|█▍        | 25165824/170498071 [00:01<00:04, 31314017.91it/s]
 17%|█▋        | 28409856/170498071 [00:01<00:04, 28678203.35it/s]
 19%|█▊        | 31686656/170498071 [00:01<00:04, 29769503.16it/s]
 20%|██        | 34865152/170498071 [00:01<00:04, 30036272.45i

[2m[36m(train_cifar pid=21616)[0m Extracting /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_47e13a05_10_learning_rate=0.0962,momentum=0.4552_2023-04-13_07-38-17/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_47e13a05_10_learning_rate=0.0962,momentum=0.4552_2023-04-13_07-38-17/data
[2m[36m(train_cifar pid=21616)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=21616)[0m Finished Training
[2m[36m(train_cifar pid=21616)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_67baef99_11_learning_rate=0.0407,momentum=0.3628_2023-04-13_07-39-17/data/cifar-10-python.tar.gz


[2m[36m(train_cifar pid=21616)[0m   0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 65536/170498071 [00:00<07:55, 358722.47it/s]
  0%|          | 229376/170498071 [00:00<04:12, 675038.64it/s]
  1%|          | 917504/170498071 [00:00<01:21, 2083478.56it/s]
  2%|▏         | 2719744/170498071 [00:00<00:26, 6269886.91it/s]
  3%|▎         | 4685824/170498071 [00:00<00:16, 9923188.58it/s]
  5%|▍         | 7766016/170498071 [00:00<00:10, 15741972.27it/s]
  6%|▋         | 11010048/170498071 [00:00<00:07, 20508164.73it/s]
  8%|▊         | 14254080/170498071 [00:01<00:06, 23949985.40it/s]
 10%|█         | 17760256/170498071 [00:01<00:05, 26645391.27it/s]
 12%|█▏        | 21135360/170498071 [00:01<00:05, 28706840.10it/s]
 14%|█▍        | 24412160/170498071 [00:01<00:04, 29895118.83it/s]
 16%|█▌        | 27557888/170498071 [00:01<00:04, 30247010.39it/s]
 18%|█▊        | 31096832/170498071 [00:01<00:04, 31759478.09it/s]
 20%|██        | 34406400/170498071 [00:01<00:04, 32080982.51i

[2m[36m(train_cifar pid=21616)[0m Extracting /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_67baef99_11_learning_rate=0.0407,momentum=0.3628_2023-04-13_07-39-17/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_67baef99_11_learning_rate=0.0407,momentum=0.3628_2023-04-13_07-39-17/data
[2m[36m(train_cifar pid=21616)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=21616)[0m Finished Training
[2m[36m(train_cifar pid=21616)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_4613e3c4_12_learning_rate=0.0479,momentum=0.7562_2023-04-13_07-40-17/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 65536/170498071 [00:00<07:58, 356438.99it/s]
  0%|          | 229376/170498071 [00:00<04:13, 671303.95it/s]
  1%|          | 917504/170498071 [00:00<01:21, 2073124.74it/s]
  2%|▏         | 2654208/170498071 [00:00<00:27, 6074104.10it/s]
  3%|▎         | 5439488/170498071 [00:00<00:13, 11992324.81it/s]
  5%|▌         | 8749056/170498071 [00:00<00:09, 17884987.48it/s]
  7%|▋         | 12222464/170498071 [00:00<00:06, 22692193.20it/s]
  9%|▉         | 15761408/170498071 [00:01<00:05, 26353296.66it/s]
 11%|█         | 18907136/170498071 [00:01<00:06, 24538420.38it/s]
 13%|█▎        | 22347776/170498071 [00:01<00:05, 27152397.90it/s]
 15%|█▌        | 25657344/170498071 [00:01<00:05, 28738605.67it/s]
 17%|█▋        | 29032448/170498071 [00:01<00:04, 29732889.05it/s]
 19%|█▉        | 32276480/170498071 [00:01<00:04, 30481825.94it/s]
 21%|██        | 35880960/170498071 [00:01<00:04, 32085558.48it/s]
 23%|██▎       | 39485440/170498

[2m[36m(train_cifar pid=21616)[0m Extracting /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_4613e3c4_12_learning_rate=0.0479,momentum=0.7562_2023-04-13_07-40-17/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_4613e3c4_12_learning_rate=0.0479,momentum=0.7562_2023-04-13_07-40-17/data
[2m[36m(train_cifar pid=21616)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=21616)[0m Finished Training
[2m[36m(train_cifar pid=21616)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_7cf2fc52_13_learning_rate=0.0010,momentum=0.9000_2023-04-13_07-41-16/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 65536/170498071 [00:00<08:06, 350264.67it/s]
  0%|          | 229376/170498071 [00:00<04:17, 661032.64it/s]
  0%|          | 753664/170498071 [00:00<01:21, 2082156.40it/s]
  1%|          | 1736704/170498071 [00:00<00:37, 4441329.82it/s]
  2%|▏         | 3506176/170498071 [00:00<00:19, 8464224.12it/s]
  4%|▎         | 6225920/170498071 [00:00<00:11, 14122371.11it/s]
  5%|▌         | 9240576/170498071 [00:00<00:08, 18946309.92it/s]
  7%|▋         | 12648448/170498071 [00:00<00:06, 23483694.36it/s]
  9%|▉         | 15958016/170498071 [00:01<00:05, 26357135.21it/s]
 11%|█▏        | 19267584/170498071 [00:01<00:05, 25485409.55it/s]
 13%|█▎        | 22544384/170498071 [00:01<00:05, 27459045.93it/s]
 15%|█▌        | 25690112/170498071 [00:01<00:05, 28384655.81it/s]
 17%|█▋        | 28803072/170498071 [00:01<00:05, 27838107.09it/s]
 19%|█▊        | 31948800/170498071 [00:01<00:04, 28831075.68it/s]
 21%|██        | 35291136/17049807

[2m[36m(train_cifar pid=21616)[0m Extracting /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_7cf2fc52_13_learning_rate=0.0010,momentum=0.9000_2023-04-13_07-41-16/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_7cf2fc52_13_learning_rate=0.0010,momentum=0.9000_2023-04-13_07-41-16/data
[2m[36m(train_cifar pid=21616)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=21616)[0m Finished Training
[2m[36m(train_cifar pid=21616)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_32a9852d_14_learning_rate=0.0186,momentum=0.1000_2023-04-13_07-42-18/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 65536/170498071 [00:00<08:22, 339023.11it/s]
  0%|          | 163840/170498071 [00:00<04:46, 594726.43it/s]
  0%|          | 327680/170498071 [00:00<02:56, 963731.45it/s]
  0%|          | 688128/170498071 [00:00<01:32, 1835035.32it/s]
  1%|          | 1474560/170498071 [00:00<00:44, 3778682.69it/s]
  1%|▏         | 2195456/170498071 [00:00<00:34, 4841573.27it/s]
  2%|▏         | 3080192/170498071 [00:00<00:27, 6036086.22it/s]
  2%|▏         | 4063232/170498071 [00:00<00:23, 7188979.66it/s]
  3%|▎         | 5111808/170498071 [00:01<00:20, 8140927.76it/s]
  4%|▎         | 6127616/170498071 [00:01<00:18, 8744740.15it/s]
  4%|▍         | 7307264/170498071 [00:01<00:17, 9590926.22it/s]
  5%|▍         | 8519680/170498071 [00:01<00:15, 10332359.79it/s]
  6%|▌         | 9764864/170498071 [00:01<00:14, 10771155.35it/s]
  7%|▋         | 11108352/170498071 [00:01<00:13, 11532181.43it/s]
  7%|▋         | 12484608/170498071 [00:01<00:13

[2m[36m(train_cifar pid=21616)[0m Extracting /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_32a9852d_14_learning_rate=0.0186,momentum=0.1000_2023-04-13_07-42-18/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_32a9852d_14_learning_rate=0.0186,momentum=0.1000_2023-04-13_07-42-18/data
[2m[36m(train_cifar pid=21616)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=21616)[0m Finished Training
[2m[36m(train_cifar pid=21616)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_ff3a23f2_15_learning_rate=0.0191,momentum=0.1000_2023-04-13_07-43-21/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 65536/170498071 [00:00<08:18, 341698.39it/s]
  0%|          | 163840/170498071 [00:00<04:43, 600126.50it/s]
  0%|          | 327680/170498071 [00:00<02:54, 975197.81it/s]
  0%|          | 688128/170498071 [00:00<01:30, 1879022.37it/s]
  1%|          | 1179648/170498071 [00:00<00:59, 2835385.54it/s]
  1%|          | 1736704/170498071 [00:00<00:46, 3643985.18it/s]
  1%|▏         | 2326528/170498071 [00:00<00:39, 4287600.83it/s]
  2%|▏         | 2916352/170498071 [00:00<00:35, 4754666.43it/s]
  2%|▏         | 3538944/170498071 [00:01<00:32, 5159163.46it/s]
  2%|▏         | 4194304/170498071 [00:01<00:29, 5543979.82it/s]
  3%|▎         | 4915200/170498071 [00:01<00:27, 5988188.66it/s]
  3%|▎         | 5668864/170498071 [00:01<00:25, 6377240.67it/s]
  4%|▍         | 6455296/170498071 [00:01<00:24, 6778083.67it/s]
  4%|▍         | 7274496/170498071 [00:01<00:22, 7142570.59it/s]
  5%|▍         | 8159232/170498071 [00:01<00:21, 759

[2m[36m(train_cifar pid=21616)[0m Extracting /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_ff3a23f2_15_learning_rate=0.0191,momentum=0.1000_2023-04-13_07-43-21/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_ff3a23f2_15_learning_rate=0.0191,momentum=0.1000_2023-04-13_07-43-21/data
[2m[36m(train_cifar pid=21616)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=21616)[0m Finished Training
[2m[36m(train_cifar pid=21616)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_a8a3b0e7_16_learning_rate=0.0197,momentum=0.9000_2023-04-13_07-44-23/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 65536/170498071 [00:00<07:58, 356385.38it/s]
  0%|          | 229376/170498071 [00:00<04:13, 671423.76it/s]
  0%|          | 819200/170498071 [00:00<01:13, 2310798.37it/s]
  1%|          | 1835008/170498071 [00:00<00:43, 3838206.24it/s]
  3%|▎         | 4456448/170498071 [00:00<00:17, 9727920.64it/s]
  5%|▍         | 8028160/170498071 [00:00<00:09, 16829766.37it/s]
  7%|▋         | 11403264/170498071 [00:00<00:07, 21570068.24it/s]
  9%|▊         | 14909440/170498071 [00:01<00:06, 25421442.18it/s]
 11%|█         | 18219008/170498071 [00:01<00:05, 27625732.96it/s]
 15%|█▍        | 24903680/170498071 [00:01<00:04, 30644809.71it/s]
 17%|█▋        | 28180480/170498071 [00:01<00:05, 26816600.26it/s]
 19%|█▊        | 31686656/170498071 [00:01<00:04, 29000127.87it/s]
 21%|██        | 35028992/170498071 [00:01<00:04, 30213490.44it/s]
 23%|██▎       | 38567936/170498071 [00:01<00:04, 31656124.41it/s]
 25%|██▍       | 42008576/1704980

[2m[36m(train_cifar pid=21616)[0m Extracting /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_a8a3b0e7_16_learning_rate=0.0197,momentum=0.9000_2023-04-13_07-44-23/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_a8a3b0e7_16_learning_rate=0.0197,momentum=0.9000_2023-04-13_07-44-23/data
[2m[36m(train_cifar pid=21616)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=21616)[0m Finished Training
[2m[36m(train_cifar pid=21616)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_2c66be32_17_learning_rate=0.0371,momentum=0.1000_2023-04-13_07-45-25/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 65536/170498071 [00:00<07:53, 359617.91it/s]
  0%|          | 229376/170498071 [00:00<04:11, 676449.94it/s]
  1%|          | 917504/170498071 [00:00<01:21, 2089446.78it/s]
  2%|▏         | 2850816/170498071 [00:00<00:25, 6630098.56it/s]
  3%|▎         | 5701632/170498071 [00:00<00:13, 12608427.05it/s]
  5%|▌         | 9371648/170498071 [00:00<00:08, 19358892.57it/s]
  8%|▊         | 13074432/170498071 [00:01<00:07, 20970729.72it/s]
 10%|▉         | 16547840/170498071 [00:01<00:06, 24470333.72it/s]
 12%|█▏        | 19922944/170498071 [00:01<00:05, 26962939.35it/s]
 14%|█▎        | 23298048/170498071 [00:01<00:05, 28849098.90it/s]
 16%|█▌        | 27033600/170498071 [00:01<00:04, 31253411.84it/s]
 18%|█▊        | 30769152/170498071 [00:01<00:04, 32992065.06it/s]
 20%|██        | 34406400/170498071 [00:01<00:04, 33973232.97it/s]
 22%|██▏       | 37879808/170498071 [00:01<00:04, 31604288.25it/s]
 24%|██▍       | 41287680/170498

[2m[36m(train_cifar pid=21616)[0m Extracting /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_2c66be32_17_learning_rate=0.0371,momentum=0.1000_2023-04-13_07-45-25/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_2c66be32_17_learning_rate=0.0371,momentum=0.1000_2023-04-13_07-45-25/data
[2m[36m(train_cifar pid=21616)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=21616)[0m Finished Training
[2m[36m(train_cifar pid=21616)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_e2fce1b7_18_learning_rate=0.0372,momentum=0.1000_2023-04-13_07-46-26/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 65536/170498071 [00:00<08:18, 342071.32it/s]
  0%|          | 163840/170498071 [00:00<04:40, 608262.17it/s]
  0%|          | 425984/170498071 [00:00<02:05, 1360193.79it/s]
  1%|          | 917504/170498071 [00:00<01:18, 2149555.01it/s]
  1%|▏         | 2359296/170498071 [00:00<00:29, 5726540.97it/s]
  5%|▌         | 8781824/170498071 [00:00<00:08, 19298586.74it/s]
  7%|▋         | 12353536/170498071 [00:00<00:06, 24169701.11it/s]
  9%|▉         | 15958016/170498071 [00:01<00:05, 27701231.96it/s]
 11%|█▏        | 19365888/170498071 [00:01<00:05, 25921759.97it/s]
 13%|█▎        | 22577152/170498071 [00:01<00:05, 27561126.62it/s]
 15%|█▌        | 25853952/170498071 [00:01<00:04, 29004382.70it/s]
 17%|█▋        | 29130752/170498071 [00:01<00:04, 29984144.77it/s]
 19%|█▉        | 32342016/170498071 [00:01<00:04, 30567520.29it/s]
 21%|██        | 35586048/170498071 [00:01<00:04, 31038865.27it/s]
 23%|██▎       | 39124992/17049807

[2m[36m(train_cifar pid=21616)[0m Extracting /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_e2fce1b7_18_learning_rate=0.0372,momentum=0.1000_2023-04-13_07-46-26/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_e2fce1b7_18_learning_rate=0.0372,momentum=0.1000_2023-04-13_07-46-26/data
[2m[36m(train_cifar pid=21616)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=21616)[0m Finished Training
[2m[36m(train_cifar pid=21616)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_26ad1bb6_19_learning_rate=0.0376,momentum=0.9000_2023-04-13_07-47-26/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 65536/170498071 [00:00<08:13, 345254.61it/s]
  0%|          | 229376/170498071 [00:00<04:11, 677208.06it/s]
  0%|          | 622592/170498071 [00:00<01:40, 1693624.11it/s]
  1%|          | 1376256/170498071 [00:00<00:48, 3474677.01it/s]
  2%|▏         | 3047424/170498071 [00:00<00:22, 7502800.81it/s]
  3%|▎         | 5865472/170498071 [00:00<00:11, 13733169.24it/s]
  5%|▌         | 8945664/170498071 [00:00<00:08, 18845609.82it/s]
  7%|▋         | 12517376/170498071 [00:00<00:06, 23866770.80it/s]
  9%|▉         | 15958016/170498071 [00:01<00:05, 27024132.23it/s]
 11%|█▏        | 19202048/170498071 [00:01<00:05, 26912262.07it/s]
 13%|█▎        | 22511616/170498071 [00:01<00:05, 28686597.74it/s]
 15%|█▌        | 25886720/170498071 [00:01<00:05, 28849056.30it/s]
 17%|█▋        | 29458432/170498071 [00:01<00:04, 30735068.81it/s]
 19%|█▉        | 33161216/170498071 [00:01<00:04, 32494082.15it/s]
 21%|██▏       | 36470784/17049807

[2m[36m(train_cifar pid=21616)[0m Extracting /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_26ad1bb6_19_learning_rate=0.0376,momentum=0.9000_2023-04-13_07-47-26/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_26ad1bb6_19_learning_rate=0.0376,momentum=0.9000_2023-04-13_07-47-26/data
[2m[36m(train_cifar pid=21616)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=21616)[0m Finished Training
[2m[36m(train_cifar pid=21616)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_21a435ff_20_learning_rate=0.0152,momentum=0.9000_2023-04-13_07-48-25/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 65536/170498071 [00:00<08:01, 354014.25it/s]
  0%|          | 229376/170498071 [00:00<04:15, 665794.17it/s]
  1%|          | 917504/170498071 [00:00<01:22, 2055952.10it/s]
  1%|▏         | 2490368/170498071 [00:00<00:29, 5611067.91it/s]
  3%|▎         | 5341184/170498071 [00:00<00:13, 11807789.44it/s]
  5%|▌         | 8912896/170498071 [00:00<00:08, 18475567.36it/s]
  7%|▋         | 12517376/170498071 [00:00<00:06, 23424502.90it/s]
  9%|▉         | 15892480/170498071 [00:01<00:05, 26381636.95it/s]
 11%|█▏        | 19365888/170498071 [00:01<00:06, 25075476.01it/s]
 14%|█▎        | 23134208/170498071 [00:01<00:05, 28426627.17it/s]
 16%|█▌        | 26476544/170498071 [00:01<00:04, 29650964.24it/s]
 17%|█▋        | 29687808/170498071 [00:01<00:04, 29976813.84it/s]
 19%|█▉        | 32800768/170498071 [00:01<00:04, 30031549.88it/s]
 21%|██▏       | 36339712/170498071 [00:01<00:04, 31561900.43it/s]
 23%|██▎       | 39878656/170498

[2m[36m(train_cifar pid=21616)[0m Extracting /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_21a435ff_20_learning_rate=0.0152,momentum=0.9000_2023-04-13_07-48-25/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_21a435ff_20_learning_rate=0.0152,momentum=0.9000_2023-04-13_07-48-25/data
[2m[36m(train_cifar pid=21616)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=21616)[0m Finished Training
[2m[36m(train_cifar pid=21616)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_3bd26127_21_learning_rate=0.0152,momentum=0.9000_2023-04-13_07-49-25/data/cifar-10-python.tar.gz


[2m[36m(train_cifar pid=21616)[0m   0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 65536/170498071 [00:00<07:55, 358460.03it/s]
  0%|          | 229376/170498071 [00:00<04:12, 674741.57it/s]
  1%|          | 917504/170498071 [00:00<01:21, 2085450.60it/s]
  2%|▏         | 2686976/170498071 [00:00<00:27, 6188469.80it/s]
  3%|▎         | 5046272/170498071 [00:00<00:15, 10940101.52it/s]
  5%|▌         | 8683520/170498071 [00:00<00:08, 18067313.97it/s]
  7%|▋         | 11960320/170498071 [00:00<00:07, 22249900.67it/s]
  9%|▉         | 15335424/170498071 [00:01<00:06, 25521124.61it/s]
 11%|█         | 19005440/170498071 [00:01<00:05, 28769947.42it/s]
 13%|█▎        | 22347776/170498071 [00:01<00:05, 27564727.31it/s]
 15%|█▌        | 25788416/170498071 [00:01<00:04, 29417070.37it/s]
 17%|█▋        | 29327360/170498071 [00:01<00:04, 30819051.24it/s]
 19%|█▉        | 32571392/170498071 [00:01<00:04, 30334561.58it/s]
 21%|██        | 35749888/170498071 [00:01<00:04, 30507461.53

[2m[36m(train_cifar pid=21616)[0m Extracting /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_3bd26127_21_learning_rate=0.0152,momentum=0.9000_2023-04-13_07-49-25/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_3bd26127_21_learning_rate=0.0152,momentum=0.9000_2023-04-13_07-49-25/data
[2m[36m(train_cifar pid=21616)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=21616)[0m Finished Training
[2m[36m(train_cifar pid=21616)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_d403f6bf_22_learning_rate=0.0507,momentum=0.1000_2023-04-13_07-50-25/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 65536/170498071 [00:00<08:00, 354988.52it/s]
  0%|          | 229376/170498071 [00:00<04:13, 670803.94it/s]
  0%|          | 786432/170498071 [00:00<01:16, 2206426.64it/s]
  1%|          | 1572864/170498071 [00:00<00:53, 3186503.22it/s]
  2%|▏         | 3768320/170498071 [00:00<00:20, 8104821.60it/s]
  4%|▍         | 7274496/170498071 [00:00<00:10, 15443808.07it/s]
  6%|▌         | 10518528/170498071 [00:00<00:07, 20200600.35it/s]
  8%|▊         | 13893632/170498071 [00:01<00:06, 23321502.36it/s]
 10%|█         | 17203200/170498071 [00:01<00:05, 26060922.80it/s]
 12%|█▏        | 20774912/170498071 [00:01<00:05, 28823967.74it/s]
 14%|█▍        | 24215552/170498071 [00:01<00:04, 29808766.48it/s]
 16%|█▌        | 27459584/170498071 [00:01<00:05, 27742540.71it/s]
 18%|█▊        | 30965760/170498071 [00:01<00:04, 29532408.10it/s]
 20%|██        | 34275328/170498071 [00:01<00:04, 30525015.24it/s]
 22%|██▏       | 37912576/1704980

[2m[36m(train_cifar pid=21616)[0m Extracting /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_d403f6bf_22_learning_rate=0.0507,momentum=0.1000_2023-04-13_07-50-25/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_d403f6bf_22_learning_rate=0.0507,momentum=0.1000_2023-04-13_07-50-25/data
[2m[36m(train_cifar pid=21616)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=21616)[0m Finished Training
[2m[36m(train_cifar pid=21616)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_baecb875_23_learning_rate=0.0506,momentum=0.1000_2023-04-13_07-51-25/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 65536/170498071 [00:00<07:53, 359632.97it/s]
  0%|          | 229376/170498071 [00:00<04:11, 677254.84it/s]
  0%|          | 557056/170498071 [00:00<01:54, 1486842.90it/s]
  1%|          | 1146880/170498071 [00:00<00:59, 2831018.91it/s]
  1%|▏         | 2523136/170498071 [00:00<00:27, 6143003.40it/s]
  2%|▏         | 4128768/170498071 [00:00<00:18, 9102779.01it/s]
  4%|▎         | 6062080/170498071 [00:00<00:13, 12161160.30it/s]
  5%|▍         | 8126464/170498071 [00:00<00:11, 14576434.49it/s]
  6%|▌         | 10256384/170498071 [00:01<00:09, 16551020.20it/s]
  7%|▋         | 12484608/170498071 [00:01<00:08, 18258204.77it/s]
  9%|▊         | 14778368/170498071 [00:01<00:07, 19622525.12it/s]
 10%|█         | 17268736/170498071 [00:01<00:07, 21102669.22it/s]
 12%|█▏        | 19824640/170498071 [00:01<00:06, 22423421.33it/s]
 13%|█▎        | 22347776/170498071 [00:01<00:06, 23152542.08it/s]
 15%|█▍        | 24739840/170498071 

[2m[36m(train_cifar pid=21616)[0m Extracting /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_baecb875_23_learning_rate=0.0506,momentum=0.1000_2023-04-13_07-51-25/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_baecb875_23_learning_rate=0.0506,momentum=0.1000_2023-04-13_07-51-25/data
[2m[36m(train_cifar pid=21616)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=21616)[0m Finished Training
[2m[36m(train_cifar pid=21616)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_b7486034_24_learning_rate=0.0336,momentum=0.1000_2023-04-13_07-52-26/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 65536/170498071 [00:00<08:11, 346966.87it/s]
  0%|          | 229376/170498071 [00:00<04:17, 660696.35it/s]
  0%|          | 819200/170498071 [00:00<01:14, 2284016.82it/s]
  1%|          | 1835008/170498071 [00:00<00:44, 3804153.92it/s]
  2%|▏         | 4161536/170498071 [00:00<00:18, 8899094.86it/s]
  4%|▍         | 7307264/170498071 [00:00<00:10, 15032311.53it/s]
  6%|▌         | 10649600/170498071 [00:00<00:07, 20172464.73it/s]
  8%|▊         | 13795328/170498071 [00:01<00:06, 23388870.94it/s]
 10%|▉         | 16973824/170498071 [00:01<00:05, 25743996.68it/s]
 12%|█▏        | 20512768/170498071 [00:01<00:05, 28532193.64it/s]
 14%|█▍        | 23592960/170498071 [00:01<00:05, 28644730.44it/s]
 16%|█▌        | 26902528/170498071 [00:01<00:04, 29912014.70it/s]
 18%|█▊        | 30015488/170498071 [00:01<00:04, 30177190.84it/s]
 20%|█▉        | 33390592/170498071 [00:01<00:04, 31203924.59it/s]
 21%|██▏       | 36569088/1704980

[2m[36m(train_cifar pid=21616)[0m Extracting /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_b7486034_24_learning_rate=0.0336,momentum=0.1000_2023-04-13_07-52-26/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_b7486034_24_learning_rate=0.0336,momentum=0.1000_2023-04-13_07-52-26/data
[2m[36m(train_cifar pid=21616)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=21616)[0m Finished Training
[2m[36m(train_cifar pid=21616)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_b6a41d6d_25_learning_rate=0.0337,momentum=0.1000_2023-04-13_07-53-26/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 65536/170498071 [00:00<07:58, 356105.59it/s]
  0%|          | 229376/170498071 [00:00<04:14, 669776.39it/s]
  1%|          | 917504/170498071 [00:00<01:21, 2069205.03it/s]
  1%|▏         | 2555904/170498071 [00:00<00:28, 5811853.98it/s]
  3%|▎         | 5308416/170498071 [00:00<00:14, 11712308.08it/s]
  5%|▌         | 8978432/170498071 [00:00<00:08, 18701787.75it/s]
  7%|▋         | 11796480/170498071 [00:00<00:07, 21363549.91it/s]
  9%|▉         | 15237120/170498071 [00:01<00:06, 24858366.82it/s]
 11%|█         | 18710528/170498071 [00:01<00:05, 27667578.84it/s]
 13%|█▎        | 22216704/170498071 [00:01<00:04, 29820328.28it/s]
 15%|█▍        | 25395200/170498071 [00:01<00:05, 28123249.42it/s]
 17%|█▋        | 28803072/170498071 [00:01<00:04, 29756446.64it/s]
 19%|█▉        | 32178176/170498071 [00:01<00:04, 30843364.53it/s]
 21%|██        | 35422208/170498071 [00:01<00:04, 31268534.97it/s]
 23%|██▎       | 38699008/170498

[2m[36m(train_cifar pid=21616)[0m Extracting /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_b6a41d6d_25_learning_rate=0.0337,momentum=0.1000_2023-04-13_07-53-26/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_b6a41d6d_25_learning_rate=0.0337,momentum=0.1000_2023-04-13_07-53-26/data
[2m[36m(train_cifar pid=21616)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=21616)[0m Finished Training
[2m[36m(train_cifar pid=21616)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_78545bd2_26_learning_rate=0.0227,momentum=0.9000_2023-04-13_07-54-27/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 65536/170498071 [00:00<08:16, 343610.27it/s]
  0%|          | 163840/170498071 [00:00<04:35, 617385.32it/s]
  0%|          | 458752/170498071 [00:00<02:23, 1188038.77it/s]
  1%|          | 1277952/170498071 [00:00<00:51, 3284984.30it/s]
  2%|▏         | 3178496/170498071 [00:00<00:20, 7992343.60it/s]
  4%|▍         | 6488064/170498071 [00:00<00:10, 15503337.94it/s]
  6%|▌         | 9961472/170498071 [00:00<00:08, 18079498.62it/s]
  8%|▊         | 13500416/170498071 [00:01<00:06, 22602183.56it/s]
 10%|▉         | 16875520/170498071 [00:01<00:06, 25596781.13it/s]
 12%|█▏        | 20545536/170498071 [00:01<00:05, 28705879.16it/s]
 14%|█▍        | 24248320/170498071 [00:01<00:04, 31089798.83it/s]
 16%|█▋        | 27852800/170498071 [00:01<00:04, 32501972.31it/s]
 18%|█▊        | 31457280/170498071 [00:01<00:04, 33533809.38it/s]
 20%|██        | 34897920/170498071 [00:01<00:04, 31142023.97it/s]
 22%|██▏       | 38273024/17049807

[2m[36m(train_cifar pid=21616)[0m Extracting /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_78545bd2_26_learning_rate=0.0227,momentum=0.9000_2023-04-13_07-54-27/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_78545bd2_26_learning_rate=0.0227,momentum=0.9000_2023-04-13_07-54-27/data
[2m[36m(train_cifar pid=21616)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=21616)[0m Finished Training
[2m[36m(train_cifar pid=21616)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_22b5e68d_27_learning_rate=0.0010,momentum=0.1000_2023-04-13_07-55-26/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 65536/170498071 [00:00<08:11, 346911.25it/s]
  0%|          | 163840/170498071 [00:00<04:34, 620458.40it/s]
  0%|          | 327680/170498071 [00:00<02:49, 1001819.52it/s]
  0%|          | 655360/170498071 [00:00<01:35, 1787697.72it/s]
  1%|          | 1212416/170498071 [00:00<00:55, 3031363.31it/s]
  1%|          | 1933312/170498071 [00:00<00:38, 4333326.06it/s]
  2%|▏         | 2686976/170498071 [00:00<00:31, 5281321.85it/s]
  2%|▏         | 3407872/170498071 [00:00<00:28, 5866045.16it/s]
  2%|▏         | 4128768/170498071 [00:01<00:26, 6261122.17it/s]
  3%|▎         | 4882432/170498071 [00:01<00:25, 6584524.87it/s]
  3%|▎         | 5603328/170498071 [00:01<00:24, 6752176.75it/s]
  4%|▎         | 6356992/170498071 [00:01<00:23, 6918397.75it/s]
  4%|▍         | 7110656/170498071 [00:01<00:23, 7069100.80it/s]
  5%|▍         | 7897088/170498071 [00:01<00:22, 7223445.69it/s]
  5%|▌         | 8650752/170498071 [00:01<00:22, 72

[2m[36m(train_cifar pid=21616)[0m Extracting /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_22b5e68d_27_learning_rate=0.0010,momentum=0.1000_2023-04-13_07-55-26/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_22b5e68d_27_learning_rate=0.0010,momentum=0.1000_2023-04-13_07-55-26/data
[2m[36m(train_cifar pid=21616)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=21616)[0m Finished Training
[2m[36m(train_cifar pid=21616)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_05fba8d5_28_learning_rate=0.0010,momentum=0.1000_2023-04-13_07-56-40/data/cifar-10-python.tar.gz


  0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 65536/170498071 [00:00<08:18, 342212.28it/s]
  0%|          | 229376/170498071 [00:00<04:13, 670627.34it/s]
  0%|          | 524288/170498071 [00:00<02:04, 1370590.80it/s]
  1%|          | 1245184/170498071 [00:00<00:53, 3153455.20it/s]
  1%|▏         | 2424832/170498071 [00:00<00:29, 5779274.51it/s]
  3%|▎         | 4751360/170498071 [00:00<00:14, 11067030.60it/s]
  4%|▍         | 7503872/170498071 [00:00<00:10, 15982862.87it/s]
  6%|▌         | 9994240/170498071 [00:00<00:08, 18623156.27it/s]
  7%|▋         | 12779520/170498071 [00:01<00:07, 21368939.96it/s]
  9%|▉         | 15794176/170498071 [00:01<00:06, 23985752.00it/s]
 11%|█         | 18939904/170498071 [00:01<00:05, 26205686.54it/s]
 13%|█▎        | 22282240/170498071 [00:01<00:05, 28341849.41it/s]
 15%|█▍        | 25362432/170498071 [00:01<00:04, 29054011.03it/s]
 17%|█▋        | 28835840/170498071 [00:01<00:04, 30747913.89it/s]
 19%|█▊        | 31948800/170498071

[2m[36m(train_cifar pid=21616)[0m Extracting /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_05fba8d5_28_learning_rate=0.0010,momentum=0.1000_2023-04-13_07-56-40/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_05fba8d5_28_learning_rate=0.0010,momentum=0.1000_2023-04-13_07-56-40/data
[2m[36m(train_cifar pid=21616)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=21616)[0m Finished Training
[2m[36m(train_cifar pid=21616)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_49d6b556_29_learning_rate=0.0077,momentum=0.9000_2023-04-13_07-57-42/data/cifar-10-python.tar.gz


[2m[36m(train_cifar pid=21616)[0m   0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 65536/170498071 [00:00<08:04, 351791.94it/s]
  0%|          | 229376/170498071 [00:00<04:20, 654220.28it/s]
  0%|          | 622592/170498071 [00:00<01:42, 1662748.40it/s]
  1%|          | 1572864/170498071 [00:00<00:41, 4054615.84it/s]
  2%|▏         | 2588672/170498071 [00:00<00:28, 5896444.92it/s]
  3%|▎         | 5275648/170498071 [00:00<00:13, 12208023.76it/s]
  5%|▌         | 8683520/170498071 [00:00<00:08, 18776701.85it/s]
  7%|▋         | 11993088/170498071 [00:00<00:06, 23068419.98it/s]
  9%|▉         | 15368192/170498071 [00:01<00:05, 26237301.86it/s]
 11%|█         | 18743296/170498071 [00:01<00:05, 28470315.67it/s]
 13%|█▎        | 22249472/170498071 [00:01<00:04, 30436532.57it/s]
 15%|█▍        | 25395200/170498071 [00:01<00:04, 29367456.46it/s]
 17%|█▋        | 28704768/170498071 [00:01<00:04, 30295766.54it/s]
 19%|█▊        | 31883264/170498071 [00:01<00:04, 30648690.37it

[2m[36m(train_cifar pid=21616)[0m Extracting /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_49d6b556_29_learning_rate=0.0077,momentum=0.9000_2023-04-13_07-57-42/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_49d6b556_29_learning_rate=0.0077,momentum=0.9000_2023-04-13_07-57-42/data
[2m[36m(train_cifar pid=21616)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=21616)[0m Finished Training
[2m[36m(train_cifar pid=21616)[0m Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_f6e5aa1b_30_learning_rate=0.0072,momentum=0.9000_2023-04-13_07-58-43/data/cifar-10-python.tar.gz


[2m[36m(train_cifar pid=21616)[0m   0%|          | 0/170498071 [00:00<?, ?it/s]
  0%|          | 65536/170498071 [00:00<07:57, 356984.29it/s]
  0%|          | 131072/170498071 [00:00<05:49, 487231.92it/s]
  0%|          | 294912/170498071 [00:00<03:05, 918434.90it/s]
  0%|          | 688128/170498071 [00:00<01:26, 1962097.95it/s]
  1%|          | 1441792/170498071 [00:00<00:44, 3802597.19it/s]
  2%|▏         | 3080192/170498071 [00:00<00:21, 7793552.33it/s]
  3%|▎         | 5505024/170498071 [00:00<00:12, 12871192.89it/s]
  5%|▍         | 8454144/170498071 [00:00<00:09, 17952125.94it/s]
  7%|▋         | 11436032/170498071 [00:00<00:07, 21522984.71it/s]
  9%|▊         | 14778368/170498071 [00:01<00:06, 25122699.26it/s]
 11%|█         | 18251776/170498071 [00:01<00:05, 28009697.42it/s]
 13%|█▎        | 21659648/170498071 [00:01<00:04, 29791662.16it/s]
 15%|█▍        | 25001984/170498071 [00:01<00:04, 29462656.04it/s]
 17%|█▋        | 28311552/170498071 [00:01<00:04, 30092921.35it/s]


[2m[36m(train_cifar pid=21616)[0m Extracting /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_f6e5aa1b_30_learning_rate=0.0072,momentum=0.9000_2023-04-13_07-58-43/data/cifar-10-python.tar.gz to /root/ray_results/train_cifar_2023-04-13_07-29-08/train_cifar_f6e5aa1b_30_learning_rate=0.0072,momentum=0.9000_2023-04-13_07-58-43/data
[2m[36m(train_cifar pid=21616)[0m Files already downloaded and verified
[2m[36m(train_cifar pid=21616)[0m Finished Training


2023-04-13 07:59:43,849	INFO tune.py:798 -- Total run time: 1835.51 seconds (1835.47 seconds for the tuning loop).


Best trial config: {'learning_rate': 0.007197361830645431, 'momentum': 0.9}
Best trial final validation loss: 0.886002612341741
Best trial final validation accuracy: 0.7669
Files already downloaded and verified
Files already downloaded and verified
Best trial test set accuracy: 0.7372


In [50]:
final_df = results_df.drop(
    columns=[
        "should_checkpoint",
        "timesteps_total",
        "episodes_total",
        "training_iteration",
        "trial_id",
        "experiment_id",
        "date",
        "timestamp",
        "pid",
        "hostname",
        "node_ip",
        "time_since_restore",
        "timesteps_since_restore",
        "iterations_since_restore",
        "warmup_time",
        "logdir",
    ]
)
final_df.sort_values(by=['accuracy'], ascending=False).head(10)

Unnamed: 0,loss,accuracy,time_this_iter_s,done,time_total_s,config/learning_rate,config/momentum
19,0.665818,0.7707,4.944207,False,34.603192,0.015221,0.9
17,0.70911,0.7676,5.068652,False,44.615632,0.037195,0.1
29,0.886003,0.7669,5.039817,False,59.404519,0.007197,0.9
20,0.761133,0.7665,4.855726,False,49.241999,0.015193,0.9
7,0.755334,0.7661,4.920707,False,57.501354,0.025539,0.210218
16,0.688952,0.7656,4.912491,False,40.131042,0.037067,0.1
28,0.874712,0.7654,5.123604,False,60.627084,0.007662,0.9
22,0.725938,0.7652,4.895066,False,50.017725,0.050633,0.1
1,0.729516,0.7645,4.839552,False,44.469491,0.02821,0.338465
25,0.732522,0.7641,4.961905,False,44.074652,0.022682,0.9


In [51]:
final_df.sort_values(by=['accuracy']).head(10)

Unnamed: 0,loss,accuracy,time_this_iter_s,done,time_total_s,config/learning_rate,config/momentum
9,,0.0986,14.474193,False,14.474193,0.096245,0.455211
8,,0.1003,16.165922,False,16.165922,0.073345,0.759311
3,,0.1011,16.965347,False,16.965347,0.086741,0.624554
27,0.98104,0.6613,4.987771,False,61.627751,0.001,0.1
26,0.957105,0.6661,4.891266,False,73.453667,0.001,0.1
6,0.768737,0.7405,4.977035,False,44.075492,0.008259,0.119263
18,0.76854,0.7448,4.935539,False,59.00382,0.037597,0.9
12,0.859787,0.7461,4.955603,False,61.418235,0.001,0.9
11,0.766995,0.7497,5.116255,False,49.201387,0.047927,0.756176
14,0.745935,0.7569,4.99767,False,52.042447,0.019149,0.1
